fix: correct model architecture in config.json (from actual weights inspection)

Files changed (1)

config.json CHANGED

@@ -1,28 +1,31 @@
 {
-  "model_type": "hydra-bitnet",
-  "architectures": ["HydraBitNetForSequenceClassification"],
-  "vocab_size": 256,
-  "hidden_size": 256,
-  "num_hidden_layers": 6,
   "num_experts": 4,
   "top_k_experts": 2,
-  "intermediate_size": 512,
-  "max_position_embeddings": 512,
   "torch_dtype": "float32",
-  "bitnet_config": {
-    "quantization": "ternary",
-    "weight_bits": 2,
-    "weight_values": [-1, 0, 1],
-    "activation_bits": 8
-  },
   "task_heads": {
     "compression": {
       "num_labels": 4,
-      "labels": ["NONE", "BPE", "BROTLI", "ZLIB"]
     },
     "security": {
       "num_labels": 2,
-      "labels": ["SAFE", "UNSAFE"]
     }
-  }
-}

 {
+  "model_type": "hydra-moe",
+  "architectures": [
+    "HydraMoEForSequenceClassification"
+  ],
+  "vocab_size": 32000,
+  "hidden_size": 192,
+  "num_hidden_layers": 4,
   "num_experts": 4,
   "top_k_experts": 2,
   "torch_dtype": "float32",
   "task_heads": {
     "compression": {
       "num_labels": 4,
+      "labels": [
+        "NONE",
+        "BPE",
+        "BROTLI",
+        "ZLIB"
+      ]
     },
     "security": {
       "num_labels": 2,
+      "labels": [
+        "SAFE",
+        "UNSAFE"
+      ]
     }
+  },
+  "_note": "Architecture derived from actual model.safetensors inspection"
+}