icxcn committed on
Commit
3afe319
·
verified ·
1 Parent(s): f557352

fix: correct model architecture in config.json (from actual weights inspection)

Browse files
Files changed (1) hide show
  1. config.json +20 -17
config.json CHANGED
@@ -1,28 +1,31 @@
1
  {
2
- "model_type": "hydra-bitnet",
3
- "architectures": ["HydraBitNetForSequenceClassification"],
4
- "vocab_size": 256,
5
- "hidden_size": 256,
6
- "num_hidden_layers": 6,
 
 
7
  "num_experts": 4,
8
  "top_k_experts": 2,
9
- "intermediate_size": 512,
10
- "max_position_embeddings": 512,
11
  "torch_dtype": "float32",
12
- "bitnet_config": {
13
- "quantization": "ternary",
14
- "weight_bits": 2,
15
- "weight_values": [-1, 0, 1],
16
- "activation_bits": 8
17
- },
18
  "task_heads": {
19
  "compression": {
20
  "num_labels": 4,
21
- "labels": ["NONE", "BPE", "BROTLI", "ZLIB"]
 
 
 
 
 
22
  },
23
  "security": {
24
  "num_labels": 2,
25
- "labels": ["SAFE", "UNSAFE"]
 
 
 
26
  }
27
- }
28
- }
 
 
1
  {
2
+ "model_type": "hydra-moe",
3
+ "architectures": [
4
+ "HydraMoEForSequenceClassification"
5
+ ],
6
+ "vocab_size": 32000,
7
+ "hidden_size": 192,
8
+ "num_hidden_layers": 4,
9
  "num_experts": 4,
10
  "top_k_experts": 2,
 
 
11
  "torch_dtype": "float32",
 
 
 
 
 
 
12
  "task_heads": {
13
  "compression": {
14
  "num_labels": 4,
15
+ "labels": [
16
+ "NONE",
17
+ "BPE",
18
+ "BROTLI",
19
+ "ZLIB"
20
+ ]
21
  },
22
  "security": {
23
  "num_labels": 2,
24
+ "labels": [
25
+ "SAFE",
26
+ "UNSAFE"
27
+ ]
28
  }
29
+ },
30
+ "_note": "Architecture derived from actual model.safetensors inspection"
31
+ }