rfi-irfos committed on
Commit
5e7de7f
·
verified ·
1 Parent(s): 1a8e318

update: num_hidden_layers 21->22 (S10 complete)

Browse files
Files changed (1) hide show
  1. config.json +2 -2
config.json CHANGED
@@ -2,7 +2,7 @@
2
  "architectures": ["AlbertMoE"],
3
  "model_type": "albert-moe",
4
  "hidden_size": 256,
5
- "num_hidden_layers": 21,
6
  "num_attention_heads": 4,
7
  "num_experts": 12,
8
  "num_experts_per_tok": 3,
@@ -17,6 +17,6 @@
17
  "training_framework": "candle",
18
  "training_language": "rust",
19
  "max_seq_len": 256,
20
- "num_layers": 21,
21
  "num_heads": 4
22
  }
 
2
  "architectures": ["AlbertMoE"],
3
  "model_type": "albert-moe",
4
  "hidden_size": 256,
5
+ "num_hidden_layers": 22,
6
  "num_attention_heads": 4,
7
  "num_experts": 12,
8
  "num_experts_per_tok": 3,
 
17
  "training_framework": "candle",
18
  "training_language": "rust",
19
  "max_seq_len": 256,
20
+ "num_layers": 22,
21
  "num_heads": 4
22
  }