update: num_hidden_layers and num_layers 21->22 (S10 complete)

Files changed (1)

config.json CHANGED

@@ -2,7 +2,7 @@
   "architectures": ["AlbertMoE"],
   "model_type": "albert-moe",
   "hidden_size": 256,
-  "num_hidden_layers": 21,
   "num_attention_heads": 4,
   "num_experts": 12,
   "num_experts_per_tok": 3,
@@ -17,6 +17,6 @@
   "training_framework": "candle",
   "training_language": "rust",
   "max_seq_len": 256,
-  "num_layers": 21,
   "num_heads": 4
 }

   "architectures": ["AlbertMoE"],
   "model_type": "albert-moe",
   "hidden_size": 256,
+  "num_hidden_layers": 22,
   "num_attention_heads": 4,
   "num_experts": 12,
   "num_experts_per_tok": 3,
   "training_framework": "candle",
   "training_language": "rust",
   "max_seq_len": 256,
+  "num_layers": 22,
   "num_heads": 4
 }