yunconglong
/

7Bx4_DPO_2e

Text Generation

text-generation-inference

Model card Files and versions

yunconglong committed on Jan 20, 2024

Commit

1c0343c

·

verified ·

1 Parent(s): 013457e

Update config.json

Files changed (1) hide show

config.json +2 -2

config.json CHANGED Viewed

@@ -13,10 +13,10 @@
   "max_position_embeddings": 32768,
   "model_type": "mixtral",
   "num_attention_heads": 32,
-  "num_experts_per_tok": 4,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
-  "num_local_experts": 2,
   "output_router_logits": false,
   "rms_norm_eps": 1e-05,
   "rope_theta": 10000.0,

   "max_position_embeddings": 32768,
   "model_type": "mixtral",
   "num_attention_heads": 32,
+  "num_experts_per_tok": 2,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
+  "num_local_experts": 4,
   "output_router_logits": false,
   "rms_norm_eps": 1e-05,
   "rope_theta": 10000.0,