Umair Imam committed on
Commit
fae5cb1
·
1 Parent(s): 395587c

Update config to match original: 262K context, rope_theta 10M

Browse files
Files changed (1) hide show
  1. config.json +2 -2
config.json CHANGED
@@ -14,7 +14,7 @@
14
  "hidden_size": 2048,
15
  "initializer_range": 0.02,
16
  "intermediate_size": 6144,
17
- "max_position_embeddings": 40960,
18
  "max_window_layers": 48,
19
  "mlp_only_layers": [],
20
  "model_type": "qwen3_moe",
@@ -28,7 +28,7 @@
28
  "output_router_logits": false,
29
  "rms_norm_eps": 1e-06,
30
  "rope_scaling": null,
31
- "rope_theta": 1000000.0,
32
  "router_aux_loss_coef": 0.001,
33
  "sliding_window": null,
34
  "tie_word_embeddings": false,
 
14
  "hidden_size": 2048,
15
  "initializer_range": 0.02,
16
  "intermediate_size": 6144,
17
+ "max_position_embeddings": 262144,
18
  "max_window_layers": 48,
19
  "mlp_only_layers": [],
20
  "model_type": "qwen3_moe",
 
28
  "output_router_logits": false,
29
  "rms_norm_eps": 1e-06,
30
  "rope_scaling": null,
31
+ "rope_theta": 10000000,
32
  "router_aux_loss_coef": 0.001,
33
  "sliding_window": null,
34
  "tie_word_embeddings": false,