brady777 committed on
Commit
5922642
·
verified ·
1 Parent(s): 51f245d

restore Qwen3ForCausalLM architecture (HF supports it natively)

Browse files
Files changed (1) hide show
  1. config.json +2 -2
config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "architectures": [
3
- "Qwen2ForCausalLM"
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
@@ -13,7 +13,7 @@
13
  "initializer_range": 0.02,
14
  "intermediate_size": 12288,
15
  "max_position_embeddings": 40960,
16
- "model_type": "qwen2",
17
  "num_attention_heads": 32,
18
  "num_hidden_layers": 36,
19
  "num_key_value_heads": 8,
 
1
  {
2
  "architectures": [
3
+ "Qwen3ForCausalLM"
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
 
13
  "initializer_range": 0.02,
14
  "intermediate_size": 12288,
15
  "max_position_embeddings": 40960,
16
+ "model_type": "qwen3",
17
  "num_attention_heads": 32,
18
  "num_hidden_layers": 36,
19
  "num_key_value_heads": 8,