Re-upload config.json via AutoConfig (transformers 5.5)

#2
Opened by echarlaix (HF Staff)
Files changed (1)
  1. config.json +6 -4
config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_name_or_path": "microsoft/Phi-3.5-MoE-instruct",
3
  "architectures": [
4
  "PhiMoEForCausalLM"
5
  ],
@@ -10,6 +9,7 @@
10
  "AutoModelForCausalLM": "modeling_phimoe.PhiMoEForCausalLM"
11
  },
12
  "bos_token_id": 1,
 
13
  "eos_token_id": 32000,
14
  "hidden_act": "silu",
15
  "hidden_dropout": 0.0,
@@ -27,14 +27,17 @@
27
  "num_local_experts": 16,
28
  "original_max_position_embeddings": 4096,
29
  "output_router_logits": false,
 
30
  "rms_norm_eps": 1e-05,
31
- "rope_scaling": {
32
  "long_factor": [
33
  1.0299,
34
  1.0499
35
  ],
36
  "long_mscale": 1.243163121016122,
37
  "original_max_position_embeddings": 4096,
 
 
38
  "short_factor": [
39
  1.05,
40
  1.05
@@ -47,8 +50,7 @@
47
  "router_jitter_noise": 0.01,
48
  "sliding_window": 131072,
49
  "tie_word_embeddings": false,
50
- "torch_dtype": "bfloat16",
51
- "transformers_version": "4.44.0",
52
  "use_cache": true,
53
  "vocab_size": 32064
54
  }
 
1
  {
 
2
  "architectures": [
3
  "PhiMoEForCausalLM"
4
  ],
 
9
  "AutoModelForCausalLM": "modeling_phimoe.PhiMoEForCausalLM"
10
  },
11
  "bos_token_id": 1,
12
+ "dtype": "bfloat16",
13
  "eos_token_id": 32000,
14
  "hidden_act": "silu",
15
  "hidden_dropout": 0.0,
 
27
  "num_local_experts": 16,
28
  "original_max_position_embeddings": 4096,
29
  "output_router_logits": false,
30
+ "pad_token_id": null,
31
  "rms_norm_eps": 1e-05,
32
+ "rope_parameters": {
33
  "long_factor": [
34
  1.0299,
35
  1.0499
36
  ],
37
  "long_mscale": 1.243163121016122,
38
  "original_max_position_embeddings": 4096,
39
+ "rope_theta": 10000.0,
40
+ "rope_type": "longrope",
41
  "short_factor": [
42
  1.05,
43
  1.05
 
50
  "router_jitter_noise": 0.01,
51
  "sliding_window": 131072,
52
  "tie_word_embeddings": false,
53
+ "transformers_version": "5.5.0",
 
54
  "use_cache": true,
55
  "vocab_size": 32064
56
  }