Johnblick187 committed on
Commit
c8a1ec0
·
verified ·
1 Parent(s): 55c313a

Update modeling_smartcoder_moe.py

Browse files
Files changed (1) hide show
  1. modeling_smartcoder_moe.py +1 -3
modeling_smartcoder_moe.py CHANGED
@@ -34,8 +34,7 @@ class SmartCoderMoEConfig(PretrainedConfig):
34
  num_key_value_heads=4,
35
  dense_intermediate_size=8192,
36
  num_experts=32,
37
- expert_dim=512,
38
- expert_intermediate_size=5120,
39
  num_experts_per_tok=2,
40
  max_position_embeddings=16384,
41
  rope_theta=10000.0,
@@ -54,7 +53,6 @@ class SmartCoderMoEConfig(PretrainedConfig):
54
  self.head_dim = hidden_size // num_attention_heads
55
  self.dense_intermediate_size = dense_intermediate_size
56
  self.num_experts = num_experts
57
- self.expert_dim = expert_dim
58
  self.expert_intermediate_size = expert_intermediate_size
59
  self.num_experts_per_tok = num_experts_per_tok
60
  self.max_position_embeddings = max_position_embeddings
 
34
  num_key_value_heads=4,
35
  dense_intermediate_size=8192,
36
  num_experts=32,
37
+ expert_intermediate_size=512,
 
38
  num_experts_per_tok=2,
39
  max_position_embeddings=16384,
40
  rope_theta=10000.0,
 
53
  self.head_dim = hidden_size // num_attention_heads
54
  self.dense_intermediate_size = dense_intermediate_size
55
  self.num_experts = num_experts
 
56
  self.expert_intermediate_size = expert_intermediate_size
57
  self.num_experts_per_tok = num_experts_per_tok
58
  self.max_position_embeddings = max_position_embeddings