Johnblick187 committed on
Commit
55c313a
·
verified ·
1 Parent(s): 1997d68

Update modeling_smartcoder_moe.py

Browse files
Files changed (1) hide show
  1. modeling_smartcoder_moe.py +2 -0
modeling_smartcoder_moe.py CHANGED
@@ -35,6 +35,7 @@ class SmartCoderMoEConfig(PretrainedConfig):
35
  dense_intermediate_size=8192,
36
  num_experts=32,
37
  expert_dim=512,
 
38
  num_experts_per_tok=2,
39
  max_position_embeddings=16384,
40
  rope_theta=10000.0,
@@ -54,6 +55,7 @@ class SmartCoderMoEConfig(PretrainedConfig):
54
  self.dense_intermediate_size = dense_intermediate_size
55
  self.num_experts = num_experts
56
  self.expert_dim = expert_dim
 
57
  self.num_experts_per_tok = num_experts_per_tok
58
  self.max_position_embeddings = max_position_embeddings
59
  self.rope_theta = rope_theta
 
35
  dense_intermediate_size=8192,
36
  num_experts=32,
37
  expert_dim=512,
38
+ expert_intermediate_size=5120,
39
  num_experts_per_tok=2,
40
  max_position_embeddings=16384,
41
  rope_theta=10000.0,
 
55
  self.dense_intermediate_size = dense_intermediate_size
56
  self.num_experts = num_experts
57
  self.expert_dim = expert_dim
58
+ self.expert_intermediate_size = expert_intermediate_size
59
  self.num_experts_per_tok = num_experts_per_tok
60
  self.max_position_embeddings = max_position_embeddings
61
  self.rope_theta = rope_theta