katuni4ka committed on
Commit
b680504
·
verified ·
1 Parent(s): d8419e7

Update configuration_mistral4.py

Browse files
Files changed (1) hide show
  1. configuration_mistral4.py +1 -21
configuration_mistral4.py CHANGED
@@ -99,7 +99,7 @@ class Mistral4Config(PretrainedConfig):
99
  self.qk_rope_head_dim = qk_rope_head_dim
100
  self.v_head_dim = v_head_dim
101
  self.qk_nope_head_dim = qk_nope_head_dim
102
- self.qk_head_dim = qk_nope_head_dim + qk_nope_head_dim
103
  self.n_group = n_group
104
  self.topk_group = topk_group
105
  self.num_experts_per_tok = num_experts_per_tok
@@ -139,25 +139,5 @@ class Mistral4Config(PretrainedConfig):
139
  self.attention_dropout = attention_dropout
140
  self.tie_word_embeddings = tie_word_embeddings
141
 
142
-
143
-
144
-
145
-
146
-
147
-
148
-
149
-
150
-
151
-
152
-
153
-
154
-
155
-
156
-
157
-
158
-
159
-
160
-
161
-
162
 
163
  __all__ = ["Mistral4Config"]
 
99
  self.qk_rope_head_dim = qk_rope_head_dim
100
  self.v_head_dim = v_head_dim
101
  self.qk_nope_head_dim = qk_nope_head_dim
102
+ self.qk_head_dim = qk_nope_head_dim + qk_rope_head_dim
103
  self.n_group = n_group
104
  self.topk_group = topk_group
105
  self.num_experts_per_tok = num_experts_per_tok
 
139
  self.attention_dropout = attention_dropout
140
  self.tie_word_embeddings = tie_word_embeddings
141
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
142
 
143
  __all__ = ["Mistral4Config"]