Upload model quantized shared_experts

#5
This view is limited to 50 files because it contains too many changes. See the raw diff here.
Files changed (50) hide show
  1. chat_template.jinja +3 -4
  2. config.json +369 -7
  3. model-00010-of-00527.safetensors +2 -2
  4. model-00019-of-00527.safetensors +2 -2
  5. model-00027-of-00527.safetensors +2 -2
  6. model-00036-of-00527.safetensors +2 -2
  7. model-00045-of-00527.safetensors +2 -2
  8. model-00054-of-00527.safetensors +2 -2
  9. model-00062-of-00527.safetensors +2 -2
  10. model-00071-of-00527.safetensors +2 -2
  11. model-00080-of-00527.safetensors +2 -2
  12. model-00089-of-00527.safetensors +2 -2
  13. model-00097-of-00527.safetensors +2 -2
  14. model-00106-of-00527.safetensors +2 -2
  15. model-00115-of-00527.safetensors +2 -2
  16. model-00124-of-00527.safetensors +2 -2
  17. model-00132-of-00527.safetensors +2 -2
  18. model-00141-of-00527.safetensors +2 -2
  19. model-00150-of-00527.safetensors +2 -2
  20. model-00159-of-00527.safetensors +2 -2
  21. model-00167-of-00527.safetensors +2 -2
  22. model-00176-of-00527.safetensors +2 -2
  23. model-00185-of-00527.safetensors +2 -2
  24. model-00194-of-00527.safetensors +2 -2
  25. model-00202-of-00527.safetensors +2 -2
  26. model-00211-of-00527.safetensors +2 -2
  27. model-00220-of-00527.safetensors +2 -2
  28. model-00229-of-00527.safetensors +2 -2
  29. model-00237-of-00527.safetensors +2 -2
  30. model-00246-of-00527.safetensors +2 -2
  31. model-00255-of-00527.safetensors +2 -2
  32. model-00264-of-00527.safetensors +2 -2
  33. model-00272-of-00527.safetensors +2 -2
  34. model-00281-of-00527.safetensors +2 -2
  35. model-00290-of-00527.safetensors +2 -2
  36. model-00299-of-00527.safetensors +2 -2
  37. model-00307-of-00527.safetensors +2 -2
  38. model-00316-of-00527.safetensors +2 -2
  39. model-00325-of-00527.safetensors +2 -2
  40. model-00334-of-00527.safetensors +2 -2
  41. model-00342-of-00527.safetensors +2 -2
  42. model-00351-of-00527.safetensors +2 -2
  43. model-00360-of-00527.safetensors +2 -2
  44. model-00369-of-00527.safetensors +2 -2
  45. model-00377-of-00527.safetensors +2 -2
  46. model-00386-of-00527.safetensors +2 -2
  47. model-00395-of-00527.safetensors +2 -2
  48. model-00404-of-00527.safetensors +2 -2
  49. model-00412-of-00527.safetensors +2 -2
  50. model-00421-of-00527.safetensors +2 -2
chat_template.jinja CHANGED
@@ -52,11 +52,10 @@
52
  <|im_system|>tool_declare<|im_middle|>{{ tools | tojson(separators=(',', ':')) }}<|im_end|>
53
  {%- endif -%}
54
 
55
- {%- if messages|length == 0 or messages[0]['role'] != 'system' -%}
56
- <|im_system|>system<|im_middle|>You are Kimi, an AI assistant created by Moonshot AI.<|im_end|>
57
- {%- endif -%}
58
-
59
  {%- for message in hist_msgs -%}
 
 
 
60
  {{set_roles(message)}}
61
  {%- if message['role'] == 'assistant' -%}
62
  <think></think>{{render_content(message)}}
 
52
  <|im_system|>tool_declare<|im_middle|>{{ tools | tojson(separators=(',', ':')) }}<|im_end|>
53
  {%- endif -%}
54
 
 
 
 
 
55
  {%- for message in hist_msgs -%}
56
+ {%- if loop.first and messages[0]['role'] != 'system' -%}
57
+ <|im_system|>system<|im_middle|>You are Kimi, an AI assistant created by Moonshot AI.<|im_end|>
58
+ {%- endif -%}
59
  {{set_roles(message)}}
60
  {%- if message['role'] == 'assistant' -%}
61
  <think></think>{{render_content(message)}}
config.json CHANGED
@@ -97,13 +97,375 @@
97
  "target_device": null
98
  },
99
  "exclude": [
100
- "re:model.layers.*self_attn.*",
101
- "re:model.layers.*mlp.gate",
102
  "lm_head",
103
- "re:model.layers.*mlp.gate_proj",
104
- "re:model.layers.*mlp.up_proj",
105
- "re:model.layers.*mlp.down_proj",
106
- "re:model.layers.*shared_experts.*"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
107
  ],
108
  "algo_config": null,
109
  "softmax_quant_spec": null,
@@ -113,7 +475,7 @@
113
  "kv_cache_quant_config": {},
114
  "kv_cache_post_rope": false,
115
  "quant_mode": "eager_mode",
116
- "version": "0.12+15553c6a61",
117
  "export": {
118
  "kv_cache_group": [],
119
  "min_kv_scale": 0.0,
 
97
  "target_device": null
98
  },
99
  "exclude": [
 
 
100
  "lm_head",
101
+ "model.layers.0.mlp.down_proj",
102
+ "model.layers.0.mlp.gate_proj",
103
+ "model.layers.0.mlp.up_proj",
104
+ "model.layers.0.self_attn.kv_a_proj_with_mqa",
105
+ "model.layers.0.self_attn.kv_b_proj",
106
+ "model.layers.0.self_attn.o_proj",
107
+ "model.layers.0.self_attn.q_a_proj",
108
+ "model.layers.0.self_attn.q_b_proj",
109
+ "model.layers.1.mlp.gate",
110
+ "model.layers.1.self_attn.kv_a_proj_with_mqa",
111
+ "model.layers.1.self_attn.kv_b_proj",
112
+ "model.layers.1.self_attn.o_proj",
113
+ "model.layers.1.self_attn.q_a_proj",
114
+ "model.layers.1.self_attn.q_b_proj",
115
+ "model.layers.10.mlp.gate",
116
+ "model.layers.10.self_attn.kv_a_proj_with_mqa",
117
+ "model.layers.10.self_attn.kv_b_proj",
118
+ "model.layers.10.self_attn.o_proj",
119
+ "model.layers.10.self_attn.q_a_proj",
120
+ "model.layers.10.self_attn.q_b_proj",
121
+ "model.layers.11.mlp.gate",
122
+ "model.layers.11.self_attn.kv_a_proj_with_mqa",
123
+ "model.layers.11.self_attn.kv_b_proj",
124
+ "model.layers.11.self_attn.o_proj",
125
+ "model.layers.11.self_attn.q_a_proj",
126
+ "model.layers.11.self_attn.q_b_proj",
127
+ "model.layers.12.mlp.gate",
128
+ "model.layers.12.self_attn.kv_a_proj_with_mqa",
129
+ "model.layers.12.self_attn.kv_b_proj",
130
+ "model.layers.12.self_attn.o_proj",
131
+ "model.layers.12.self_attn.q_a_proj",
132
+ "model.layers.12.self_attn.q_b_proj",
133
+ "model.layers.13.mlp.gate",
134
+ "model.layers.13.self_attn.kv_a_proj_with_mqa",
135
+ "model.layers.13.self_attn.kv_b_proj",
136
+ "model.layers.13.self_attn.o_proj",
137
+ "model.layers.13.self_attn.q_a_proj",
138
+ "model.layers.13.self_attn.q_b_proj",
139
+ "model.layers.14.mlp.gate",
140
+ "model.layers.14.self_attn.kv_a_proj_with_mqa",
141
+ "model.layers.14.self_attn.kv_b_proj",
142
+ "model.layers.14.self_attn.o_proj",
143
+ "model.layers.14.self_attn.q_a_proj",
144
+ "model.layers.14.self_attn.q_b_proj",
145
+ "model.layers.15.mlp.gate",
146
+ "model.layers.15.self_attn.kv_a_proj_with_mqa",
147
+ "model.layers.15.self_attn.kv_b_proj",
148
+ "model.layers.15.self_attn.o_proj",
149
+ "model.layers.15.self_attn.q_a_proj",
150
+ "model.layers.15.self_attn.q_b_proj",
151
+ "model.layers.16.mlp.gate",
152
+ "model.layers.16.self_attn.kv_a_proj_with_mqa",
153
+ "model.layers.16.self_attn.kv_b_proj",
154
+ "model.layers.16.self_attn.o_proj",
155
+ "model.layers.16.self_attn.q_a_proj",
156
+ "model.layers.16.self_attn.q_b_proj",
157
+ "model.layers.17.mlp.gate",
158
+ "model.layers.17.self_attn.kv_a_proj_with_mqa",
159
+ "model.layers.17.self_attn.kv_b_proj",
160
+ "model.layers.17.self_attn.o_proj",
161
+ "model.layers.17.self_attn.q_a_proj",
162
+ "model.layers.17.self_attn.q_b_proj",
163
+ "model.layers.18.mlp.gate",
164
+ "model.layers.18.self_attn.kv_a_proj_with_mqa",
165
+ "model.layers.18.self_attn.kv_b_proj",
166
+ "model.layers.18.self_attn.o_proj",
167
+ "model.layers.18.self_attn.q_a_proj",
168
+ "model.layers.18.self_attn.q_b_proj",
169
+ "model.layers.19.mlp.gate",
170
+ "model.layers.19.self_attn.kv_a_proj_with_mqa",
171
+ "model.layers.19.self_attn.kv_b_proj",
172
+ "model.layers.19.self_attn.o_proj",
173
+ "model.layers.19.self_attn.q_a_proj",
174
+ "model.layers.19.self_attn.q_b_proj",
175
+ "model.layers.2.mlp.gate",
176
+ "model.layers.2.self_attn.kv_a_proj_with_mqa",
177
+ "model.layers.2.self_attn.kv_b_proj",
178
+ "model.layers.2.self_attn.o_proj",
179
+ "model.layers.2.self_attn.q_a_proj",
180
+ "model.layers.2.self_attn.q_b_proj",
181
+ "model.layers.20.mlp.gate",
182
+ "model.layers.20.self_attn.kv_a_proj_with_mqa",
183
+ "model.layers.20.self_attn.kv_b_proj",
184
+ "model.layers.20.self_attn.o_proj",
185
+ "model.layers.20.self_attn.q_a_proj",
186
+ "model.layers.20.self_attn.q_b_proj",
187
+ "model.layers.21.mlp.gate",
188
+ "model.layers.21.self_attn.kv_a_proj_with_mqa",
189
+ "model.layers.21.self_attn.kv_b_proj",
190
+ "model.layers.21.self_attn.o_proj",
191
+ "model.layers.21.self_attn.q_a_proj",
192
+ "model.layers.21.self_attn.q_b_proj",
193
+ "model.layers.22.mlp.gate",
194
+ "model.layers.22.self_attn.kv_a_proj_with_mqa",
195
+ "model.layers.22.self_attn.kv_b_proj",
196
+ "model.layers.22.self_attn.o_proj",
197
+ "model.layers.22.self_attn.q_a_proj",
198
+ "model.layers.22.self_attn.q_b_proj",
199
+ "model.layers.23.mlp.gate",
200
+ "model.layers.23.self_attn.kv_a_proj_with_mqa",
201
+ "model.layers.23.self_attn.kv_b_proj",
202
+ "model.layers.23.self_attn.o_proj",
203
+ "model.layers.23.self_attn.q_a_proj",
204
+ "model.layers.23.self_attn.q_b_proj",
205
+ "model.layers.24.mlp.gate",
206
+ "model.layers.24.self_attn.kv_a_proj_with_mqa",
207
+ "model.layers.24.self_attn.kv_b_proj",
208
+ "model.layers.24.self_attn.o_proj",
209
+ "model.layers.24.self_attn.q_a_proj",
210
+ "model.layers.24.self_attn.q_b_proj",
211
+ "model.layers.25.mlp.gate",
212
+ "model.layers.25.self_attn.kv_a_proj_with_mqa",
213
+ "model.layers.25.self_attn.kv_b_proj",
214
+ "model.layers.25.self_attn.o_proj",
215
+ "model.layers.25.self_attn.q_a_proj",
216
+ "model.layers.25.self_attn.q_b_proj",
217
+ "model.layers.26.mlp.gate",
218
+ "model.layers.26.self_attn.kv_a_proj_with_mqa",
219
+ "model.layers.26.self_attn.kv_b_proj",
220
+ "model.layers.26.self_attn.o_proj",
221
+ "model.layers.26.self_attn.q_a_proj",
222
+ "model.layers.26.self_attn.q_b_proj",
223
+ "model.layers.27.mlp.gate",
224
+ "model.layers.27.self_attn.kv_a_proj_with_mqa",
225
+ "model.layers.27.self_attn.kv_b_proj",
226
+ "model.layers.27.self_attn.o_proj",
227
+ "model.layers.27.self_attn.q_a_proj",
228
+ "model.layers.27.self_attn.q_b_proj",
229
+ "model.layers.28.mlp.gate",
230
+ "model.layers.28.self_attn.kv_a_proj_with_mqa",
231
+ "model.layers.28.self_attn.kv_b_proj",
232
+ "model.layers.28.self_attn.o_proj",
233
+ "model.layers.28.self_attn.q_a_proj",
234
+ "model.layers.28.self_attn.q_b_proj",
235
+ "model.layers.29.mlp.gate",
236
+ "model.layers.29.self_attn.kv_a_proj_with_mqa",
237
+ "model.layers.29.self_attn.kv_b_proj",
238
+ "model.layers.29.self_attn.o_proj",
239
+ "model.layers.29.self_attn.q_a_proj",
240
+ "model.layers.29.self_attn.q_b_proj",
241
+ "model.layers.3.mlp.gate",
242
+ "model.layers.3.self_attn.kv_a_proj_with_mqa",
243
+ "model.layers.3.self_attn.kv_b_proj",
244
+ "model.layers.3.self_attn.o_proj",
245
+ "model.layers.3.self_attn.q_a_proj",
246
+ "model.layers.3.self_attn.q_b_proj",
247
+ "model.layers.30.mlp.gate",
248
+ "model.layers.30.self_attn.kv_a_proj_with_mqa",
249
+ "model.layers.30.self_attn.kv_b_proj",
250
+ "model.layers.30.self_attn.o_proj",
251
+ "model.layers.30.self_attn.q_a_proj",
252
+ "model.layers.30.self_attn.q_b_proj",
253
+ "model.layers.31.mlp.gate",
254
+ "model.layers.31.self_attn.kv_a_proj_with_mqa",
255
+ "model.layers.31.self_attn.kv_b_proj",
256
+ "model.layers.31.self_attn.o_proj",
257
+ "model.layers.31.self_attn.q_a_proj",
258
+ "model.layers.31.self_attn.q_b_proj",
259
+ "model.layers.32.mlp.gate",
260
+ "model.layers.32.self_attn.kv_a_proj_with_mqa",
261
+ "model.layers.32.self_attn.kv_b_proj",
262
+ "model.layers.32.self_attn.o_proj",
263
+ "model.layers.32.self_attn.q_a_proj",
264
+ "model.layers.32.self_attn.q_b_proj",
265
+ "model.layers.33.mlp.gate",
266
+ "model.layers.33.self_attn.kv_a_proj_with_mqa",
267
+ "model.layers.33.self_attn.kv_b_proj",
268
+ "model.layers.33.self_attn.o_proj",
269
+ "model.layers.33.self_attn.q_a_proj",
270
+ "model.layers.33.self_attn.q_b_proj",
271
+ "model.layers.34.mlp.gate",
272
+ "model.layers.34.self_attn.kv_a_proj_with_mqa",
273
+ "model.layers.34.self_attn.kv_b_proj",
274
+ "model.layers.34.self_attn.o_proj",
275
+ "model.layers.34.self_attn.q_a_proj",
276
+ "model.layers.34.self_attn.q_b_proj",
277
+ "model.layers.35.mlp.gate",
278
+ "model.layers.35.self_attn.kv_a_proj_with_mqa",
279
+ "model.layers.35.self_attn.kv_b_proj",
280
+ "model.layers.35.self_attn.o_proj",
281
+ "model.layers.35.self_attn.q_a_proj",
282
+ "model.layers.35.self_attn.q_b_proj",
283
+ "model.layers.36.mlp.gate",
284
+ "model.layers.36.self_attn.kv_a_proj_with_mqa",
285
+ "model.layers.36.self_attn.kv_b_proj",
286
+ "model.layers.36.self_attn.o_proj",
287
+ "model.layers.36.self_attn.q_a_proj",
288
+ "model.layers.36.self_attn.q_b_proj",
289
+ "model.layers.37.mlp.gate",
290
+ "model.layers.37.self_attn.kv_a_proj_with_mqa",
291
+ "model.layers.37.self_attn.kv_b_proj",
292
+ "model.layers.37.self_attn.o_proj",
293
+ "model.layers.37.self_attn.q_a_proj",
294
+ "model.layers.37.self_attn.q_b_proj",
295
+ "model.layers.38.mlp.gate",
296
+ "model.layers.38.self_attn.kv_a_proj_with_mqa",
297
+ "model.layers.38.self_attn.kv_b_proj",
298
+ "model.layers.38.self_attn.o_proj",
299
+ "model.layers.38.self_attn.q_a_proj",
300
+ "model.layers.38.self_attn.q_b_proj",
301
+ "model.layers.39.mlp.gate",
302
+ "model.layers.39.self_attn.kv_a_proj_with_mqa",
303
+ "model.layers.39.self_attn.kv_b_proj",
304
+ "model.layers.39.self_attn.o_proj",
305
+ "model.layers.39.self_attn.q_a_proj",
306
+ "model.layers.39.self_attn.q_b_proj",
307
+ "model.layers.4.mlp.gate",
308
+ "model.layers.4.self_attn.kv_a_proj_with_mqa",
309
+ "model.layers.4.self_attn.kv_b_proj",
310
+ "model.layers.4.self_attn.o_proj",
311
+ "model.layers.4.self_attn.q_a_proj",
312
+ "model.layers.4.self_attn.q_b_proj",
313
+ "model.layers.40.mlp.gate",
314
+ "model.layers.40.self_attn.kv_a_proj_with_mqa",
315
+ "model.layers.40.self_attn.kv_b_proj",
316
+ "model.layers.40.self_attn.o_proj",
317
+ "model.layers.40.self_attn.q_a_proj",
318
+ "model.layers.40.self_attn.q_b_proj",
319
+ "model.layers.41.mlp.gate",
320
+ "model.layers.41.self_attn.kv_a_proj_with_mqa",
321
+ "model.layers.41.self_attn.kv_b_proj",
322
+ "model.layers.41.self_attn.o_proj",
323
+ "model.layers.41.self_attn.q_a_proj",
324
+ "model.layers.41.self_attn.q_b_proj",
325
+ "model.layers.42.mlp.gate",
326
+ "model.layers.42.self_attn.kv_a_proj_with_mqa",
327
+ "model.layers.42.self_attn.kv_b_proj",
328
+ "model.layers.42.self_attn.o_proj",
329
+ "model.layers.42.self_attn.q_a_proj",
330
+ "model.layers.42.self_attn.q_b_proj",
331
+ "model.layers.43.mlp.gate",
332
+ "model.layers.43.self_attn.kv_a_proj_with_mqa",
333
+ "model.layers.43.self_attn.kv_b_proj",
334
+ "model.layers.43.self_attn.o_proj",
335
+ "model.layers.43.self_attn.q_a_proj",
336
+ "model.layers.43.self_attn.q_b_proj",
337
+ "model.layers.44.mlp.gate",
338
+ "model.layers.44.self_attn.kv_a_proj_with_mqa",
339
+ "model.layers.44.self_attn.kv_b_proj",
340
+ "model.layers.44.self_attn.o_proj",
341
+ "model.layers.44.self_attn.q_a_proj",
342
+ "model.layers.44.self_attn.q_b_proj",
343
+ "model.layers.45.mlp.gate",
344
+ "model.layers.45.self_attn.kv_a_proj_with_mqa",
345
+ "model.layers.45.self_attn.kv_b_proj",
346
+ "model.layers.45.self_attn.o_proj",
347
+ "model.layers.45.self_attn.q_a_proj",
348
+ "model.layers.45.self_attn.q_b_proj",
349
+ "model.layers.46.mlp.gate",
350
+ "model.layers.46.self_attn.kv_a_proj_with_mqa",
351
+ "model.layers.46.self_attn.kv_b_proj",
352
+ "model.layers.46.self_attn.o_proj",
353
+ "model.layers.46.self_attn.q_a_proj",
354
+ "model.layers.46.self_attn.q_b_proj",
355
+ "model.layers.47.mlp.gate",
356
+ "model.layers.47.self_attn.kv_a_proj_with_mqa",
357
+ "model.layers.47.self_attn.kv_b_proj",
358
+ "model.layers.47.self_attn.o_proj",
359
+ "model.layers.47.self_attn.q_a_proj",
360
+ "model.layers.47.self_attn.q_b_proj",
361
+ "model.layers.48.mlp.gate",
362
+ "model.layers.48.self_attn.kv_a_proj_with_mqa",
363
+ "model.layers.48.self_attn.kv_b_proj",
364
+ "model.layers.48.self_attn.o_proj",
365
+ "model.layers.48.self_attn.q_a_proj",
366
+ "model.layers.48.self_attn.q_b_proj",
367
+ "model.layers.49.mlp.gate",
368
+ "model.layers.49.self_attn.kv_a_proj_with_mqa",
369
+ "model.layers.49.self_attn.kv_b_proj",
370
+ "model.layers.49.self_attn.o_proj",
371
+ "model.layers.49.self_attn.q_a_proj",
372
+ "model.layers.49.self_attn.q_b_proj",
373
+ "model.layers.5.mlp.gate",
374
+ "model.layers.5.self_attn.kv_a_proj_with_mqa",
375
+ "model.layers.5.self_attn.kv_b_proj",
376
+ "model.layers.5.self_attn.o_proj",
377
+ "model.layers.5.self_attn.q_a_proj",
378
+ "model.layers.5.self_attn.q_b_proj",
379
+ "model.layers.50.mlp.gate",
380
+ "model.layers.50.self_attn.kv_a_proj_with_mqa",
381
+ "model.layers.50.self_attn.kv_b_proj",
382
+ "model.layers.50.self_attn.o_proj",
383
+ "model.layers.50.self_attn.q_a_proj",
384
+ "model.layers.50.self_attn.q_b_proj",
385
+ "model.layers.51.mlp.gate",
386
+ "model.layers.51.self_attn.kv_a_proj_with_mqa",
387
+ "model.layers.51.self_attn.kv_b_proj",
388
+ "model.layers.51.self_attn.o_proj",
389
+ "model.layers.51.self_attn.q_a_proj",
390
+ "model.layers.51.self_attn.q_b_proj",
391
+ "model.layers.52.mlp.gate",
392
+ "model.layers.52.self_attn.kv_a_proj_with_mqa",
393
+ "model.layers.52.self_attn.kv_b_proj",
394
+ "model.layers.52.self_attn.o_proj",
395
+ "model.layers.52.self_attn.q_a_proj",
396
+ "model.layers.52.self_attn.q_b_proj",
397
+ "model.layers.53.mlp.gate",
398
+ "model.layers.53.self_attn.kv_a_proj_with_mqa",
399
+ "model.layers.53.self_attn.kv_b_proj",
400
+ "model.layers.53.self_attn.o_proj",
401
+ "model.layers.53.self_attn.q_a_proj",
402
+ "model.layers.53.self_attn.q_b_proj",
403
+ "model.layers.54.mlp.gate",
404
+ "model.layers.54.self_attn.kv_a_proj_with_mqa",
405
+ "model.layers.54.self_attn.kv_b_proj",
406
+ "model.layers.54.self_attn.o_proj",
407
+ "model.layers.54.self_attn.q_a_proj",
408
+ "model.layers.54.self_attn.q_b_proj",
409
+ "model.layers.55.mlp.gate",
410
+ "model.layers.55.self_attn.kv_a_proj_with_mqa",
411
+ "model.layers.55.self_attn.kv_b_proj",
412
+ "model.layers.55.self_attn.o_proj",
413
+ "model.layers.55.self_attn.q_a_proj",
414
+ "model.layers.55.self_attn.q_b_proj",
415
+ "model.layers.56.mlp.gate",
416
+ "model.layers.56.self_attn.kv_a_proj_with_mqa",
417
+ "model.layers.56.self_attn.kv_b_proj",
418
+ "model.layers.56.self_attn.o_proj",
419
+ "model.layers.56.self_attn.q_a_proj",
420
+ "model.layers.56.self_attn.q_b_proj",
421
+ "model.layers.57.mlp.gate",
422
+ "model.layers.57.self_attn.kv_a_proj_with_mqa",
423
+ "model.layers.57.self_attn.kv_b_proj",
424
+ "model.layers.57.self_attn.o_proj",
425
+ "model.layers.57.self_attn.q_a_proj",
426
+ "model.layers.57.self_attn.q_b_proj",
427
+ "model.layers.58.mlp.gate",
428
+ "model.layers.58.self_attn.kv_a_proj_with_mqa",
429
+ "model.layers.58.self_attn.kv_b_proj",
430
+ "model.layers.58.self_attn.o_proj",
431
+ "model.layers.58.self_attn.q_a_proj",
432
+ "model.layers.58.self_attn.q_b_proj",
433
+ "model.layers.59.mlp.gate",
434
+ "model.layers.59.self_attn.kv_a_proj_with_mqa",
435
+ "model.layers.59.self_attn.kv_b_proj",
436
+ "model.layers.59.self_attn.o_proj",
437
+ "model.layers.59.self_attn.q_a_proj",
438
+ "model.layers.59.self_attn.q_b_proj",
439
+ "model.layers.6.mlp.gate",
440
+ "model.layers.6.self_attn.kv_a_proj_with_mqa",
441
+ "model.layers.6.self_attn.kv_b_proj",
442
+ "model.layers.6.self_attn.o_proj",
443
+ "model.layers.6.self_attn.q_a_proj",
444
+ "model.layers.6.self_attn.q_b_proj",
445
+ "model.layers.60.mlp.gate",
446
+ "model.layers.60.self_attn.kv_a_proj_with_mqa",
447
+ "model.layers.60.self_attn.kv_b_proj",
448
+ "model.layers.60.self_attn.o_proj",
449
+ "model.layers.60.self_attn.q_a_proj",
450
+ "model.layers.60.self_attn.q_b_proj",
451
+ "model.layers.7.mlp.gate",
452
+ "model.layers.7.self_attn.kv_a_proj_with_mqa",
453
+ "model.layers.7.self_attn.kv_b_proj",
454
+ "model.layers.7.self_attn.o_proj",
455
+ "model.layers.7.self_attn.q_a_proj",
456
+ "model.layers.7.self_attn.q_b_proj",
457
+ "model.layers.8.mlp.gate",
458
+ "model.layers.8.self_attn.kv_a_proj_with_mqa",
459
+ "model.layers.8.self_attn.kv_b_proj",
460
+ "model.layers.8.self_attn.o_proj",
461
+ "model.layers.8.self_attn.q_a_proj",
462
+ "model.layers.8.self_attn.q_b_proj",
463
+ "model.layers.9.mlp.gate",
464
+ "model.layers.9.self_attn.kv_a_proj_with_mqa",
465
+ "model.layers.9.self_attn.kv_b_proj",
466
+ "model.layers.9.self_attn.o_proj",
467
+ "model.layers.9.self_attn.q_a_proj",
468
+ "model.layers.9.self_attn.q_b_proj"
469
  ],
470
  "algo_config": null,
471
  "softmax_quant_spec": null,
 
475
  "kv_cache_quant_config": {},
476
  "kv_cache_post_rope": false,
477
  "quant_mode": "eager_mode",
478
+ "version": "0.11.2+e7a61dd5fa8",
479
  "export": {
480
  "kv_cache_group": [],
481
  "min_kv_scale": 0.0,
model-00010-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a208ad3704aa08ae37e05ff7ed30db7feca9f5f939a3ad5e7cd9f018b3074f99
3
- size 1270743528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fea8119c515eb6adf764232e17b3caf0a51f45128c0d538d3a1b235a625fb17
3
+ size 1206059840
model-00019-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb05f728dc85eb0ecc80a241b84e3a48dffb3fb8246e9b7c822a1f7c2c55f49b
3
- size 1270743456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a337c2f2209b908d7f0fee73d579bb2edf806acdbc91c8a6a264fb98df76474
3
+ size 1206059776
model-00027-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3270c2d8ff5af3d6d561d6b771307c0f25e831581d294cfd32f3ed0199acd3e7
3
- size 1270743704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1751275b155c2aafdc6f407fc2c7e62843b5b02f6b5d6406765d0d40ead51feb
3
+ size 1206060024
model-00036-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9887e107bf62c39a481dc8f968733ec3e60f72b3cccc372a3b1cf100bd9949c3
3
- size 1270743592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74aa2cbbfaa9936c97a6082530123b8afd51ea784eca1de9c7b515d96e27d6cd
3
+ size 1206059904
model-00045-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:85fd29373779cf6b15b8b98d3d8a8427b82b33fb49bb03915f631a9d1d11a2c8
3
- size 1270743528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfd50d9d1ad3608682882f8cb8ef317dc18620130eb3f893796c324f1f5fb8fa
3
+ size 1206059840
model-00054-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0bc371206285fc604e1c354ccf3be50210aca911ab65b947cd6a5e0addffe2d
3
- size 1270743456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fb2d322c665e3e90eca9857b8353903ad75f55d85f774614fd2cb741605a075
3
+ size 1206059776
model-00062-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29958391f60ccc22aa9437926b44f888ff49cd1dd4eb86636c4ca33b4e5c08e4
3
- size 1270743712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:264e1e679146c9c30a4ec21354a15ffbc29645332038ee44bb40af02cdef80f0
3
+ size 1206060032
model-00071-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3970230f532821daf40a422ccdf7e2b16e39417eb9cf10e6ed2e66e60779abe2
3
- size 1270743600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:780f8d238c583a7336491e4a7b38f9c66e549c507e19e32ac8094985f37b6eb1
3
+ size 1206059912
model-00080-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3aea3f757b8c757aee66fa5991ce797561c4a9530db1db477499d4201b079c6
3
- size 1270743688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3969fc6920d5bac1435606235c54d1711f0dd5f3cda89f9b408fec514a022386
3
+ size 1206060008
model-00089-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ea39f037c74b8c1464a8483b22af99a8c77b4e4862a42821504d8101d43523a
3
- size 1270743728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbce3096af7b461411a8e17dc9501ce3cdcca16c33c1e87aa55c63ba1cd8825c
3
+ size 1206060048
model-00097-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de0c5dded8df7ba93c08344fdd7d4e07174b1786a47475c1f355d76cee7838aa
3
- size 1270743976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb36c8a0c00d24ed2cbc11632b01d172f2d5ece63f3b3fd67d7fc416c6b6f4a4
3
+ size 1206060296
model-00106-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6a596ebdb97a336a872927d6ee805bc0b24a0635eb9203613bb6e2cea05ddad
3
- size 1270743864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6f8e685364d434db2ff99191504cb463d0e89ce4b8286596a75643f6708d99b
3
+ size 1206060176
model-00115-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2fbc44a46b592565c4556d66baf74bd6f008a7cfc556c6503f3e4d7d6c4a57e
3
- size 1270743792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56775aa2844909bffe22ccd1864176bd6d0ddb532b6f7875641d0be1d5f058a3
3
+ size 1206060112
model-00124-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89221a2e36738fba5c493111faf3ee322d40d8902efe9da81729e2625fa82d3c
3
- size 1270743728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:495065129673395e30c45c8d7f8f6bf025e0e6d909e82313517802bcd2162f37
3
+ size 1206060048
model-00132-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a89a3b454b5d1d476150fa6d372ce7f5f60f285b92f071e2c6b053fd707f544
3
- size 1270743976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64c8011432d14d54bf8ca50eccda8b4e4802c532319656b7986cffaa0c5a1d69
3
+ size 1206060296
model-00141-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad9bd65f2281656707ffccd6c9804871927177158cc1749df13bbe24de22aa29
3
- size 1270743856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cce968bbd4037158861af19a6cc280f58681a10244be7f9355b250afc5a19a0a
3
+ size 1206060176
model-00150-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:582cd87d4190d3753b5aa32d5eefe4657981d7446e132b882d61cf41d028546f
3
- size 1270743792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cff72343fc973ae27fbe7eaadccd36d36583a59399fb6372d3f044159a77283a
3
+ size 1206060112
model-00159-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c067d353f6fb754b12232b3bd3accd3c4694b915a0eea7cf1ff96edd38095c1e
3
- size 1270743728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ab096528970a2810a7f2f1acb764182e251db6f1d4807d3f9c2f6e9add3c8bb
3
+ size 1206060048
model-00167-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e59cf0e3f3476097053ac09f10664e6cc35ceab52837c80c7aaa612eec989a32
3
- size 1270743976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc2efdb3eeab410ef7e24a1194d6ca58af12b7244056333a8a505fb073fc3236
3
+ size 1206060296
model-00176-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1e0f9b8bf25f8f17d3c54ac683ed8c94b274f39ba166fe56616348582fc8fc3
3
- size 1270743856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:deb6f27b9fe2468cbafdb9aab9b520478a408249df60bf673f15287d45682225
3
+ size 1206060176
model-00185-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c818abd2d661cf5d10a42a357c5bd97c34876b07583f6667e30d1741ae888f68
3
- size 1270743792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a05673b9afc75f7421ad5b2985c58398c4a6f3e440f647ca43c1c7d16a2ffcc0
3
+ size 1206060112
model-00194-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5700c9ff171a0c84758c7746fddf941a8170c9369e358e54b597265c963163a
3
- size 1270743728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01e9969864658b0ac91ff38c502db516f75581016417a8532567e7267a3d3692
3
+ size 1206060048
model-00202-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6b9b15b72b0a8169abd9975dcffe3ce843445632dda8b85e5ab90d2255f871a
3
- size 1270743984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9f790f10c5a63528d1ff8083b3faeb9d2deca8926fb4a209660e2557b7253bb
3
+ size 1206060304
model-00211-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2f28dfee7c7aab25752d36bde3a4a0c8314dbef44d3a2b1d1bc207e2294491a
3
- size 1270743864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9fd01ce686e2e68e4fd3ae725622e31281df5b17975dce7cf74bcd166b5db15
3
+ size 1206060176
model-00220-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6fd0e163c94fc8c427d7b4118c15466c73aadb4d5d06d0a2a69a8b2b23acafd9
3
- size 1270743792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c58497fd5cfc58f5b781ab4be0cc7639acd9be8a925f06ac3abd882e9ab40bc
3
+ size 1206060112
model-00229-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a81bcbcdd8bd3c20d9d79d2af543b136d4d9ecb95e9fc92ddcc70b128dfccb0a
3
- size 1270743728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9941ca2b869708dd7e26e47ceceae79a7f4bbe7fae0bf83760174cb151b9d754
3
+ size 1206060048
model-00237-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e776cb48d02f1d849d0b7890982667608ea143c69a77288592f7bc89455fc49
3
- size 1270743984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a70e5e6f9208bf8422f63bb8c63e94170a1db8d5076e61843a41cf09363adba
3
+ size 1206060304
model-00246-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80382f7e8133ef17f944f1e6c3dc9f0a3a353b4152ec0ecb3072bb1fd467776d
3
- size 1270743864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a28f676de7990497ef29ca74753169b6b1efffb156d9d3feae674d2161b7dc96
3
+ size 1206060176
model-00255-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5a803d662180cbac1ea24f930cd4145f19c55749d3b4a11fd6ef5f7a989bb0c
3
- size 1270743792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ddbea33feb0741fc55c1a7be1e24e708ef743d472bbc722b29179c8c1296806
3
+ size 1206060112
model-00264-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8956381bf22b284f9771a10968809592e1e1b70ac3e0593b80ec4003076cbed
3
- size 1270743728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be3f448eb206ba6db2099e6cfe9f87ea4048e0340e30ba0ba5e17c7bd6bede19
3
+ size 1206060048
model-00272-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15068d119f24cfeeebd7130c6a133ae6812e4d850406448b13aa040a08173b37
3
- size 1270743992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94a5678a472a8fcdff0e879ae733ebabb0f7445df72c12899243bfeb3659e433
3
+ size 1206060312
model-00281-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bcaa224a3908c7333c6cc6c5fbe881fc1acaf96888d65d53f26babf6ebefdaa4
3
- size 1270743864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d93b34205b8a849a248e3bf0a08039833afefc21828ae96f693d31c83d52ab23
3
+ size 1206060184
model-00290-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cbe7bcf77098ff7dfc069007058f89e2543ed7f73bc8c6b5ab9c136d0600a2d
3
- size 1270743800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcc3881ec8dc52140b0961558d2d53e1782c2abba2241a0c96e26c4c10d7ed83
3
+ size 1206060120
model-00299-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc346ffe1c20208fbab8eee612816ab9015ba8452e8babe4d0db10e85f1943bc
3
- size 1270743736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ea8a15a11c4b97aff9100bd63fb9a2f3f4d342572e6fd8387c93813ea8ab94d
3
+ size 1206060056
model-00307-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab0ed64d2b869dfad1096d1330331140022de1f99a08b66e00d407616a4573e5
3
- size 1270743992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed61aaba8ebade05b4de020eb4c76aa8c4cb8d4dffa8a810a13f273dfbbbdfb7
3
+ size 1206060312
model-00316-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c5a9bed1e671e739db8235f57cbdbb462feeef9e49711759aa849e466460c1f
3
- size 1270743864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93c5fe0da1a19fa85e8faefb0e323d00da19dac3ca61e513776aed08a9f35f4f
3
+ size 1206060184
model-00325-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d6d1fa0386570b15053344e357312ba088f030476c664563f3c8700086654034
3
- size 1270743800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac95094e54577ff487b6ae3cd279ee6e1750d85401fb5acc2aaa2144ea2a68dd
3
+ size 1206060120
model-00334-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea45e6b1a7e6a653bf028c79fd3597c992703d9111cc6efca7dbb9875a90a52d
3
- size 1270743736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75be5b64b4ace92c4a869afbb02671e3c9841f74d3832806506b769147d09d0b
3
+ size 1206060056
model-00342-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70d58c612e9c02f9415c295bdf6071e0714ca3b707a2e841645bc5eff5ba801e
3
- size 1270743992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cdf79f728e0d097547998a5f6b2c15ca729b4d90fb809650552d3c99eb88150
3
+ size 1206060312
model-00351-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:642d30d676c184c8851f9cf76b2cbc916b0830382aa218637c074ccfec55b527
3
- size 1270743864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c8b75033d9170344561ce074f1ecdc8e603dcb12c614ca12868285518a0bc1e
3
+ size 1206060184
model-00360-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd67fee1f4585c2233ef67f9ec76d58142b073d4e3674703853452234c3f0d27
3
- size 1270743800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa9927c7fb51b66323c8cf01be4e03c7557d7fe0c9d445262e322f7aeb57c62f
3
+ size 1206060120
model-00369-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cf258481db2ca93b3f1e8bae206d10f2b84c052bdb7c96858043390aebe56ff
3
- size 1270743736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd30770f1ba29e7cb5a66ec3f6a60c53f5c5628f966b5c43f3761d19bbcd649f
3
+ size 1206060048
model-00377-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:853cf195a1d3e249f63e9c6abb4b791638cf49a11503c8ec0c539470e7e0b329
3
- size 1270743992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9be28ddab9e6ac9457c8a506608bbc91cc36cfb66bb960ba62b7fdd28a56cb5
3
+ size 1206060312
model-00386-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87a44b87d830fd4fc1476b388c81fba46fa44c683d6dd53d26de68ca177dc380
3
- size 1270743864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc4864728b5b184e1344141bfb9dd9a3d0cfce92b4d08d467ff7ffbdc8c5fdcb
3
+ size 1206060184
model-00395-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f0ccb918f23a370e00d55f6f217a103f2e2acf2aeb4b7cf897debe815a81e4e
3
- size 1270743800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71a28a512328c678f506c0398bde093d70d7e8959f51f93e52766056adf98179
3
+ size 1206060120
model-00404-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1250cb87f1746ec6a75780d3604a900f1618c31ea9fd2964bc554f730df040d3
3
- size 1270743736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:440c3066c08e516967f6cf5896064ef83351230f635e0fae9b415f513a1b05e4
3
+ size 1206060048
model-00412-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bfd070374a55c42994883ec0a97131bf53e49597a992979720cef09b6c30a26b
3
- size 1161102344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fa84e05fc48b27a0aabd15ea993787b290ffa2b1fa4441a79a55b4b9f976250
3
+ size 1096418648
model-00421-of-00527.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5a396dfe5a41c34a7125aff72641a0740faf7d203a41bb16d8c8f8e15953c4a
3
- size 1270743872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02a9c10c34d19537eb5fe8a55403f4b097cdc2cea34a1232cb5c392cc312fd0e
3
+ size 1206060192