amychensima committed on
Commit
4865972
·
verified ·
1 Parent(s): 753b27c
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. console.log +56 -0
  2. devkit/precision.json +79 -79
  3. devkit/vlm_config.json +1 -0
  4. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token0_stage1_mla.elf +2 -2
  5. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1024_stage1_mla.elf +2 -2
  6. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1152_stage1_mla.elf +2 -2
  7. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1280_stage1_mla.elf +2 -2
  8. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token128_stage1_mla.elf +2 -2
  9. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1408_stage1_mla.elf +2 -2
  10. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1536_stage1_mla.elf +2 -2
  11. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1664_stage1_mla.elf +2 -2
  12. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1792_stage1_mla.elf +2 -2
  13. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1920_stage1_mla.elf +2 -2
  14. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token256_stage1_mla.elf +2 -2
  15. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token384_stage1_mla.elf +2 -2
  16. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token512_stage1_mla.elf +2 -2
  17. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token640_stage1_mla.elf +2 -2
  18. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token768_stage1_mla.elf +2 -2
  19. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token896_stage1_mla.elf +2 -2
  20. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer0_stage1_mla.elf +2 -2
  21. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer10_stage1_mla.elf +2 -2
  22. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer11_stage1_mla.elf +2 -2
  23. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer12_stage1_mla.elf +2 -2
  24. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer13_stage1_mla.elf +2 -2
  25. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer14_stage1_mla.elf +2 -2
  26. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer15_stage1_mla.elf +2 -2
  27. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer16_stage1_mla.elf +2 -2
  28. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer17_stage1_mla.elf +2 -2
  29. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer18_stage1_mla.elf +2 -2
  30. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer19_stage1_mla.elf +2 -2
  31. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer1_stage1_mla.elf +2 -2
  32. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer20_stage1_mla.elf +2 -2
  33. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer21_stage1_mla.elf +2 -2
  34. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer22_stage1_mla.elf +2 -2
  35. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer23_stage1_mla.elf +2 -2
  36. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer24_stage1_mla.elf +2 -2
  37. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer25_stage1_mla.elf +2 -2
  38. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer26_stage1_mla.elf +2 -2
  39. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer27_stage1_mla.elf +2 -2
  40. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer28_stage1_mla.elf +2 -2
  41. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer29_stage1_mla.elf +2 -2
  42. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer2_stage1_mla.elf +2 -2
  43. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer30_stage1_mla.elf +2 -2
  44. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer3_stage1_mla.elf +2 -2
  45. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer4_stage1_mla.elf +2 -2
  46. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer5_stage1_mla.elf +2 -2
  47. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer6_stage1_mla.elf +2 -2
  48. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer7_stage1_mla.elf +2 -2
  49. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer8_stage1_mla.elf +2 -2
  50. elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer9_stage1_mla.elf +2 -2
console.log ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ None of PyTorch, TensorFlow >= 2.0, or Flax have been found. Models won't be available and only tokenizers, configuration and file/data utilities can be used.
2
+ None of PyTorch, TensorFlow >= 2.0, or Flax have been found. Models won't be available and only tokenizers, configuration and file/data utilities can be used.
3
+ VLM initialization starting ...
4
+ VLM initialization completed.
5
+ >>> Query: Why is the sky blue?
6
+ Assistant: The color of the sky is not inherently "blue," but rather the result of a phenomenon known as Rayleigh scattering. Here's a simplified explanation:
7
+
8
+ 1. Sunlight is composed of a wide range of wavelengths, which we perceive as different colors.
9
+
10
+ 2. When sunlight enters Earth's atmosphere, it interacts with the gases and particles present in the air.
11
+
12
+ 3. The Earth's atmosphere is mostly made up of nitrogen and oxygen, which are very effective at scattering shorter wavelengths of light.
13
+
14
+ 4. Shorter wavelengths include the blue and violet parts of the visible spectrum.
15
+
16
+ 5. When sunlight enters the atmosphere, the shorter blue and violet wavelengths are scattered in every direction by the gases and particles in the air.
17
+
18
+ 6. Because the blue and violet light is scattered more than the other colors, the scattered blue and violet light reaches our eyes more frequently than the other colors.
19
+
20
+ 7. This scattered blue and violet light is what we see when we look up at the sky during a clear day.
21
+
22
+ 8. During the daytime, the sky appears predominantly blue because the scattered blue and violet light is more prevalent than the other colors.
23
+
24
+ 9. At sunrise and sunset, the light has to pass through more of the Earth's atmosphere, which causes even more scattering of the blue and violet light. This is why the sky often appears red or orange during these times.
25
+
26
+ In summary, the blue color of the sky is primarily due to the scattering of shorter wavelengths of light (blue and violet) by the gases and particles in the Earth's atmosphere. This scattering effect is more pronounced during the daytime, which is why the sky appears predominantly blue during these hours.
27
+
28
+ Number of generated tokens: 408
29
+ TTFT: 0.22s
30
+ TPS: avg=16.69, quantiles=['17.54', '16.76', '16.53', '16.14']
31
+ >>> Query: Summarize
32
+ Assistant: The sky appears blue due to Rayleigh scattering, where shorter blue and violet wavelengths of sunlight are scattered by atmospheric particles. This scattering is more pronounced during daytime, making the sky predominantly blue. The scattering effect is more intense during sunrise and sunset, leading to red or orange hues in the sky.
33
+
34
+ Number of generated tokens: 80
35
+ TTFT: 0.20s
36
+ TPS: avg=15.55, quantiles=['15.73', '15.52', '15.49', '15.46']
37
+ >>> Query: Tell me a story based on this
38
+ Assistant: Once upon a time, in a land where the sky was always a vivid blue, there lived a young girl named Lily. Lily had always been fascinated by the color of the sky, and she often wondered why it was blue.
39
+
40
+ One day, while Lily was exploring the outskirts of her village, she stumbled upon an old, wise man named Old Thomas. Seeing the curiosity in Lily's eyes, Old Thomas decided to share the secret behind the blue sky.
41
+
42
+ "My dear," Old Thomas began, "the reason the sky is blue is due to a phenomenon called Rayleigh scattering. You see, the Earth's atmosphere is filled with tiny particles and gases, which are excellent at scattering shorter wavelengths of light."
43
+
44
+ Lily listened intently as Old Thomas continued, "The blue and violet wavelengths of light, which are the shortest, are scattered more than the other colors. This scattered blue and violet light reaches our eyes more frequently, and that's why we see the sky as predominantly blue during the day."
45
+
46
+ Lily was amazed by this revelation and thanked Old Thomas for his wisdom. From that day forward, Lily looked up at the sky with a newfound appreciation for the beautiful blue hue that adorned the heavens above.
47
+
48
+ And so, the story of Lily and the blue sky became a cherished tale in the village, reminding everyone of the wonders of our natural world and the simple yet fascinating reasons behind the color of the sky.
49
+
50
+ And they all lived happily ever after, gazing up at the sky, always remembering the story of Lily and the blue sky.
51
+
52
+ Number of generated tokens: 373
53
+ TTFT: 0.29s
54
+ TPS: avg=15.16, quantiles=['15.52', '15.08', '15.04', '14.95']
55
+ >>> WARN:starting syslog with prefix MLA-RT
56
+ ~MLALogger: logger is closed
devkit/precision.json CHANGED
@@ -2,397 +2,397 @@
2
  {
3
  "part": "group_pre",
4
  "idx": 0,
5
- "precision": "A_BF16_W_INT4"
6
  },
7
  {
8
  "part": "group_pre",
9
  "idx": 1,
10
- "precision": "A_BF16_W_INT4"
11
  },
12
  {
13
  "part": "group_pre",
14
  "idx": 2,
15
- "precision": "A_BF16_W_INT4"
16
  },
17
  {
18
  "part": "group_pre",
19
  "idx": 3,
20
- "precision": "A_BF16_W_INT4"
21
  },
22
  {
23
  "part": "group_pre",
24
  "idx": 4,
25
- "precision": "A_BF16_W_INT4"
26
  },
27
  {
28
  "part": "group_pre",
29
  "idx": 5,
30
- "precision": "A_BF16_W_INT4"
31
  },
32
  {
33
  "part": "group_pre",
34
  "idx": 6,
35
- "precision": "A_BF16_W_INT4"
36
  },
37
  {
38
  "part": "group_pre",
39
  "idx": 7,
40
- "precision": "A_BF16_W_INT4"
41
  },
42
  {
43
  "part": "group_pre",
44
  "idx": 8,
45
- "precision": "A_BF16_W_INT4"
46
  },
47
  {
48
  "part": "group_pre",
49
  "idx": 9,
50
- "precision": "A_BF16_W_INT4"
51
  },
52
  {
53
  "part": "group_pre",
54
  "idx": 10,
55
- "precision": "A_BF16_W_INT4"
56
  },
57
  {
58
  "part": "group_pre",
59
  "idx": 11,
60
- "precision": "A_BF16_W_INT4"
61
  },
62
  {
63
  "part": "group_pre",
64
  "idx": 12,
65
- "precision": "A_BF16_W_INT4"
66
  },
67
  {
68
  "part": "group_pre",
69
  "idx": 13,
70
- "precision": "A_BF16_W_INT4"
71
  },
72
  {
73
  "part": "group_pre",
74
  "idx": 14,
75
- "precision": "A_BF16_W_INT4"
76
  },
77
  {
78
  "part": "group_pre",
79
  "idx": 15,
80
- "precision": "A_BF16_W_INT4"
81
  },
82
  {
83
  "part": "group_pre",
84
  "idx": 16,
85
- "precision": "A_BF16_W_INT4"
86
  },
87
  {
88
  "part": "group_pre",
89
  "idx": 17,
90
- "precision": "A_BF16_W_INT4"
91
  },
92
  {
93
  "part": "group_pre",
94
  "idx": 18,
95
- "precision": "A_BF16_W_INT4"
96
  },
97
  {
98
  "part": "group_pre",
99
  "idx": 19,
100
- "precision": "A_BF16_W_INT4"
101
  },
102
  {
103
  "part": "group_pre",
104
  "idx": 20,
105
- "precision": "A_BF16_W_INT4"
106
  },
107
  {
108
  "part": "group_pre",
109
  "idx": 21,
110
- "precision": "A_BF16_W_INT4"
111
  },
112
  {
113
  "part": "group_pre",
114
  "idx": 22,
115
- "precision": "A_BF16_W_INT4"
116
  },
117
  {
118
  "part": "group_pre",
119
  "idx": 23,
120
- "precision": "A_BF16_W_INT4"
121
  },
122
  {
123
  "part": "group_pre",
124
  "idx": 24,
125
- "precision": "A_BF16_W_INT4"
126
  },
127
  {
128
  "part": "group_pre",
129
  "idx": 25,
130
- "precision": "A_BF16_W_INT4"
131
  },
132
  {
133
  "part": "group_pre",
134
  "idx": 26,
135
- "precision": "A_BF16_W_INT4"
136
  },
137
  {
138
  "part": "group_pre",
139
  "idx": 27,
140
- "precision": "A_BF16_W_INT4"
141
  },
142
  {
143
  "part": "group_pre",
144
  "idx": 28,
145
- "precision": "A_BF16_W_INT4"
146
  },
147
  {
148
  "part": "group_pre",
149
  "idx": 29,
150
- "precision": "A_BF16_W_INT4"
151
  },
152
  {
153
  "part": "group_pre",
154
  "idx": 30,
155
- "precision": "A_BF16_W_INT4"
156
  },
157
  {
158
  "part": "group_pre",
159
  "idx": 31,
160
- "precision": "A_BF16_W_INT4"
161
  },
162
  {
163
  "part": "group_post",
164
  "idx": 0,
165
- "precision": "A_BF16_W_INT4"
166
  },
167
  {
168
  "part": "group_post",
169
  "idx": 1,
170
- "precision": "A_BF16_W_INT4"
171
  },
172
  {
173
  "part": "group_post",
174
  "idx": 2,
175
- "precision": "A_BF16_W_INT4"
176
  },
177
  {
178
  "part": "group_post",
179
  "idx": 3,
180
- "precision": "A_BF16_W_INT4"
181
  },
182
  {
183
  "part": "group_post",
184
  "idx": 4,
185
- "precision": "A_BF16_W_INT4"
186
  },
187
  {
188
  "part": "group_post",
189
  "idx": 5,
190
- "precision": "A_BF16_W_INT4"
191
  },
192
  {
193
  "part": "group_post",
194
  "idx": 6,
195
- "precision": "A_BF16_W_INT4"
196
  },
197
  {
198
  "part": "group_post",
199
  "idx": 7,
200
- "precision": "A_BF16_W_INT4"
201
  },
202
  {
203
  "part": "group_post",
204
  "idx": 8,
205
- "precision": "A_BF16_W_INT4"
206
  },
207
  {
208
  "part": "group_post",
209
  "idx": 9,
210
- "precision": "A_BF16_W_INT4"
211
  },
212
  {
213
  "part": "group_post",
214
  "idx": 10,
215
- "precision": "A_BF16_W_INT4"
216
  },
217
  {
218
  "part": "group_post",
219
  "idx": 11,
220
- "precision": "A_BF16_W_INT4"
221
  },
222
  {
223
  "part": "group_post",
224
  "idx": 12,
225
- "precision": "A_BF16_W_INT4"
226
  },
227
  {
228
  "part": "group_post",
229
  "idx": 13,
230
- "precision": "A_BF16_W_INT4"
231
  },
232
  {
233
  "part": "group_post",
234
  "idx": 14,
235
- "precision": "A_BF16_W_INT4"
236
  },
237
  {
238
  "part": "group_post",
239
  "idx": 15,
240
- "precision": "A_BF16_W_INT4"
241
  },
242
  {
243
  "part": "group_post",
244
  "idx": 16,
245
- "precision": "A_BF16_W_INT4"
246
  },
247
  {
248
  "part": "group_post",
249
  "idx": 17,
250
- "precision": "A_BF16_W_INT4"
251
  },
252
  {
253
  "part": "group_post",
254
  "idx": 18,
255
- "precision": "A_BF16_W_INT4"
256
  },
257
  {
258
  "part": "group_post",
259
  "idx": 19,
260
- "precision": "A_BF16_W_INT4"
261
  },
262
  {
263
  "part": "group_post",
264
  "idx": 20,
265
- "precision": "A_BF16_W_INT4"
266
  },
267
  {
268
  "part": "group_post",
269
  "idx": 21,
270
- "precision": "A_BF16_W_INT4"
271
  },
272
  {
273
  "part": "group_post",
274
  "idx": 22,
275
- "precision": "A_BF16_W_INT4"
276
  },
277
  {
278
  "part": "group_post",
279
  "idx": 23,
280
- "precision": "A_BF16_W_INT4"
281
  },
282
  {
283
  "part": "group_post",
284
  "idx": 24,
285
- "precision": "A_BF16_W_INT4"
286
  },
287
  {
288
  "part": "group_post",
289
  "idx": 25,
290
- "precision": "A_BF16_W_INT4"
291
  },
292
  {
293
  "part": "group_post",
294
  "idx": 26,
295
- "precision": "A_BF16_W_INT4"
296
  },
297
  {
298
  "part": "group_post",
299
  "idx": 27,
300
- "precision": "A_BF16_W_INT4"
301
  },
302
  {
303
  "part": "group_post",
304
  "idx": 28,
305
- "precision": "A_BF16_W_INT4"
306
  },
307
  {
308
  "part": "group_post",
309
  "idx": 29,
310
- "precision": "A_BF16_W_INT4"
311
  },
312
  {
313
  "part": "group_post",
314
  "idx": 30,
315
- "precision": "A_BF16_W_INT4"
316
  },
317
  {
318
  "part": "group_cache",
319
  "idx": 0,
320
- "precision": "A_BF16_W_INT4"
321
  },
322
  {
323
  "part": "group_cache",
324
  "idx": 128,
325
- "precision": "A_BF16_W_INT4"
326
  },
327
  {
328
  "part": "group_cache",
329
  "idx": 256,
330
- "precision": "A_BF16_W_INT4"
331
  },
332
  {
333
  "part": "group_cache",
334
  "idx": 384,
335
- "precision": "A_BF16_W_INT4"
336
  },
337
  {
338
  "part": "group_cache",
339
  "idx": 512,
340
- "precision": "A_BF16_W_INT4"
341
  },
342
  {
343
  "part": "group_cache",
344
  "idx": 640,
345
- "precision": "A_BF16_W_INT4"
346
  },
347
  {
348
  "part": "group_cache",
349
  "idx": 768,
350
- "precision": "A_BF16_W_INT4"
351
  },
352
  {
353
  "part": "group_cache",
354
  "idx": 896,
355
- "precision": "A_BF16_W_INT4"
356
  },
357
  {
358
  "part": "group_cache",
359
  "idx": 1024,
360
- "precision": "A_BF16_W_INT4"
361
  },
362
  {
363
  "part": "group_cache",
364
  "idx": 1152,
365
- "precision": "A_BF16_W_INT4"
366
  },
367
  {
368
  "part": "group_cache",
369
  "idx": 1280,
370
- "precision": "A_BF16_W_INT4"
371
  },
372
  {
373
  "part": "group_cache",
374
  "idx": 1408,
375
- "precision": "A_BF16_W_INT4"
376
  },
377
  {
378
  "part": "group_cache",
379
  "idx": 1536,
380
- "precision": "A_BF16_W_INT4"
381
  },
382
  {
383
  "part": "group_cache",
384
  "idx": 1664,
385
- "precision": "A_BF16_W_INT4"
386
  },
387
  {
388
  "part": "group_cache",
389
  "idx": 1792,
390
- "precision": "A_BF16_W_INT4"
391
  },
392
  {
393
  "part": "group_cache",
394
  "idx": 1920,
395
- "precision": "A_BF16_W_INT4"
396
  },
397
  {
398
  "part": "single_pre",
 
2
  {
3
  "part": "group_pre",
4
  "idx": 0,
5
+ "precision": "A_BF16_W_INT8"
6
  },
7
  {
8
  "part": "group_pre",
9
  "idx": 1,
10
+ "precision": "A_BF16_W_INT8"
11
  },
12
  {
13
  "part": "group_pre",
14
  "idx": 2,
15
+ "precision": "A_BF16_W_INT8"
16
  },
17
  {
18
  "part": "group_pre",
19
  "idx": 3,
20
+ "precision": "A_BF16_W_INT8"
21
  },
22
  {
23
  "part": "group_pre",
24
  "idx": 4,
25
+ "precision": "A_BF16_W_INT8"
26
  },
27
  {
28
  "part": "group_pre",
29
  "idx": 5,
30
+ "precision": "A_BF16_W_INT8"
31
  },
32
  {
33
  "part": "group_pre",
34
  "idx": 6,
35
+ "precision": "A_BF16_W_INT8"
36
  },
37
  {
38
  "part": "group_pre",
39
  "idx": 7,
40
+ "precision": "A_BF16_W_INT8"
41
  },
42
  {
43
  "part": "group_pre",
44
  "idx": 8,
45
+ "precision": "A_BF16_W_INT8"
46
  },
47
  {
48
  "part": "group_pre",
49
  "idx": 9,
50
+ "precision": "A_BF16_W_INT8"
51
  },
52
  {
53
  "part": "group_pre",
54
  "idx": 10,
55
+ "precision": "A_BF16_W_INT8"
56
  },
57
  {
58
  "part": "group_pre",
59
  "idx": 11,
60
+ "precision": "A_BF16_W_INT8"
61
  },
62
  {
63
  "part": "group_pre",
64
  "idx": 12,
65
+ "precision": "A_BF16_W_INT8"
66
  },
67
  {
68
  "part": "group_pre",
69
  "idx": 13,
70
+ "precision": "A_BF16_W_INT8"
71
  },
72
  {
73
  "part": "group_pre",
74
  "idx": 14,
75
+ "precision": "A_BF16_W_INT8"
76
  },
77
  {
78
  "part": "group_pre",
79
  "idx": 15,
80
+ "precision": "A_BF16_W_INT8"
81
  },
82
  {
83
  "part": "group_pre",
84
  "idx": 16,
85
+ "precision": "A_BF16_W_INT8"
86
  },
87
  {
88
  "part": "group_pre",
89
  "idx": 17,
90
+ "precision": "A_BF16_W_INT8"
91
  },
92
  {
93
  "part": "group_pre",
94
  "idx": 18,
95
+ "precision": "A_BF16_W_INT8"
96
  },
97
  {
98
  "part": "group_pre",
99
  "idx": 19,
100
+ "precision": "A_BF16_W_INT8"
101
  },
102
  {
103
  "part": "group_pre",
104
  "idx": 20,
105
+ "precision": "A_BF16_W_INT8"
106
  },
107
  {
108
  "part": "group_pre",
109
  "idx": 21,
110
+ "precision": "A_BF16_W_INT8"
111
  },
112
  {
113
  "part": "group_pre",
114
  "idx": 22,
115
+ "precision": "A_BF16_W_INT8"
116
  },
117
  {
118
  "part": "group_pre",
119
  "idx": 23,
120
+ "precision": "A_BF16_W_INT8"
121
  },
122
  {
123
  "part": "group_pre",
124
  "idx": 24,
125
+ "precision": "A_BF16_W_INT8"
126
  },
127
  {
128
  "part": "group_pre",
129
  "idx": 25,
130
+ "precision": "A_BF16_W_INT8"
131
  },
132
  {
133
  "part": "group_pre",
134
  "idx": 26,
135
+ "precision": "A_BF16_W_INT8"
136
  },
137
  {
138
  "part": "group_pre",
139
  "idx": 27,
140
+ "precision": "A_BF16_W_INT8"
141
  },
142
  {
143
  "part": "group_pre",
144
  "idx": 28,
145
+ "precision": "A_BF16_W_INT8"
146
  },
147
  {
148
  "part": "group_pre",
149
  "idx": 29,
150
+ "precision": "A_BF16_W_INT8"
151
  },
152
  {
153
  "part": "group_pre",
154
  "idx": 30,
155
+ "precision": "A_BF16_W_INT8"
156
  },
157
  {
158
  "part": "group_pre",
159
  "idx": 31,
160
+ "precision": "A_BF16_W_INT8"
161
  },
162
  {
163
  "part": "group_post",
164
  "idx": 0,
165
+ "precision": "A_BF16_W_INT8"
166
  },
167
  {
168
  "part": "group_post",
169
  "idx": 1,
170
+ "precision": "A_BF16_W_INT8"
171
  },
172
  {
173
  "part": "group_post",
174
  "idx": 2,
175
+ "precision": "A_BF16_W_INT8"
176
  },
177
  {
178
  "part": "group_post",
179
  "idx": 3,
180
+ "precision": "A_BF16_W_INT8"
181
  },
182
  {
183
  "part": "group_post",
184
  "idx": 4,
185
+ "precision": "A_BF16_W_INT8"
186
  },
187
  {
188
  "part": "group_post",
189
  "idx": 5,
190
+ "precision": "A_BF16_W_INT8"
191
  },
192
  {
193
  "part": "group_post",
194
  "idx": 6,
195
+ "precision": "A_BF16_W_INT8"
196
  },
197
  {
198
  "part": "group_post",
199
  "idx": 7,
200
+ "precision": "A_BF16_W_INT8"
201
  },
202
  {
203
  "part": "group_post",
204
  "idx": 8,
205
+ "precision": "A_BF16_W_INT8"
206
  },
207
  {
208
  "part": "group_post",
209
  "idx": 9,
210
+ "precision": "A_BF16_W_INT8"
211
  },
212
  {
213
  "part": "group_post",
214
  "idx": 10,
215
+ "precision": "A_BF16_W_INT8"
216
  },
217
  {
218
  "part": "group_post",
219
  "idx": 11,
220
+ "precision": "A_BF16_W_INT8"
221
  },
222
  {
223
  "part": "group_post",
224
  "idx": 12,
225
+ "precision": "A_BF16_W_INT8"
226
  },
227
  {
228
  "part": "group_post",
229
  "idx": 13,
230
+ "precision": "A_BF16_W_INT8"
231
  },
232
  {
233
  "part": "group_post",
234
  "idx": 14,
235
+ "precision": "A_BF16_W_INT8"
236
  },
237
  {
238
  "part": "group_post",
239
  "idx": 15,
240
+ "precision": "A_BF16_W_INT8"
241
  },
242
  {
243
  "part": "group_post",
244
  "idx": 16,
245
+ "precision": "A_BF16_W_INT8"
246
  },
247
  {
248
  "part": "group_post",
249
  "idx": 17,
250
+ "precision": "A_BF16_W_INT8"
251
  },
252
  {
253
  "part": "group_post",
254
  "idx": 18,
255
+ "precision": "A_BF16_W_INT8"
256
  },
257
  {
258
  "part": "group_post",
259
  "idx": 19,
260
+ "precision": "A_BF16_W_INT8"
261
  },
262
  {
263
  "part": "group_post",
264
  "idx": 20,
265
+ "precision": "A_BF16_W_INT8"
266
  },
267
  {
268
  "part": "group_post",
269
  "idx": 21,
270
+ "precision": "A_BF16_W_INT8"
271
  },
272
  {
273
  "part": "group_post",
274
  "idx": 22,
275
+ "precision": "A_BF16_W_INT8"
276
  },
277
  {
278
  "part": "group_post",
279
  "idx": 23,
280
+ "precision": "A_BF16_W_INT8"
281
  },
282
  {
283
  "part": "group_post",
284
  "idx": 24,
285
+ "precision": "A_BF16_W_INT8"
286
  },
287
  {
288
  "part": "group_post",
289
  "idx": 25,
290
+ "precision": "A_BF16_W_INT8"
291
  },
292
  {
293
  "part": "group_post",
294
  "idx": 26,
295
+ "precision": "A_BF16_W_INT8"
296
  },
297
  {
298
  "part": "group_post",
299
  "idx": 27,
300
+ "precision": "A_BF16_W_INT8"
301
  },
302
  {
303
  "part": "group_post",
304
  "idx": 28,
305
+ "precision": "A_BF16_W_INT8"
306
  },
307
  {
308
  "part": "group_post",
309
  "idx": 29,
310
+ "precision": "A_BF16_W_INT8"
311
  },
312
  {
313
  "part": "group_post",
314
  "idx": 30,
315
+ "precision": "A_BF16_W_INT8"
316
  },
317
  {
318
  "part": "group_cache",
319
  "idx": 0,
320
+ "precision": "A_BF16_W_INT8"
321
  },
322
  {
323
  "part": "group_cache",
324
  "idx": 128,
325
+ "precision": "A_BF16_W_INT8"
326
  },
327
  {
328
  "part": "group_cache",
329
  "idx": 256,
330
+ "precision": "A_BF16_W_INT8"
331
  },
332
  {
333
  "part": "group_cache",
334
  "idx": 384,
335
+ "precision": "A_BF16_W_INT8"
336
  },
337
  {
338
  "part": "group_cache",
339
  "idx": 512,
340
+ "precision": "A_BF16_W_INT8"
341
  },
342
  {
343
  "part": "group_cache",
344
  "idx": 640,
345
+ "precision": "A_BF16_W_INT8"
346
  },
347
  {
348
  "part": "group_cache",
349
  "idx": 768,
350
+ "precision": "A_BF16_W_INT8"
351
  },
352
  {
353
  "part": "group_cache",
354
  "idx": 896,
355
+ "precision": "A_BF16_W_INT8"
356
  },
357
  {
358
  "part": "group_cache",
359
  "idx": 1024,
360
+ "precision": "A_BF16_W_INT8"
361
  },
362
  {
363
  "part": "group_cache",
364
  "idx": 1152,
365
+ "precision": "A_BF16_W_INT8"
366
  },
367
  {
368
  "part": "group_cache",
369
  "idx": 1280,
370
+ "precision": "A_BF16_W_INT8"
371
  },
372
  {
373
  "part": "group_cache",
374
  "idx": 1408,
375
+ "precision": "A_BF16_W_INT8"
376
  },
377
  {
378
  "part": "group_cache",
379
  "idx": 1536,
380
+ "precision": "A_BF16_W_INT8"
381
  },
382
  {
383
  "part": "group_cache",
384
  "idx": 1664,
385
+ "precision": "A_BF16_W_INT8"
386
  },
387
  {
388
  "part": "group_cache",
389
  "idx": 1792,
390
+ "precision": "A_BF16_W_INT8"
391
  },
392
  {
393
  "part": "group_cache",
394
  "idx": 1920,
395
+ "precision": "A_BF16_W_INT8"
396
  },
397
  {
398
  "part": "single_pre",
devkit/vlm_config.json CHANGED
@@ -156,6 +156,7 @@
156
  },
157
  "pipeline_cfg": {
158
  "system_prompt": null,
 
159
  "max_num_tokens": 2048,
160
  "input_token_group_size": 128,
161
  "input_token_group_offsets": [
 
156
  },
157
  "pipeline_cfg": {
158
  "system_prompt": null,
159
+ "chat_template": null,
160
  "max_num_tokens": 2048,
161
  "input_token_group_size": 128,
162
  "input_token_group_offsets": [
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token0_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e119888ed0b403d1aace2b571736f9fe22f3231c11faa6afcc6503eafd881934
3
- size 2806120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85cec0120efdf29ed9fff2d79dc163c658216fb07473333bb5a7468bfb82c37e
3
+ size 2791080
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1024_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd93716c1c3bf405ff1c0ff31a0f041eda793ab6621c1679c7eec09098909855
3
- size 17754624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:306e155580967aec0b539e1be8f4b9a74ca713ef88242868e2cbeabdb7c36874
3
+ size 16981200
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1152_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f63dade5130d7bf2921ee68383ddae3d148d15aaec8c879f8f509151542890c
3
- size 29709256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54c560a01c5e589bef46d819745b776fdd3506b75704e29327cde13400ef78dd
3
+ size 19303232
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1280_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3c85884365e187d7585782b0d37e3841b4545f02e29741f3f732200ae3f0ee7
3
- size 20976680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0d4aa2cd04c5aa36a7d36c43280b4ecb554e21e9366c9c6a4db99a578284555
3
+ size 16720592
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token128_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8b5ca1ea167ec6c617f63499882548ccc6a73d19aa5b1f06d53475ac5347363
3
- size 5810008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3a4fbe2839f039ab938a6cb0fc3d1c36c63886c4e02900dcbac5454235888fa
3
+ size 5768480
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1408_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b40588f36f2dc769b5631d19a610c7f56d9df4d66cca038f2b744d82bf8ebe4
3
- size 22573632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac5d783e8cc447fce24d92b2f32702ea003d3513535cd98d03e454d2a2688fe3
3
+ size 22171144
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1536_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:117a5e683519e004b03ec7b72cb9093338d85973497fac6e188b98da897823ce
3
- size 19542072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d63ae2b5395be65258a55bfa739fb93caffc3ad111252378602c9efd28b655bc
3
+ size 20442664
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1664_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dee3a8e5b7e9abc6a9af40bd74470d3f32eb0925edaf30f7b076db3ea6429a0a
3
- size 37121168
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fa2b87365342848132fab3e93d504c1f52dac1ac35625b029270b1e75fc67ab
3
+ size 23555720
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1792_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08aa5dc1bacb986b86e9ac102e51b8ce07589c900958b008b8b8ace13df9dd46
3
- size 35241480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeb3a1c3f9d2f7ea4fd754233487f74041ca72b421e8b4da8a940f60c16f5089
3
+ size 32170720
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token1920_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca57c0b65c48b33fed767c4a14545ee13f0bfb4d5064dfc34267d58944f2096f
3
- size 28561216
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c85cd94b8b2187466df99c44086062be1f51e9108fcd629bfe1b63af188b4eab
3
+ size 28154376
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token256_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:977417da6fa3ea731b75308fda9cecca26ae2b686dd404bdf9de48d3c776184c
3
- size 7865736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96a406e9888189d8385ce8a328a81aef2054cd2217a8d494271ca53b82ea761b
3
+ size 6556448
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token384_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:686d65092349e53b9a2c2c05bd74aeab1c01e2432a3085ace2c056f33a70486f
3
- size 6770576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab1adfa87f65486efe1a36ef43a6e5c7f84072b217e4c6f02f55dc1e9dbc1c7f
3
+ size 6492288
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token512_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab7502d79a87eaee78bf89a3f172f95e45392594b89c0122935126ebe0957346
3
- size 10238120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bff20905c5ba3706f18ab02f2a27b6a84506e99b67ae779d74b86e893b924ca3
3
+ size 9054384
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token640_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4eb640502d4b456376fc990b0ffee55d35a0c7d4133e4d51b2051de6d93084f
3
- size 9989472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21479880aef7ad9eec360a90bf56b33499e240f3cfe7c0565f41ae4b347c5e88
3
+ size 9555360
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token768_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d95acf54963c7075903d04d9ff7a7fc520f79f24b58d93643306a379245796c7
3
- size 15419304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5f3f07e099f16bff685f747633ef0ee9f92845f9070c0629836c4655f5064dd
3
+ size 9288688
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_cache_token896_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c902d33b27355a4f67d1a4802eeb621cbb1b2040fae75a61408c383b1f20dec4
3
- size 9438824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:210e11d7d4e6f70ddf3e1e2e62bf9e892a3279ba19c7e1ebb85e90fdc7c45ef4
3
+ size 10956568
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer0_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45c19cc4d0b46bbe145514c976d6bba45e6a47a6cb0a48ff3fba435e4488a7f3
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e37201d3d0f3867b9e8c03129ac542450c60b9ca81075c5ce6fbe7970e3ba69
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer10_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e319335d03069e02ebcc18782d4e2ee3f5947ce4edb240288afd68ee56cba6e
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e60c695cbab0e72505f382e8b851267a01c0e09ccad9f22e0eae061828520f98
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer11_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb893c0054da92d4c6361adf2a7032273d4b4eef48018c3b12d2a88e4f243df2
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc71524461b5fcf332e16aac31036f19a31a306ec4ad61091cfd5769c58f01b3
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer12_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f02348fd697142219cf1f67474542fd1f32b1356969e2132df7ec006905f03e
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d83536b31cf67f1bce4806585b49b791f121fd5ec8d3f281eda89720deb42689
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer13_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b758f9fc3f6a62bc0478bdfc12a24bcde30e58375632660283c480b33ca7108b
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75cffdf8a8c427ddf2c5bbc30a88d189f7865f860d40fd650e8bc30d1c1d21dc
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer14_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b8d0ab30ce0f216727092f1d09a684711e1d0aa9d085fecb97822e07ab08883
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36071cac60add851320bd0cad3689341dbd22062648bbd7e90df55a2cce429ee
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer15_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00334e509c582204d39d997adb650e51dba87f6f6489b5a73a061d3225253f6f
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d9b952448fa52daf12607a95950ef7c75e0ca245fbea6a02f751a36d7b0f4e4
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer16_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fb481f8b70334a7d8ad26176bd38dbb4529eefdca188fbdf7380a0a741406ff
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3698e5baae76adb2642024ae9fe0abc3b7dfafddcc680f8f7936b1db652b6f56
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer17_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e752b67f844c2ceeaaa8b01ee52e4244e24f18622a0ad3ce439f9200fdb488fc
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfa52ad11fb00e7a59525829c3747b9a7ca186097c9bfefd1c3ec9176b67d82e
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer18_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e0635169a104836b727a750e6aca7ac2e96e722af401357826c9852b6478a60
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3c60a9e8d773c3bd4fc1eae133497ac33c2b21660209db396ca8e8c60562eb0
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer19_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d89c90bc7fbe20defb8283707228a5439480a12c2ade68374bcc0eb5dd4715bb
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8d144039ab89a21fc20e64b22772a6506cee4c22c16ccc00809db1337490b0e
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer1_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63180a25a6a6feb780c959e2fb6e8ff3c0da6e68451ce71e0a0acf30199a3362
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:927449056924b746e8c3c3d6117e0633c67c40438f11644fdd3fa9b6798da197
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer20_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14cdf3104ed8d85921db17bb2a61af619e5b856199f78fd59ddb3ef5f16ca288
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dab1442111a92f49ddd62c1ab11f096849843675a8382186dd5f8830213f2949
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer21_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:896d498aecdf7000b4cd963167bcbb486bad9528e019780531fa6acafdfeb395
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37dde19a46f9a81d70809a6ca965c8bc6dc815d38734d415c7114fc1844fb462
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer22_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06a7a0db1f0725a4719a09a2cece85d1869538e2b0f64549b2e3d4a91dfb67d2
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9e5947d54be1e8aac066ac937cacabea08a6acff338c205813398c68b967f37
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer23_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10aa722cb799a7dfe1a08a263c2594c70a3fbd6aa3205086c4200585ac788de7
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:817a8a1912244c4b3da4add0d2c6de4641ffce8262cc646ea8e56313ee1bd00b
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer24_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d152c8b7920b553f8a43c8bf045ecf7ad15e16758f9df6f600364991352b2762
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed34a5ca83599992aab9bd0f49fb4d7c43833eccba07f40a442fdc1bc766fffc
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer25_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a46e73857b23e3ca62d41bbca3d1ffa6930f4a255fcb9f6b443fafd59a05d850
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb8e6cdfb7d80d2936a29f9d486b15ad1101fa6f5c8af4fe2fdf565d3965b6f0
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer26_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03f9b701c1c32dbbcb35b7498c65edbb4596115bc2d7267ff9dd962066f9174e
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16caf4dd3764c7c92142cc202c71765e7f4770b65b425522ebb8dde287f0311f
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer27_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74ffc33717cac73702b97fd9a7a2ffd079120de76b8fdd5f74b8f90e4a109a15
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b07a10bf2dc5027d42f5f750926aaaa36ba914f82c743669c9f24265d0154413
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer28_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5209b59df1d59ee64300806983d3b55d0d887403db9081a5ddeed7fce4ceb2df
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f2195b39296f4c1a3273949bf3807692082f02fb38bae8c3a2fed26eaa8f90c
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer29_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13dc7881c03b1704f08d71472fa0748e123bc3e818036daa428b073f57596ed6
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e42dc955e1a574c0efa0ed5415b528dfb9e33b92fab47f23846b58bc1378cb86
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer2_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f4cac9baf46e861007ec2689a59d885ffc08906a9a1fcbf51990460ba7bec4b
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc27b368ef2751cc5b10bdb2f62b25e1ede340c2aa7cfa999efcddeabfd5b176
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer30_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c340640dd1622df8cd9e534ced75c6481f7dc57fc61ed457dfe76b4f4322af71
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dddb679cee5228aa9cb322fed6c3cf545a6be81649ae3e220d0b7f5bb6c06ff4
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer3_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b99f0c0dab6cd17838ab602804b0e28ab518527cf1d94da647280eb31d77ce08
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:428e69ddfdb4eefe78659af5eb2787420dab5ba09d80fc87aa68cbb4ae40b85c
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer4_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ecaf17f00dd70fbb6810028a5af529e0fb99bb19fe69a99cb32ab278129b5ba6
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44b92bf422e6e6068836729179e01ed722267d1d5a724e7ef33cf0fc69f96efb
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer5_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aec69cf586411d15dfb8bfe34e3ec503357fcfacfa9f0b20428adeacb994badc
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc33459bed95e82f910cf8a4fab688699a0c1e2c1fa8c7a463c0f4a03f26f8f6
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer6_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ec701090cbbf3215fbc3d9d99c66ec5d7fb3defc6f266ae26603bf32351e30e
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3972440c3b04d04110a0f10236c718dc41d2dc245944ebe8df115c79d3695c1f
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer7_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8d19195d0b6fb408d1737f8e198679f602554c1a0828e3611182480fe4dd0ea
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d295cf8d749f6520215135be0c592d891eb8f3f47c95689136138bb2dba6ffb
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer8_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7acf33986d112db2fa0dbcea99433e7d1d2280feb0d67f799d75fb932b77d93
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e0b03273beea42d710d6fbc7b23bd4b26d5e0eede80e322ab81d67855531508
3
+ size 97409136
elf_files/models--microsoft--Phi-3.5-mini-instruct_language_n128_post_layer9_stage1_mla.elf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:178bd8530b0cb894a7d4069b262de717a80908d6b3a8448ff532bd648d7f8674
3
- size 112493256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:886ea4016e0ec59fc9fdce6228e31bd8ec481c08f56dff3d34a201648c036cbd
3
+ size 97409136