dourakushinju committed on
Commit
54a8fba
·
verified ·
1 Parent(s): 76e0a69

Add files using upload-large-folder tool

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,1034 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</action>": 151670,
3
+ "</think>": 151668,
4
+ "</tool_call>": 151658,
5
+ "</tool_response>": 151666,
6
+ "<0>": 151675,
7
+ "<100>": 151775,
8
+ "<101>": 151776,
9
+ "<102>": 151777,
10
+ "<103>": 151778,
11
+ "<104>": 151779,
12
+ "<105>": 151780,
13
+ "<106>": 151781,
14
+ "<107>": 151782,
15
+ "<108>": 151783,
16
+ "<109>": 151784,
17
+ "<10>": 151685,
18
+ "<110>": 151785,
19
+ "<111>": 151786,
20
+ "<112>": 151787,
21
+ "<113>": 151788,
22
+ "<114>": 151789,
23
+ "<115>": 151790,
24
+ "<116>": 151791,
25
+ "<117>": 151792,
26
+ "<118>": 151793,
27
+ "<119>": 151794,
28
+ "<11>": 151686,
29
+ "<120>": 151795,
30
+ "<121>": 151796,
31
+ "<122>": 151797,
32
+ "<123>": 151798,
33
+ "<124>": 151799,
34
+ "<125>": 151800,
35
+ "<126>": 151801,
36
+ "<127>": 151802,
37
+ "<128>": 151803,
38
+ "<129>": 151804,
39
+ "<12>": 151687,
40
+ "<130>": 151805,
41
+ "<131>": 151806,
42
+ "<132>": 151807,
43
+ "<133>": 151808,
44
+ "<134>": 151809,
45
+ "<135>": 151810,
46
+ "<136>": 151811,
47
+ "<137>": 151812,
48
+ "<138>": 151813,
49
+ "<139>": 151814,
50
+ "<13>": 151688,
51
+ "<140>": 151815,
52
+ "<141>": 151816,
53
+ "<142>": 151817,
54
+ "<143>": 151818,
55
+ "<144>": 151819,
56
+ "<145>": 151820,
57
+ "<146>": 151821,
58
+ "<147>": 151822,
59
+ "<148>": 151823,
60
+ "<149>": 151824,
61
+ "<14>": 151689,
62
+ "<150>": 151825,
63
+ "<151>": 151826,
64
+ "<152>": 151827,
65
+ "<153>": 151828,
66
+ "<154>": 151829,
67
+ "<155>": 151830,
68
+ "<156>": 151831,
69
+ "<157>": 151832,
70
+ "<158>": 151833,
71
+ "<159>": 151834,
72
+ "<15>": 151690,
73
+ "<160>": 151835,
74
+ "<161>": 151836,
75
+ "<162>": 151837,
76
+ "<163>": 151838,
77
+ "<164>": 151839,
78
+ "<165>": 151840,
79
+ "<166>": 151841,
80
+ "<167>": 151842,
81
+ "<168>": 151843,
82
+ "<169>": 151844,
83
+ "<16>": 151691,
84
+ "<170>": 151845,
85
+ "<171>": 151846,
86
+ "<172>": 151847,
87
+ "<173>": 151848,
88
+ "<174>": 151849,
89
+ "<175>": 151850,
90
+ "<176>": 151851,
91
+ "<177>": 151852,
92
+ "<178>": 151853,
93
+ "<179>": 151854,
94
+ "<17>": 151692,
95
+ "<180>": 151855,
96
+ "<181>": 151856,
97
+ "<182>": 151857,
98
+ "<183>": 151858,
99
+ "<184>": 151859,
100
+ "<185>": 151860,
101
+ "<186>": 151861,
102
+ "<187>": 151862,
103
+ "<188>": 151863,
104
+ "<189>": 151864,
105
+ "<18>": 151693,
106
+ "<190>": 151865,
107
+ "<191>": 151866,
108
+ "<192>": 151867,
109
+ "<193>": 151868,
110
+ "<194>": 151869,
111
+ "<195>": 151870,
112
+ "<196>": 151871,
113
+ "<197>": 151872,
114
+ "<198>": 151873,
115
+ "<199>": 151874,
116
+ "<19>": 151694,
117
+ "<1>": 151676,
118
+ "<200>": 151875,
119
+ "<201>": 151876,
120
+ "<202>": 151877,
121
+ "<203>": 151878,
122
+ "<204>": 151879,
123
+ "<205>": 151880,
124
+ "<206>": 151881,
125
+ "<207>": 151882,
126
+ "<208>": 151883,
127
+ "<209>": 151884,
128
+ "<20>": 151695,
129
+ "<210>": 151885,
130
+ "<211>": 151886,
131
+ "<212>": 151887,
132
+ "<213>": 151888,
133
+ "<214>": 151889,
134
+ "<215>": 151890,
135
+ "<216>": 151891,
136
+ "<217>": 151892,
137
+ "<218>": 151893,
138
+ "<219>": 151894,
139
+ "<21>": 151696,
140
+ "<220>": 151895,
141
+ "<221>": 151896,
142
+ "<222>": 151897,
143
+ "<223>": 151898,
144
+ "<224>": 151899,
145
+ "<225>": 151900,
146
+ "<226>": 151901,
147
+ "<227>": 151902,
148
+ "<228>": 151903,
149
+ "<229>": 151904,
150
+ "<22>": 151697,
151
+ "<230>": 151905,
152
+ "<231>": 151906,
153
+ "<232>": 151907,
154
+ "<233>": 151908,
155
+ "<234>": 151909,
156
+ "<235>": 151910,
157
+ "<236>": 151911,
158
+ "<237>": 151912,
159
+ "<238>": 151913,
160
+ "<239>": 151914,
161
+ "<23>": 151698,
162
+ "<240>": 151915,
163
+ "<241>": 151916,
164
+ "<242>": 151917,
165
+ "<243>": 151918,
166
+ "<244>": 151919,
167
+ "<245>": 151920,
168
+ "<246>": 151921,
169
+ "<247>": 151922,
170
+ "<248>": 151923,
171
+ "<249>": 151924,
172
+ "<24>": 151699,
173
+ "<250>": 151925,
174
+ "<251>": 151926,
175
+ "<252>": 151927,
176
+ "<253>": 151928,
177
+ "<254>": 151929,
178
+ "<255>": 151930,
179
+ "<256>": 151931,
180
+ "<257>": 151932,
181
+ "<258>": 151933,
182
+ "<259>": 151934,
183
+ "<25>": 151700,
184
+ "<260>": 151935,
185
+ "<261>": 151936,
186
+ "<262>": 151937,
187
+ "<263>": 151938,
188
+ "<264>": 151939,
189
+ "<265>": 151940,
190
+ "<266>": 151941,
191
+ "<267>": 151942,
192
+ "<268>": 151943,
193
+ "<269>": 151944,
194
+ "<26>": 151701,
195
+ "<270>": 151945,
196
+ "<271>": 151946,
197
+ "<272>": 151947,
198
+ "<273>": 151948,
199
+ "<274>": 151949,
200
+ "<275>": 151950,
201
+ "<276>": 151951,
202
+ "<277>": 151952,
203
+ "<278>": 151953,
204
+ "<279>": 151954,
205
+ "<27>": 151702,
206
+ "<280>": 151955,
207
+ "<281>": 151956,
208
+ "<282>": 151957,
209
+ "<283>": 151958,
210
+ "<284>": 151959,
211
+ "<285>": 151960,
212
+ "<286>": 151961,
213
+ "<287>": 151962,
214
+ "<288>": 151963,
215
+ "<289>": 151964,
216
+ "<28>": 151703,
217
+ "<290>": 151965,
218
+ "<291>": 151966,
219
+ "<292>": 151967,
220
+ "<293>": 151968,
221
+ "<294>": 151969,
222
+ "<295>": 151970,
223
+ "<296>": 151971,
224
+ "<297>": 151972,
225
+ "<298>": 151973,
226
+ "<299>": 151974,
227
+ "<29>": 151704,
228
+ "<2>": 151677,
229
+ "<300>": 151975,
230
+ "<301>": 151976,
231
+ "<302>": 151977,
232
+ "<303>": 151978,
233
+ "<304>": 151979,
234
+ "<305>": 151980,
235
+ "<306>": 151981,
236
+ "<307>": 151982,
237
+ "<308>": 151983,
238
+ "<309>": 151984,
239
+ "<30>": 151705,
240
+ "<310>": 151985,
241
+ "<311>": 151986,
242
+ "<312>": 151987,
243
+ "<313>": 151988,
244
+ "<314>": 151989,
245
+ "<315>": 151990,
246
+ "<316>": 151991,
247
+ "<317>": 151992,
248
+ "<318>": 151993,
249
+ "<319>": 151994,
250
+ "<31>": 151706,
251
+ "<320>": 151995,
252
+ "<321>": 151996,
253
+ "<322>": 151997,
254
+ "<323>": 151998,
255
+ "<324>": 151999,
256
+ "<325>": 152000,
257
+ "<326>": 152001,
258
+ "<327>": 152002,
259
+ "<328>": 152003,
260
+ "<329>": 152004,
261
+ "<32>": 151707,
262
+ "<330>": 152005,
263
+ "<331>": 152006,
264
+ "<332>": 152007,
265
+ "<333>": 152008,
266
+ "<334>": 152009,
267
+ "<335>": 152010,
268
+ "<336>": 152011,
269
+ "<337>": 152012,
270
+ "<338>": 152013,
271
+ "<339>": 152014,
272
+ "<33>": 151708,
273
+ "<340>": 152015,
274
+ "<341>": 152016,
275
+ "<342>": 152017,
276
+ "<343>": 152018,
277
+ "<344>": 152019,
278
+ "<345>": 152020,
279
+ "<346>": 152021,
280
+ "<347>": 152022,
281
+ "<348>": 152023,
282
+ "<349>": 152024,
283
+ "<34>": 151709,
284
+ "<350>": 152025,
285
+ "<351>": 152026,
286
+ "<352>": 152027,
287
+ "<353>": 152028,
288
+ "<354>": 152029,
289
+ "<355>": 152030,
290
+ "<356>": 152031,
291
+ "<357>": 152032,
292
+ "<358>": 152033,
293
+ "<359>": 152034,
294
+ "<35>": 151710,
295
+ "<360>": 152035,
296
+ "<361>": 152036,
297
+ "<362>": 152037,
298
+ "<363>": 152038,
299
+ "<364>": 152039,
300
+ "<365>": 152040,
301
+ "<366>": 152041,
302
+ "<367>": 152042,
303
+ "<368>": 152043,
304
+ "<369>": 152044,
305
+ "<36>": 151711,
306
+ "<370>": 152045,
307
+ "<371>": 152046,
308
+ "<372>": 152047,
309
+ "<373>": 152048,
310
+ "<374>": 152049,
311
+ "<375>": 152050,
312
+ "<376>": 152051,
313
+ "<377>": 152052,
314
+ "<378>": 152053,
315
+ "<379>": 152054,
316
+ "<37>": 151712,
317
+ "<380>": 152055,
318
+ "<381>": 152056,
319
+ "<382>": 152057,
320
+ "<383>": 152058,
321
+ "<384>": 152059,
322
+ "<385>": 152060,
323
+ "<386>": 152061,
324
+ "<387>": 152062,
325
+ "<388>": 152063,
326
+ "<389>": 152064,
327
+ "<38>": 151713,
328
+ "<390>": 152065,
329
+ "<391>": 152066,
330
+ "<392>": 152067,
331
+ "<393>": 152068,
332
+ "<394>": 152069,
333
+ "<395>": 152070,
334
+ "<396>": 152071,
335
+ "<397>": 152072,
336
+ "<398>": 152073,
337
+ "<399>": 152074,
338
+ "<39>": 151714,
339
+ "<3>": 151678,
340
+ "<400>": 152075,
341
+ "<401>": 152076,
342
+ "<402>": 152077,
343
+ "<403>": 152078,
344
+ "<404>": 152079,
345
+ "<405>": 152080,
346
+ "<406>": 152081,
347
+ "<407>": 152082,
348
+ "<408>": 152083,
349
+ "<409>": 152084,
350
+ "<40>": 151715,
351
+ "<410>": 152085,
352
+ "<411>": 152086,
353
+ "<412>": 152087,
354
+ "<413>": 152088,
355
+ "<414>": 152089,
356
+ "<415>": 152090,
357
+ "<416>": 152091,
358
+ "<417>": 152092,
359
+ "<418>": 152093,
360
+ "<419>": 152094,
361
+ "<41>": 151716,
362
+ "<420>": 152095,
363
+ "<421>": 152096,
364
+ "<422>": 152097,
365
+ "<423>": 152098,
366
+ "<424>": 152099,
367
+ "<425>": 152100,
368
+ "<426>": 152101,
369
+ "<427>": 152102,
370
+ "<428>": 152103,
371
+ "<429>": 152104,
372
+ "<42>": 151717,
373
+ "<430>": 152105,
374
+ "<431>": 152106,
375
+ "<432>": 152107,
376
+ "<433>": 152108,
377
+ "<434>": 152109,
378
+ "<435>": 152110,
379
+ "<436>": 152111,
380
+ "<437>": 152112,
381
+ "<438>": 152113,
382
+ "<439>": 152114,
383
+ "<43>": 151718,
384
+ "<440>": 152115,
385
+ "<441>": 152116,
386
+ "<442>": 152117,
387
+ "<443>": 152118,
388
+ "<444>": 152119,
389
+ "<445>": 152120,
390
+ "<446>": 152121,
391
+ "<447>": 152122,
392
+ "<448>": 152123,
393
+ "<449>": 152124,
394
+ "<44>": 151719,
395
+ "<450>": 152125,
396
+ "<451>": 152126,
397
+ "<452>": 152127,
398
+ "<453>": 152128,
399
+ "<454>": 152129,
400
+ "<455>": 152130,
401
+ "<456>": 152131,
402
+ "<457>": 152132,
403
+ "<458>": 152133,
404
+ "<459>": 152134,
405
+ "<45>": 151720,
406
+ "<460>": 152135,
407
+ "<461>": 152136,
408
+ "<462>": 152137,
409
+ "<463>": 152138,
410
+ "<464>": 152139,
411
+ "<465>": 152140,
412
+ "<466>": 152141,
413
+ "<467>": 152142,
414
+ "<468>": 152143,
415
+ "<469>": 152144,
416
+ "<46>": 151721,
417
+ "<470>": 152145,
418
+ "<471>": 152146,
419
+ "<472>": 152147,
420
+ "<473>": 152148,
421
+ "<474>": 152149,
422
+ "<475>": 152150,
423
+ "<476>": 152151,
424
+ "<477>": 152152,
425
+ "<478>": 152153,
426
+ "<479>": 152154,
427
+ "<47>": 151722,
428
+ "<480>": 152155,
429
+ "<481>": 152156,
430
+ "<482>": 152157,
431
+ "<483>": 152158,
432
+ "<484>": 152159,
433
+ "<485>": 152160,
434
+ "<486>": 152161,
435
+ "<487>": 152162,
436
+ "<488>": 152163,
437
+ "<489>": 152164,
438
+ "<48>": 151723,
439
+ "<490>": 152165,
440
+ "<491>": 152166,
441
+ "<492>": 152167,
442
+ "<493>": 152168,
443
+ "<494>": 152169,
444
+ "<495>": 152170,
445
+ "<496>": 152171,
446
+ "<497>": 152172,
447
+ "<498>": 152173,
448
+ "<499>": 152174,
449
+ "<49>": 151724,
450
+ "<4>": 151679,
451
+ "<500>": 152175,
452
+ "<501>": 152176,
453
+ "<502>": 152177,
454
+ "<503>": 152178,
455
+ "<504>": 152179,
456
+ "<505>": 152180,
457
+ "<506>": 152181,
458
+ "<507>": 152182,
459
+ "<508>": 152183,
460
+ "<509>": 152184,
461
+ "<50>": 151725,
462
+ "<510>": 152185,
463
+ "<511>": 152186,
464
+ "<512>": 152187,
465
+ "<513>": 152188,
466
+ "<514>": 152189,
467
+ "<515>": 152190,
468
+ "<516>": 152191,
469
+ "<517>": 152192,
470
+ "<518>": 152193,
471
+ "<519>": 152194,
472
+ "<51>": 151726,
473
+ "<520>": 152195,
474
+ "<521>": 152196,
475
+ "<522>": 152197,
476
+ "<523>": 152198,
477
+ "<524>": 152199,
478
+ "<525>": 152200,
479
+ "<526>": 152201,
480
+ "<527>": 152202,
481
+ "<528>": 152203,
482
+ "<529>": 152204,
483
+ "<52>": 151727,
484
+ "<530>": 152205,
485
+ "<531>": 152206,
486
+ "<532>": 152207,
487
+ "<533>": 152208,
488
+ "<534>": 152209,
489
+ "<535>": 152210,
490
+ "<536>": 152211,
491
+ "<537>": 152212,
492
+ "<538>": 152213,
493
+ "<539>": 152214,
494
+ "<53>": 151728,
495
+ "<540>": 152215,
496
+ "<541>": 152216,
497
+ "<542>": 152217,
498
+ "<543>": 152218,
499
+ "<544>": 152219,
500
+ "<545>": 152220,
501
+ "<546>": 152221,
502
+ "<547>": 152222,
503
+ "<548>": 152223,
504
+ "<549>": 152224,
505
+ "<54>": 151729,
506
+ "<550>": 152225,
507
+ "<551>": 152226,
508
+ "<552>": 152227,
509
+ "<553>": 152228,
510
+ "<554>": 152229,
511
+ "<555>": 152230,
512
+ "<556>": 152231,
513
+ "<557>": 152232,
514
+ "<558>": 152233,
515
+ "<559>": 152234,
516
+ "<55>": 151730,
517
+ "<560>": 152235,
518
+ "<561>": 152236,
519
+ "<562>": 152237,
520
+ "<563>": 152238,
521
+ "<564>": 152239,
522
+ "<565>": 152240,
523
+ "<566>": 152241,
524
+ "<567>": 152242,
525
+ "<568>": 152243,
526
+ "<569>": 152244,
527
+ "<56>": 151731,
528
+ "<570>": 152245,
529
+ "<571>": 152246,
530
+ "<572>": 152247,
531
+ "<573>": 152248,
532
+ "<574>": 152249,
533
+ "<575>": 152250,
534
+ "<576>": 152251,
535
+ "<577>": 152252,
536
+ "<578>": 152253,
537
+ "<579>": 152254,
538
+ "<57>": 151732,
539
+ "<580>": 152255,
540
+ "<581>": 152256,
541
+ "<582>": 152257,
542
+ "<583>": 152258,
543
+ "<584>": 152259,
544
+ "<585>": 152260,
545
+ "<586>": 152261,
546
+ "<587>": 152262,
547
+ "<588>": 152263,
548
+ "<589>": 152264,
549
+ "<58>": 151733,
550
+ "<590>": 152265,
551
+ "<591>": 152266,
552
+ "<592>": 152267,
553
+ "<593>": 152268,
554
+ "<594>": 152269,
555
+ "<595>": 152270,
556
+ "<596>": 152271,
557
+ "<597>": 152272,
558
+ "<598>": 152273,
559
+ "<599>": 152274,
560
+ "<59>": 151734,
561
+ "<5>": 151680,
562
+ "<600>": 152275,
563
+ "<601>": 152276,
564
+ "<602>": 152277,
565
+ "<603>": 152278,
566
+ "<604>": 152279,
567
+ "<605>": 152280,
568
+ "<606>": 152281,
569
+ "<607>": 152282,
570
+ "<608>": 152283,
571
+ "<609>": 152284,
572
+ "<60>": 151735,
573
+ "<610>": 152285,
574
+ "<611>": 152286,
575
+ "<612>": 152287,
576
+ "<613>": 152288,
577
+ "<614>": 152289,
578
+ "<615>": 152290,
579
+ "<616>": 152291,
580
+ "<617>": 152292,
581
+ "<618>": 152293,
582
+ "<619>": 152294,
583
+ "<61>": 151736,
584
+ "<620>": 152295,
585
+ "<621>": 152296,
586
+ "<622>": 152297,
587
+ "<623>": 152298,
588
+ "<624>": 152299,
589
+ "<625>": 152300,
590
+ "<626>": 152301,
591
+ "<627>": 152302,
592
+ "<628>": 152303,
593
+ "<629>": 152304,
594
+ "<62>": 151737,
595
+ "<630>": 152305,
596
+ "<631>": 152306,
597
+ "<632>": 152307,
598
+ "<633>": 152308,
599
+ "<634>": 152309,
600
+ "<635>": 152310,
601
+ "<636>": 152311,
602
+ "<637>": 152312,
603
+ "<638>": 152313,
604
+ "<639>": 152314,
605
+ "<63>": 151738,
606
+ "<640>": 152315,
607
+ "<641>": 152316,
608
+ "<642>": 152317,
609
+ "<643>": 152318,
610
+ "<644>": 152319,
611
+ "<645>": 152320,
612
+ "<646>": 152321,
613
+ "<647>": 152322,
614
+ "<648>": 152323,
615
+ "<649>": 152324,
616
+ "<64>": 151739,
617
+ "<650>": 152325,
618
+ "<651>": 152326,
619
+ "<652>": 152327,
620
+ "<653>": 152328,
621
+ "<654>": 152329,
622
+ "<655>": 152330,
623
+ "<656>": 152331,
624
+ "<657>": 152332,
625
+ "<658>": 152333,
626
+ "<659>": 152334,
627
+ "<65>": 151740,
628
+ "<660>": 152335,
629
+ "<661>": 152336,
630
+ "<662>": 152337,
631
+ "<663>": 152338,
632
+ "<664>": 152339,
633
+ "<665>": 152340,
634
+ "<666>": 152341,
635
+ "<667>": 152342,
636
+ "<668>": 152343,
637
+ "<669>": 152344,
638
+ "<66>": 151741,
639
+ "<670>": 152345,
640
+ "<671>": 152346,
641
+ "<672>": 152347,
642
+ "<673>": 152348,
643
+ "<674>": 152349,
644
+ "<675>": 152350,
645
+ "<676>": 152351,
646
+ "<677>": 152352,
647
+ "<678>": 152353,
648
+ "<679>": 152354,
649
+ "<67>": 151742,
650
+ "<680>": 152355,
651
+ "<681>": 152356,
652
+ "<682>": 152357,
653
+ "<683>": 152358,
654
+ "<684>": 152359,
655
+ "<685>": 152360,
656
+ "<686>": 152361,
657
+ "<687>": 152362,
658
+ "<688>": 152363,
659
+ "<689>": 152364,
660
+ "<68>": 151743,
661
+ "<690>": 152365,
662
+ "<691>": 152366,
663
+ "<692>": 152367,
664
+ "<693>": 152368,
665
+ "<694>": 152369,
666
+ "<695>": 152370,
667
+ "<696>": 152371,
668
+ "<697>": 152372,
669
+ "<698>": 152373,
670
+ "<699>": 152374,
671
+ "<69>": 151744,
672
+ "<6>": 151681,
673
+ "<700>": 152375,
674
+ "<701>": 152376,
675
+ "<702>": 152377,
676
+ "<703>": 152378,
677
+ "<704>": 152379,
678
+ "<705>": 152380,
679
+ "<706>": 152381,
680
+ "<707>": 152382,
681
+ "<708>": 152383,
682
+ "<709>": 152384,
683
+ "<70>": 151745,
684
+ "<710>": 152385,
685
+ "<711>": 152386,
686
+ "<712>": 152387,
687
+ "<713>": 152388,
688
+ "<714>": 152389,
689
+ "<715>": 152390,
690
+ "<716>": 152391,
691
+ "<717>": 152392,
692
+ "<718>": 152393,
693
+ "<719>": 152394,
694
+ "<71>": 151746,
695
+ "<720>": 152395,
696
+ "<721>": 152396,
697
+ "<722>": 152397,
698
+ "<723>": 152398,
699
+ "<724>": 152399,
700
+ "<725>": 152400,
701
+ "<726>": 152401,
702
+ "<727>": 152402,
703
+ "<728>": 152403,
704
+ "<729>": 152404,
705
+ "<72>": 151747,
706
+ "<730>": 152405,
707
+ "<731>": 152406,
708
+ "<732>": 152407,
709
+ "<733>": 152408,
710
+ "<734>": 152409,
711
+ "<735>": 152410,
712
+ "<736>": 152411,
713
+ "<737>": 152412,
714
+ "<738>": 152413,
715
+ "<739>": 152414,
716
+ "<73>": 151748,
717
+ "<740>": 152415,
718
+ "<741>": 152416,
719
+ "<742>": 152417,
720
+ "<743>": 152418,
721
+ "<744>": 152419,
722
+ "<745>": 152420,
723
+ "<746>": 152421,
724
+ "<747>": 152422,
725
+ "<748>": 152423,
726
+ "<749>": 152424,
727
+ "<74>": 151749,
728
+ "<750>": 152425,
729
+ "<751>": 152426,
730
+ "<752>": 152427,
731
+ "<753>": 152428,
732
+ "<754>": 152429,
733
+ "<755>": 152430,
734
+ "<756>": 152431,
735
+ "<757>": 152432,
736
+ "<758>": 152433,
737
+ "<759>": 152434,
738
+ "<75>": 151750,
739
+ "<760>": 152435,
740
+ "<761>": 152436,
741
+ "<762>": 152437,
742
+ "<763>": 152438,
743
+ "<764>": 152439,
744
+ "<765>": 152440,
745
+ "<766>": 152441,
746
+ "<767>": 152442,
747
+ "<768>": 152443,
748
+ "<769>": 152444,
749
+ "<76>": 151751,
750
+ "<770>": 152445,
751
+ "<771>": 152446,
752
+ "<772>": 152447,
753
+ "<773>": 152448,
754
+ "<774>": 152449,
755
+ "<775>": 152450,
756
+ "<776>": 152451,
757
+ "<777>": 152452,
758
+ "<778>": 152453,
759
+ "<779>": 152454,
760
+ "<77>": 151752,
761
+ "<780>": 152455,
762
+ "<781>": 152456,
763
+ "<782>": 152457,
764
+ "<783>": 152458,
765
+ "<784>": 152459,
766
+ "<785>": 152460,
767
+ "<786>": 152461,
768
+ "<787>": 152462,
769
+ "<788>": 152463,
770
+ "<789>": 152464,
771
+ "<78>": 151753,
772
+ "<790>": 152465,
773
+ "<791>": 152466,
774
+ "<792>": 152467,
775
+ "<793>": 152468,
776
+ "<794>": 152469,
777
+ "<795>": 152470,
778
+ "<796>": 152471,
779
+ "<797>": 152472,
780
+ "<798>": 152473,
781
+ "<799>": 152474,
782
+ "<79>": 151754,
783
+ "<7>": 151682,
784
+ "<800>": 152475,
785
+ "<801>": 152476,
786
+ "<802>": 152477,
787
+ "<803>": 152478,
788
+ "<804>": 152479,
789
+ "<805>": 152480,
790
+ "<806>": 152481,
791
+ "<807>": 152482,
792
+ "<808>": 152483,
793
+ "<809>": 152484,
794
+ "<80>": 151755,
795
+ "<810>": 152485,
796
+ "<811>": 152486,
797
+ "<812>": 152487,
798
+ "<813>": 152488,
799
+ "<814>": 152489,
800
+ "<815>": 152490,
801
+ "<816>": 152491,
802
+ "<817>": 152492,
803
+ "<818>": 152493,
804
+ "<819>": 152494,
805
+ "<81>": 151756,
806
+ "<820>": 152495,
807
+ "<821>": 152496,
808
+ "<822>": 152497,
809
+ "<823>": 152498,
810
+ "<824>": 152499,
811
+ "<825>": 152500,
812
+ "<826>": 152501,
813
+ "<827>": 152502,
814
+ "<828>": 152503,
815
+ "<829>": 152504,
816
+ "<82>": 151757,
817
+ "<830>": 152505,
818
+ "<831>": 152506,
819
+ "<832>": 152507,
820
+ "<833>": 152508,
821
+ "<834>": 152509,
822
+ "<835>": 152510,
823
+ "<836>": 152511,
824
+ "<837>": 152512,
825
+ "<838>": 152513,
826
+ "<839>": 152514,
827
+ "<83>": 151758,
828
+ "<840>": 152515,
829
+ "<841>": 152516,
830
+ "<842>": 152517,
831
+ "<843>": 152518,
832
+ "<844>": 152519,
833
+ "<845>": 152520,
834
+ "<846>": 152521,
835
+ "<847>": 152522,
836
+ "<848>": 152523,
837
+ "<849>": 152524,
838
+ "<84>": 151759,
839
+ "<850>": 152525,
840
+ "<851>": 152526,
841
+ "<852>": 152527,
842
+ "<853>": 152528,
843
+ "<854>": 152529,
844
+ "<855>": 152530,
845
+ "<856>": 152531,
846
+ "<857>": 152532,
847
+ "<858>": 152533,
848
+ "<859>": 152534,
849
+ "<85>": 151760,
850
+ "<860>": 152535,
851
+ "<861>": 152536,
852
+ "<862>": 152537,
853
+ "<863>": 152538,
854
+ "<864>": 152539,
855
+ "<865>": 152540,
856
+ "<866>": 152541,
857
+ "<867>": 152542,
858
+ "<868>": 152543,
859
+ "<869>": 152544,
860
+ "<86>": 151761,
861
+ "<870>": 152545,
862
+ "<871>": 152546,
863
+ "<872>": 152547,
864
+ "<873>": 152548,
865
+ "<874>": 152549,
866
+ "<875>": 152550,
867
+ "<876>": 152551,
868
+ "<877>": 152552,
869
+ "<878>": 152553,
870
+ "<879>": 152554,
871
+ "<87>": 151762,
872
+ "<880>": 152555,
873
+ "<881>": 152556,
874
+ "<882>": 152557,
875
+ "<883>": 152558,
876
+ "<884>": 152559,
877
+ "<885>": 152560,
878
+ "<886>": 152561,
879
+ "<887>": 152562,
880
+ "<888>": 152563,
881
+ "<889>": 152564,
882
+ "<88>": 151763,
883
+ "<890>": 152565,
884
+ "<891>": 152566,
885
+ "<892>": 152567,
886
+ "<893>": 152568,
887
+ "<894>": 152569,
888
+ "<895>": 152570,
889
+ "<896>": 152571,
890
+ "<897>": 152572,
891
+ "<898>": 152573,
892
+ "<899>": 152574,
893
+ "<89>": 151764,
894
+ "<8>": 151683,
895
+ "<900>": 152575,
896
+ "<901>": 152576,
897
+ "<902>": 152577,
898
+ "<903>": 152578,
899
+ "<904>": 152579,
900
+ "<905>": 152580,
901
+ "<906>": 152581,
902
+ "<907>": 152582,
903
+ "<908>": 152583,
904
+ "<909>": 152584,
905
+ "<90>": 151765,
906
+ "<910>": 152585,
907
+ "<911>": 152586,
908
+ "<912>": 152587,
909
+ "<913>": 152588,
910
+ "<914>": 152589,
911
+ "<915>": 152590,
912
+ "<916>": 152591,
913
+ "<917>": 152592,
914
+ "<918>": 152593,
915
+ "<919>": 152594,
916
+ "<91>": 151766,
917
+ "<920>": 152595,
918
+ "<921>": 152596,
919
+ "<922>": 152597,
920
+ "<923>": 152598,
921
+ "<924>": 152599,
922
+ "<925>": 152600,
923
+ "<926>": 152601,
924
+ "<927>": 152602,
925
+ "<928>": 152603,
926
+ "<929>": 152604,
927
+ "<92>": 151767,
928
+ "<930>": 152605,
929
+ "<931>": 152606,
930
+ "<932>": 152607,
931
+ "<933>": 152608,
932
+ "<934>": 152609,
933
+ "<935>": 152610,
934
+ "<936>": 152611,
935
+ "<937>": 152612,
936
+ "<938>": 152613,
937
+ "<939>": 152614,
938
+ "<93>": 151768,
939
+ "<940>": 152615,
940
+ "<941>": 152616,
941
+ "<942>": 152617,
942
+ "<943>": 152618,
943
+ "<944>": 152619,
944
+ "<945>": 152620,
945
+ "<946>": 152621,
946
+ "<947>": 152622,
947
+ "<948>": 152623,
948
+ "<949>": 152624,
949
+ "<94>": 151769,
950
+ "<950>": 152625,
951
+ "<951>": 152626,
952
+ "<952>": 152627,
953
+ "<953>": 152628,
954
+ "<954>": 152629,
955
+ "<955>": 152630,
956
+ "<956>": 152631,
957
+ "<957>": 152632,
958
+ "<958>": 152633,
959
+ "<959>": 152634,
960
+ "<95>": 151770,
961
+ "<960>": 152635,
962
+ "<961>": 152636,
963
+ "<962>": 152637,
964
+ "<963>": 152638,
965
+ "<964>": 152639,
966
+ "<965>": 152640,
967
+ "<966>": 152641,
968
+ "<967>": 152642,
969
+ "<968>": 152643,
970
+ "<969>": 152644,
971
+ "<96>": 151771,
972
+ "<970>": 152645,
973
+ "<971>": 152646,
974
+ "<972>": 152647,
975
+ "<973>": 152648,
976
+ "<974>": 152649,
977
+ "<975>": 152650,
978
+ "<976>": 152651,
979
+ "<977>": 152652,
980
+ "<978>": 152653,
981
+ "<979>": 152654,
982
+ "<97>": 151772,
983
+ "<980>": 152655,
984
+ "<981>": 152656,
985
+ "<982>": 152657,
986
+ "<983>": 152658,
987
+ "<984>": 152659,
988
+ "<985>": 152660,
989
+ "<986>": 152661,
990
+ "<987>": 152662,
991
+ "<988>": 152663,
992
+ "<989>": 152664,
993
+ "<98>": 151773,
994
+ "<990>": 152665,
995
+ "<991>": 152666,
996
+ "<992>": 152667,
997
+ "<993>": 152668,
998
+ "<994>": 152669,
999
+ "<995>": 152670,
1000
+ "<996>": 152671,
1001
+ "<997>": 152672,
1002
+ "<998>": 152673,
1003
+ "<999>": 152674,
1004
+ "<99>": 151774,
1005
+ "<9>": 151684,
1006
+ "<FWD>": 151671,
1007
+ "<LEFT>": 151672,
1008
+ "<RIGHT>": 151673,
1009
+ "<STOP>": 151674,
1010
+ "<action>": 151669,
1011
+ "<think>": 151667,
1012
+ "<tool_call>": 151657,
1013
+ "<tool_response>": 151665,
1014
+ "<|box_end|>": 151649,
1015
+ "<|box_start|>": 151648,
1016
+ "<|endoftext|>": 151643,
1017
+ "<|file_sep|>": 151664,
1018
+ "<|fim_middle|>": 151660,
1019
+ "<|fim_pad|>": 151662,
1020
+ "<|fim_prefix|>": 151659,
1021
+ "<|fim_suffix|>": 151661,
1022
+ "<|im_end|>": 151645,
1023
+ "<|im_start|>": 151644,
1024
+ "<|image_pad|>": 151655,
1025
+ "<|object_ref_end|>": 151647,
1026
+ "<|object_ref_start|>": 151646,
1027
+ "<|quad_end|>": 151651,
1028
+ "<|quad_start|>": 151650,
1029
+ "<|repo_name|>": 151663,
1030
+ "<|video_pad|>": 151656,
1031
+ "<|vision_end|>": 151653,
1032
+ "<|vision_pad|>": 151654,
1033
+ "<|vision_start|>": 151652
1034
+ }
chat_template.jinja ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {%- if tools %}
2
+ {{- '<|im_start|>system\n' }}
3
+ {%- if messages[0].role == 'system' %}
4
+ {%- if messages[0].content is string %}
5
+ {{- messages[0].content }}
6
+ {%- else %}
7
+ {%- for content in messages[0].content %}
8
+ {%- if 'text' in content %}
9
+ {{- content.text }}
10
+ {%- endif %}
11
+ {%- endfor %}
12
+ {%- endif %}
13
+ {{- '\n\n' }}
14
+ {%- endif %}
15
+ {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
16
+ {%- for tool in tools %}
17
+ {{- "\n" }}
18
+ {{- tool | tojson }}
19
+ {%- endfor %}
20
+ {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
21
+ {%- else %}
22
+ {%- if messages[0].role == 'system' %}
23
+ {{- '<|im_start|>system\n' }}
24
+ {%- if messages[0].content is string %}
25
+ {{- messages[0].content }}
26
+ {%- else %}
27
+ {%- for content in messages[0].content %}
28
+ {%- if 'text' in content %}
29
+ {{- content.text }}
30
+ {%- endif %}
31
+ {%- endfor %}
32
+ {%- endif %}
33
+ {{- '<|im_end|>\n' }}
34
+ {%- endif %}
35
+ {%- endif %}
36
+ {%- set image_count = namespace(value=0) %}
37
+ {%- set video_count = namespace(value=0) %}
38
+ {%- for message in messages %}
39
+ {%- if message.role == "user" %}
40
+ {{- '<|im_start|>' + message.role + '\n' }}
41
+ {%- if message.content is string %}
42
+ {{- message.content }}
43
+ {%- else %}
44
+ {%- for content in message.content %}
45
+ {%- if content.type == 'image' or 'image' in content or 'image_url' in content %}
46
+ {%- set image_count.value = image_count.value + 1 %}
47
+ {%- if add_vision_id %}Picture {{ image_count.value }}: {% endif -%}
48
+ <|vision_start|><|image_pad|><|vision_end|>
49
+ {%- elif content.type == 'video' or 'video' in content %}
50
+ {%- set video_count.value = video_count.value + 1 %}
51
+ {%- if add_vision_id %}Video {{ video_count.value }}: {% endif -%}
52
+ <|vision_start|><|video_pad|><|vision_end|>
53
+ {%- elif 'text' in content %}
54
+ {{- content.text }}
55
+ {%- endif %}
56
+ {%- endfor %}
57
+ {%- endif %}
58
+ {{- '<|im_end|>\n' }}
59
+ {%- elif message.role == "assistant" %}
60
+ {{- '<|im_start|>' + message.role + '\n' }}
61
+ {%- if message.content is string %}
62
+ {{- message.content }}
63
+ {%- else %}
64
+ {%- for content_item in message.content %}
65
+ {%- if 'text' in content_item %}
66
+ {{- content_item.text }}
67
+ {%- endif %}
68
+ {%- endfor %}
69
+ {%- endif %}
70
+ {%- if message.tool_calls %}
71
+ {%- for tool_call in message.tool_calls %}
72
+ {%- if (loop.first and message.content) or (not loop.first) %}
73
+ {{- '\n' }}
74
+ {%- endif %}
75
+ {%- if tool_call.function %}
76
+ {%- set tool_call = tool_call.function %}
77
+ {%- endif %}
78
+ {{- '<tool_call>\n{"name": "' }}
79
+ {{- tool_call.name }}
80
+ {{- '", "arguments": ' }}
81
+ {%- if tool_call.arguments is string %}
82
+ {{- tool_call.arguments }}
83
+ {%- else %}
84
+ {{- tool_call.arguments | tojson }}
85
+ {%- endif %}
86
+ {{- '}\n</tool_call>' }}
87
+ {%- endfor %}
88
+ {%- endif %}
89
+ {{- '<|im_end|>\n' }}
90
+ {%- elif message.role == "tool" %}
91
+ {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
92
+ {{- '<|im_start|>user' }}
93
+ {%- endif %}
94
+ {{- '\n<tool_response>\n' }}
95
+ {%- if message.content is string %}
96
+ {{- message.content }}
97
+ {%- else %}
98
+ {%- for content in message.content %}
99
+ {%- if content.type == 'image' or 'image' in content or 'image_url' in content %}
100
+ {%- set image_count.value = image_count.value + 1 %}
101
+ {%- if add_vision_id %}Picture {{ image_count.value }}: {% endif -%}
102
+ <|vision_start|><|image_pad|><|vision_end|>
103
+ {%- elif content.type == 'video' or 'video' in content %}
104
+ {%- set video_count.value = video_count.value + 1 %}
105
+ {%- if add_vision_id %}Video {{ video_count.value }}: {% endif -%}
106
+ <|vision_start|><|video_pad|><|vision_end|>
107
+ {%- elif 'text' in content %}
108
+ {{- content.text }}
109
+ {%- endif %}
110
+ {%- endfor %}
111
+ {%- endif %}
112
+ {{- '\n</tool_response>' }}
113
+ {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
114
+ {{- '<|im_end|>\n' }}
115
+ {%- endif %}
116
+ {%- endif %}
117
+ {%- endfor %}
118
+ {%- if add_generation_prompt %}
119
+ {{- '<|im_start|>assistant\n' }}
120
+ {%- endif %}
config.json ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen3VLForConditionalGeneration"
4
+ ],
5
+ "dtype": "float32",
6
+ "eos_token_id": 151645,
7
+ "hidden_size": 4096,
8
+ "image_token_id": 151655,
9
+ "model_type": "qwen3_vl",
10
+ "pad_token_id": 151643,
11
+ "text_config": {
12
+ "attention_bias": false,
13
+ "attention_dropout": 0.0,
14
+ "bos_token_id": 151643,
15
+ "dtype": "float32",
16
+ "eos_token_id": 151645,
17
+ "head_dim": 128,
18
+ "hidden_act": "silu",
19
+ "hidden_size": 4096,
20
+ "initializer_range": 0.02,
21
+ "intermediate_size": 12288,
22
+ "max_position_embeddings": 262144,
23
+ "model_type": "qwen3_vl_text",
24
+ "num_attention_heads": 32,
25
+ "num_hidden_layers": 36,
26
+ "num_key_value_heads": 8,
27
+ "rms_norm_eps": 1e-06,
28
+ "rope_scaling": {
29
+ "mrope_interleaved": true,
30
+ "mrope_section": [
31
+ 24,
32
+ 20,
33
+ 20
34
+ ],
35
+ "rope_type": "default"
36
+ },
37
+ "rope_theta": 5000000,
38
+ "use_cache": true,
39
+ "vocab_size": 152675
40
+ },
41
+ "tie_word_embeddings": false,
42
+ "transformers_version": "4.57.6",
43
+ "use_cache": true,
44
+ "video_token_id": 151656,
45
+ "vision_config": {
46
+ "deepstack_visual_indexes": [
47
+ 8,
48
+ 16,
49
+ 24
50
+ ],
51
+ "depth": 27,
52
+ "dtype": "float32",
53
+ "hidden_act": "gelu_pytorch_tanh",
54
+ "hidden_size": 1152,
55
+ "in_channels": 3,
56
+ "initializer_range": 0.02,
57
+ "intermediate_size": 4304,
58
+ "model_type": "qwen3_vl",
59
+ "num_heads": 16,
60
+ "num_position_embeddings": 2304,
61
+ "out_hidden_size": 4096,
62
+ "patch_size": 16,
63
+ "spatial_merge_size": 2,
64
+ "temporal_patch_size": 2
65
+ },
66
+ "vision_end_token_id": 151653,
67
+ "vision_start_token_id": 151652
68
+ }
generation_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_sample": true,
3
+ "eos_token_id": [
4
+ 151645,
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "pad_token_id": 151643,
9
+ "temperature": 0.7,
10
+ "top_k": 20,
11
+ "top_p": 0.8,
12
+ "transformers_version": "4.57.6"
13
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:743bfd8f482856acbc7dbb6670dc7bfc80a612ec45688f597e2e52e8118eaf05
3
+ size 4983801288
model-00002-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e78e64b3bb329dc48f98157d0a9160b4f26a71e90e5e0b2c13c81c16a9b49b1f
3
+ size 4942442984
model-00003-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f856f8eb8b5d430d96dc6fb2dd900380ca7400ee1c68ac6ecbf8f010e003afe6
3
+ size 4735757584
model-00004-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d00f3db7e31dcc990fd69cd65e95fa6ebd5ca4518a3620618187574d515645d1
3
+ size 2884445424
model.safetensors.index.json ADDED
@@ -0,0 +1,758 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "total_parameters": 8773177584,
4
+ "total_size": 17546355168
5
+ },
6
+ "weight_map": {
7
+ "lm_head.weight": "model-00004-of-00004.safetensors",
8
+ "model.language_model.embed_tokens.weight": "model-00002-of-00004.safetensors",
9
+ "model.language_model.layers.0.input_layernorm.weight": "model-00002-of-00004.safetensors",
10
+ "model.language_model.layers.0.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
11
+ "model.language_model.layers.0.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
12
+ "model.language_model.layers.0.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
13
+ "model.language_model.layers.0.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
14
+ "model.language_model.layers.0.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
15
+ "model.language_model.layers.0.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
16
+ "model.language_model.layers.0.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
17
+ "model.language_model.layers.0.self_attn.q_norm.weight": "model-00002-of-00004.safetensors",
18
+ "model.language_model.layers.0.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
19
+ "model.language_model.layers.0.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
20
+ "model.language_model.layers.1.input_layernorm.weight": "model-00003-of-00004.safetensors",
21
+ "model.language_model.layers.1.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
22
+ "model.language_model.layers.1.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
23
+ "model.language_model.layers.1.mlp.up_proj.weight": "model-00004-of-00004.safetensors",
24
+ "model.language_model.layers.1.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
25
+ "model.language_model.layers.1.self_attn.k_norm.weight": "model-00004-of-00004.safetensors",
26
+ "model.language_model.layers.1.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
27
+ "model.language_model.layers.1.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
28
+ "model.language_model.layers.1.self_attn.q_norm.weight": "model-00002-of-00004.safetensors",
29
+ "model.language_model.layers.1.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
30
+ "model.language_model.layers.1.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
31
+ "model.language_model.layers.10.input_layernorm.weight": "model-00001-of-00004.safetensors",
32
+ "model.language_model.layers.10.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
33
+ "model.language_model.layers.10.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
34
+ "model.language_model.layers.10.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
35
+ "model.language_model.layers.10.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
36
+ "model.language_model.layers.10.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
37
+ "model.language_model.layers.10.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
38
+ "model.language_model.layers.10.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
39
+ "model.language_model.layers.10.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
40
+ "model.language_model.layers.10.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
41
+ "model.language_model.layers.10.self_attn.v_proj.weight": "model-00004-of-00004.safetensors",
42
+ "model.language_model.layers.11.input_layernorm.weight": "model-00001-of-00004.safetensors",
43
+ "model.language_model.layers.11.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
44
+ "model.language_model.layers.11.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
45
+ "model.language_model.layers.11.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
46
+ "model.language_model.layers.11.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
47
+ "model.language_model.layers.11.self_attn.k_norm.weight": "model-00004-of-00004.safetensors",
48
+ "model.language_model.layers.11.self_attn.k_proj.weight": "model-00004-of-00004.safetensors",
49
+ "model.language_model.layers.11.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
50
+ "model.language_model.layers.11.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
51
+ "model.language_model.layers.11.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
52
+ "model.language_model.layers.11.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
53
+ "model.language_model.layers.12.input_layernorm.weight": "model-00001-of-00004.safetensors",
54
+ "model.language_model.layers.12.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
55
+ "model.language_model.layers.12.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
56
+ "model.language_model.layers.12.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
57
+ "model.language_model.layers.12.post_attention_layernorm.weight": "model-00004-of-00004.safetensors",
58
+ "model.language_model.layers.12.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
59
+ "model.language_model.layers.12.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
60
+ "model.language_model.layers.12.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
61
+ "model.language_model.layers.12.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
62
+ "model.language_model.layers.12.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
63
+ "model.language_model.layers.12.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
64
+ "model.language_model.layers.13.input_layernorm.weight": "model-00001-of-00004.safetensors",
65
+ "model.language_model.layers.13.mlp.down_proj.weight": "model-00004-of-00004.safetensors",
66
+ "model.language_model.layers.13.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
67
+ "model.language_model.layers.13.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
68
+ "model.language_model.layers.13.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
69
+ "model.language_model.layers.13.self_attn.k_norm.weight": "model-00001-of-00004.safetensors",
70
+ "model.language_model.layers.13.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
71
+ "model.language_model.layers.13.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
72
+ "model.language_model.layers.13.self_attn.q_norm.weight": "model-00002-of-00004.safetensors",
73
+ "model.language_model.layers.13.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
74
+ "model.language_model.layers.13.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
75
+ "model.language_model.layers.14.input_layernorm.weight": "model-00003-of-00004.safetensors",
76
+ "model.language_model.layers.14.mlp.down_proj.weight": "model-00004-of-00004.safetensors",
77
+ "model.language_model.layers.14.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
78
+ "model.language_model.layers.14.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
79
+ "model.language_model.layers.14.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
80
+ "model.language_model.layers.14.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
81
+ "model.language_model.layers.14.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
82
+ "model.language_model.layers.14.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
83
+ "model.language_model.layers.14.self_attn.q_norm.weight": "model-00002-of-00004.safetensors",
84
+ "model.language_model.layers.14.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
85
+ "model.language_model.layers.14.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
86
+ "model.language_model.layers.15.input_layernorm.weight": "model-00004-of-00004.safetensors",
87
+ "model.language_model.layers.15.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
88
+ "model.language_model.layers.15.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
89
+ "model.language_model.layers.15.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
90
+ "model.language_model.layers.15.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
91
+ "model.language_model.layers.15.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
92
+ "model.language_model.layers.15.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
93
+ "model.language_model.layers.15.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
94
+ "model.language_model.layers.15.self_attn.q_norm.weight": "model-00002-of-00004.safetensors",
95
+ "model.language_model.layers.15.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
96
+ "model.language_model.layers.15.self_attn.v_proj.weight": "model-00004-of-00004.safetensors",
97
+ "model.language_model.layers.16.input_layernorm.weight": "model-00001-of-00004.safetensors",
98
+ "model.language_model.layers.16.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
99
+ "model.language_model.layers.16.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
100
+ "model.language_model.layers.16.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
101
+ "model.language_model.layers.16.post_attention_layernorm.weight": "model-00004-of-00004.safetensors",
102
+ "model.language_model.layers.16.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
103
+ "model.language_model.layers.16.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
104
+ "model.language_model.layers.16.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
105
+ "model.language_model.layers.16.self_attn.q_norm.weight": "model-00004-of-00004.safetensors",
106
+ "model.language_model.layers.16.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
107
+ "model.language_model.layers.16.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
108
+ "model.language_model.layers.17.input_layernorm.weight": "model-00004-of-00004.safetensors",
109
+ "model.language_model.layers.17.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
110
+ "model.language_model.layers.17.mlp.gate_proj.weight": "model-00004-of-00004.safetensors",
111
+ "model.language_model.layers.17.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
112
+ "model.language_model.layers.17.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
113
+ "model.language_model.layers.17.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
114
+ "model.language_model.layers.17.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
115
+ "model.language_model.layers.17.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
116
+ "model.language_model.layers.17.self_attn.q_norm.weight": "model-00002-of-00004.safetensors",
117
+ "model.language_model.layers.17.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
118
+ "model.language_model.layers.17.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
119
+ "model.language_model.layers.18.input_layernorm.weight": "model-00001-of-00004.safetensors",
120
+ "model.language_model.layers.18.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
121
+ "model.language_model.layers.18.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
122
+ "model.language_model.layers.18.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
123
+ "model.language_model.layers.18.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
124
+ "model.language_model.layers.18.self_attn.k_norm.weight": "model-00001-of-00004.safetensors",
125
+ "model.language_model.layers.18.self_attn.k_proj.weight": "model-00004-of-00004.safetensors",
126
+ "model.language_model.layers.18.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
127
+ "model.language_model.layers.18.self_attn.q_norm.weight": "model-00002-of-00004.safetensors",
128
+ "model.language_model.layers.18.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
129
+ "model.language_model.layers.18.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
130
+ "model.language_model.layers.19.input_layernorm.weight": "model-00002-of-00004.safetensors",
131
+ "model.language_model.layers.19.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
132
+ "model.language_model.layers.19.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
133
+ "model.language_model.layers.19.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
134
+ "model.language_model.layers.19.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
135
+ "model.language_model.layers.19.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
136
+ "model.language_model.layers.19.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
137
+ "model.language_model.layers.19.self_attn.o_proj.weight": "model-00004-of-00004.safetensors",
138
+ "model.language_model.layers.19.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
139
+ "model.language_model.layers.19.self_attn.q_proj.weight": "model-00004-of-00004.safetensors",
140
+ "model.language_model.layers.19.self_attn.v_proj.weight": "model-00004-of-00004.safetensors",
141
+ "model.language_model.layers.2.input_layernorm.weight": "model-00003-of-00004.safetensors",
142
+ "model.language_model.layers.2.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
143
+ "model.language_model.layers.2.mlp.gate_proj.weight": "model-00004-of-00004.safetensors",
144
+ "model.language_model.layers.2.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
145
+ "model.language_model.layers.2.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
146
+ "model.language_model.layers.2.self_attn.k_norm.weight": "model-00001-of-00004.safetensors",
147
+ "model.language_model.layers.2.self_attn.k_proj.weight": "model-00004-of-00004.safetensors",
148
+ "model.language_model.layers.2.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
149
+ "model.language_model.layers.2.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
150
+ "model.language_model.layers.2.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
151
+ "model.language_model.layers.2.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
152
+ "model.language_model.layers.20.input_layernorm.weight": "model-00004-of-00004.safetensors",
153
+ "model.language_model.layers.20.mlp.down_proj.weight": "model-00004-of-00004.safetensors",
154
+ "model.language_model.layers.20.mlp.gate_proj.weight": "model-00004-of-00004.safetensors",
155
+ "model.language_model.layers.20.mlp.up_proj.weight": "model-00004-of-00004.safetensors",
156
+ "model.language_model.layers.20.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
157
+ "model.language_model.layers.20.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
158
+ "model.language_model.layers.20.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
159
+ "model.language_model.layers.20.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
160
+ "model.language_model.layers.20.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
161
+ "model.language_model.layers.20.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
162
+ "model.language_model.layers.20.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
163
+ "model.language_model.layers.21.input_layernorm.weight": "model-00003-of-00004.safetensors",
164
+ "model.language_model.layers.21.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
165
+ "model.language_model.layers.21.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
166
+ "model.language_model.layers.21.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
167
+ "model.language_model.layers.21.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
168
+ "model.language_model.layers.21.self_attn.k_norm.weight": "model-00001-of-00004.safetensors",
169
+ "model.language_model.layers.21.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
170
+ "model.language_model.layers.21.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
171
+ "model.language_model.layers.21.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
172
+ "model.language_model.layers.21.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
173
+ "model.language_model.layers.21.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
174
+ "model.language_model.layers.22.input_layernorm.weight": "model-00003-of-00004.safetensors",
175
+ "model.language_model.layers.22.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
176
+ "model.language_model.layers.22.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
177
+ "model.language_model.layers.22.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
178
+ "model.language_model.layers.22.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
179
+ "model.language_model.layers.22.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
180
+ "model.language_model.layers.22.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
181
+ "model.language_model.layers.22.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
182
+ "model.language_model.layers.22.self_attn.q_norm.weight": "model-00002-of-00004.safetensors",
183
+ "model.language_model.layers.22.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
184
+ "model.language_model.layers.22.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
185
+ "model.language_model.layers.23.input_layernorm.weight": "model-00001-of-00004.safetensors",
186
+ "model.language_model.layers.23.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
187
+ "model.language_model.layers.23.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
188
+ "model.language_model.layers.23.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
189
+ "model.language_model.layers.23.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
190
+ "model.language_model.layers.23.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
191
+ "model.language_model.layers.23.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
192
+ "model.language_model.layers.23.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
193
+ "model.language_model.layers.23.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
194
+ "model.language_model.layers.23.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
195
+ "model.language_model.layers.23.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
196
+ "model.language_model.layers.24.input_layernorm.weight": "model-00001-of-00004.safetensors",
197
+ "model.language_model.layers.24.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
198
+ "model.language_model.layers.24.mlp.gate_proj.weight": "model-00004-of-00004.safetensors",
199
+ "model.language_model.layers.24.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
200
+ "model.language_model.layers.24.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
201
+ "model.language_model.layers.24.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
202
+ "model.language_model.layers.24.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
203
+ "model.language_model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
204
+ "model.language_model.layers.24.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
205
+ "model.language_model.layers.24.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
206
+ "model.language_model.layers.24.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
207
+ "model.language_model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors",
208
+ "model.language_model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
209
+ "model.language_model.layers.25.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
210
+ "model.language_model.layers.25.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
211
+ "model.language_model.layers.25.post_attention_layernorm.weight": "model-00004-of-00004.safetensors",
212
+ "model.language_model.layers.25.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
213
+ "model.language_model.layers.25.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
214
+ "model.language_model.layers.25.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
215
+ "model.language_model.layers.25.self_attn.q_norm.weight": "model-00002-of-00004.safetensors",
216
+ "model.language_model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
217
+ "model.language_model.layers.25.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
218
+ "model.language_model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors",
219
+ "model.language_model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
220
+ "model.language_model.layers.26.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
221
+ "model.language_model.layers.26.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
222
+ "model.language_model.layers.26.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
223
+ "model.language_model.layers.26.self_attn.k_norm.weight": "model-00001-of-00004.safetensors",
224
+ "model.language_model.layers.26.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
225
+ "model.language_model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
226
+ "model.language_model.layers.26.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
227
+ "model.language_model.layers.26.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
228
+ "model.language_model.layers.26.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
229
+ "model.language_model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors",
230
+ "model.language_model.layers.27.mlp.down_proj.weight": "model-00004-of-00004.safetensors",
231
+ "model.language_model.layers.27.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
232
+ "model.language_model.layers.27.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
233
+ "model.language_model.layers.27.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
234
+ "model.language_model.layers.27.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
235
+ "model.language_model.layers.27.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
236
+ "model.language_model.layers.27.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
237
+ "model.language_model.layers.27.self_attn.q_norm.weight": "model-00004-of-00004.safetensors",
238
+ "model.language_model.layers.27.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
239
+ "model.language_model.layers.27.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
240
+ "model.language_model.layers.28.input_layernorm.weight": "model-00001-of-00004.safetensors",
241
+ "model.language_model.layers.28.mlp.down_proj.weight": "model-00004-of-00004.safetensors",
242
+ "model.language_model.layers.28.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
243
+ "model.language_model.layers.28.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
244
+ "model.language_model.layers.28.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
245
+ "model.language_model.layers.28.self_attn.k_norm.weight": "model-00001-of-00004.safetensors",
246
+ "model.language_model.layers.28.self_attn.k_proj.weight": "model-00004-of-00004.safetensors",
247
+ "model.language_model.layers.28.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
248
+ "model.language_model.layers.28.self_attn.q_norm.weight": "model-00004-of-00004.safetensors",
249
+ "model.language_model.layers.28.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
250
+ "model.language_model.layers.28.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
251
+ "model.language_model.layers.29.input_layernorm.weight": "model-00002-of-00004.safetensors",
252
+ "model.language_model.layers.29.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
253
+ "model.language_model.layers.29.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
254
+ "model.language_model.layers.29.mlp.up_proj.weight": "model-00004-of-00004.safetensors",
255
+ "model.language_model.layers.29.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
256
+ "model.language_model.layers.29.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
257
+ "model.language_model.layers.29.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
258
+ "model.language_model.layers.29.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
259
+ "model.language_model.layers.29.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
260
+ "model.language_model.layers.29.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
261
+ "model.language_model.layers.29.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
262
+ "model.language_model.layers.3.input_layernorm.weight": "model-00001-of-00004.safetensors",
263
+ "model.language_model.layers.3.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
264
+ "model.language_model.layers.3.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
265
+ "model.language_model.layers.3.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
266
+ "model.language_model.layers.3.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
267
+ "model.language_model.layers.3.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
268
+ "model.language_model.layers.3.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
269
+ "model.language_model.layers.3.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
270
+ "model.language_model.layers.3.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
271
+ "model.language_model.layers.3.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
272
+ "model.language_model.layers.3.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
273
+ "model.language_model.layers.30.input_layernorm.weight": "model-00001-of-00004.safetensors",
274
+ "model.language_model.layers.30.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
275
+ "model.language_model.layers.30.mlp.gate_proj.weight": "model-00004-of-00004.safetensors",
276
+ "model.language_model.layers.30.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
277
+ "model.language_model.layers.30.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
278
+ "model.language_model.layers.30.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
279
+ "model.language_model.layers.30.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
280
+ "model.language_model.layers.30.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
281
+ "model.language_model.layers.30.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
282
+ "model.language_model.layers.30.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
283
+ "model.language_model.layers.30.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
284
+ "model.language_model.layers.31.input_layernorm.weight": "model-00001-of-00004.safetensors",
285
+ "model.language_model.layers.31.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
286
+ "model.language_model.layers.31.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
287
+ "model.language_model.layers.31.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
288
+ "model.language_model.layers.31.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
289
+ "model.language_model.layers.31.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
290
+ "model.language_model.layers.31.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
291
+ "model.language_model.layers.31.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
292
+ "model.language_model.layers.31.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
293
+ "model.language_model.layers.31.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
294
+ "model.language_model.layers.31.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
295
+ "model.language_model.layers.32.input_layernorm.weight": "model-00002-of-00004.safetensors",
296
+ "model.language_model.layers.32.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
297
+ "model.language_model.layers.32.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
298
+ "model.language_model.layers.32.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
299
+ "model.language_model.layers.32.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
300
+ "model.language_model.layers.32.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
301
+ "model.language_model.layers.32.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
302
+ "model.language_model.layers.32.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
303
+ "model.language_model.layers.32.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
304
+ "model.language_model.layers.32.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
305
+ "model.language_model.layers.32.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
306
+ "model.language_model.layers.33.input_layernorm.weight": "model-00001-of-00004.safetensors",
307
+ "model.language_model.layers.33.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
308
+ "model.language_model.layers.33.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
309
+ "model.language_model.layers.33.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
310
+ "model.language_model.layers.33.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
311
+ "model.language_model.layers.33.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
312
+ "model.language_model.layers.33.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
313
+ "model.language_model.layers.33.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
314
+ "model.language_model.layers.33.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
315
+ "model.language_model.layers.33.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
316
+ "model.language_model.layers.33.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
317
+ "model.language_model.layers.34.input_layernorm.weight": "model-00004-of-00004.safetensors",
318
+ "model.language_model.layers.34.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
319
+ "model.language_model.layers.34.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
320
+ "model.language_model.layers.34.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
321
+ "model.language_model.layers.34.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
322
+ "model.language_model.layers.34.self_attn.k_norm.weight": "model-00002-of-00004.safetensors",
323
+ "model.language_model.layers.34.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
324
+ "model.language_model.layers.34.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
325
+ "model.language_model.layers.34.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
326
+ "model.language_model.layers.34.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
327
+ "model.language_model.layers.34.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
328
+ "model.language_model.layers.35.input_layernorm.weight": "model-00001-of-00004.safetensors",
329
+ "model.language_model.layers.35.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
330
+ "model.language_model.layers.35.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
331
+ "model.language_model.layers.35.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
332
+ "model.language_model.layers.35.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
333
+ "model.language_model.layers.35.self_attn.k_norm.weight": "model-00004-of-00004.safetensors",
334
+ "model.language_model.layers.35.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
335
+ "model.language_model.layers.35.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
336
+ "model.language_model.layers.35.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
337
+ "model.language_model.layers.35.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
338
+ "model.language_model.layers.35.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
339
+ "model.language_model.layers.4.input_layernorm.weight": "model-00002-of-00004.safetensors",
340
+ "model.language_model.layers.4.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
341
+ "model.language_model.layers.4.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
342
+ "model.language_model.layers.4.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
343
+ "model.language_model.layers.4.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
344
+ "model.language_model.layers.4.self_attn.k_norm.weight": "model-00001-of-00004.safetensors",
345
+ "model.language_model.layers.4.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
346
+ "model.language_model.layers.4.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
347
+ "model.language_model.layers.4.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
348
+ "model.language_model.layers.4.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
349
+ "model.language_model.layers.4.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
350
+ "model.language_model.layers.5.input_layernorm.weight": "model-00001-of-00004.safetensors",
351
+ "model.language_model.layers.5.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
352
+ "model.language_model.layers.5.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
353
+ "model.language_model.layers.5.mlp.up_proj.weight": "model-00004-of-00004.safetensors",
354
+ "model.language_model.layers.5.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
355
+ "model.language_model.layers.5.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
356
+ "model.language_model.layers.5.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
357
+ "model.language_model.layers.5.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
358
+ "model.language_model.layers.5.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
359
+ "model.language_model.layers.5.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
360
+ "model.language_model.layers.5.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
361
+ "model.language_model.layers.6.input_layernorm.weight": "model-00003-of-00004.safetensors",
362
+ "model.language_model.layers.6.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
363
+ "model.language_model.layers.6.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
364
+ "model.language_model.layers.6.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
365
+ "model.language_model.layers.6.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
366
+ "model.language_model.layers.6.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
367
+ "model.language_model.layers.6.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
368
+ "model.language_model.layers.6.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
369
+ "model.language_model.layers.6.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
370
+ "model.language_model.layers.6.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
371
+ "model.language_model.layers.6.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
372
+ "model.language_model.layers.7.input_layernorm.weight": "model-00003-of-00004.safetensors",
373
+ "model.language_model.layers.7.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
374
+ "model.language_model.layers.7.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
375
+ "model.language_model.layers.7.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
376
+ "model.language_model.layers.7.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
377
+ "model.language_model.layers.7.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
378
+ "model.language_model.layers.7.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
379
+ "model.language_model.layers.7.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
380
+ "model.language_model.layers.7.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
381
+ "model.language_model.layers.7.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
382
+ "model.language_model.layers.7.self_attn.v_proj.weight": "model-00004-of-00004.safetensors",
383
+ "model.language_model.layers.8.input_layernorm.weight": "model-00001-of-00004.safetensors",
384
+ "model.language_model.layers.8.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
385
+ "model.language_model.layers.8.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
386
+ "model.language_model.layers.8.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
387
+ "model.language_model.layers.8.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
388
+ "model.language_model.layers.8.self_attn.k_norm.weight": "model-00003-of-00004.safetensors",
389
+ "model.language_model.layers.8.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
390
+ "model.language_model.layers.8.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
391
+ "model.language_model.layers.8.self_attn.q_norm.weight": "model-00001-of-00004.safetensors",
392
+ "model.language_model.layers.8.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
393
+ "model.language_model.layers.8.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
394
+ "model.language_model.layers.9.input_layernorm.weight": "model-00001-of-00004.safetensors",
395
+ "model.language_model.layers.9.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
396
+ "model.language_model.layers.9.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
397
+ "model.language_model.layers.9.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
398
+ "model.language_model.layers.9.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
399
+ "model.language_model.layers.9.self_attn.k_norm.weight": "model-00001-of-00004.safetensors",
400
+ "model.language_model.layers.9.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
401
+ "model.language_model.layers.9.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
402
+ "model.language_model.layers.9.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
403
+ "model.language_model.layers.9.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
404
+ "model.language_model.layers.9.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
405
+ "model.language_model.norm.weight": "model-00002-of-00004.safetensors",
406
+ "model.visual.blocks.0.attn.proj.bias": "model-00004-of-00004.safetensors",
407
+ "model.visual.blocks.0.attn.proj.weight": "model-00001-of-00004.safetensors",
408
+ "model.visual.blocks.0.attn.qkv.bias": "model-00001-of-00004.safetensors",
409
+ "model.visual.blocks.0.attn.qkv.weight": "model-00001-of-00004.safetensors",
410
+ "model.visual.blocks.0.mlp.linear_fc1.bias": "model-00003-of-00004.safetensors",
411
+ "model.visual.blocks.0.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
412
+ "model.visual.blocks.0.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
413
+ "model.visual.blocks.0.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
414
+ "model.visual.blocks.0.norm1.bias": "model-00003-of-00004.safetensors",
415
+ "model.visual.blocks.0.norm1.weight": "model-00003-of-00004.safetensors",
416
+ "model.visual.blocks.0.norm2.bias": "model-00001-of-00004.safetensors",
417
+ "model.visual.blocks.0.norm2.weight": "model-00003-of-00004.safetensors",
418
+ "model.visual.blocks.1.attn.proj.bias": "model-00002-of-00004.safetensors",
419
+ "model.visual.blocks.1.attn.proj.weight": "model-00003-of-00004.safetensors",
420
+ "model.visual.blocks.1.attn.qkv.bias": "model-00001-of-00004.safetensors",
421
+ "model.visual.blocks.1.attn.qkv.weight": "model-00001-of-00004.safetensors",
422
+ "model.visual.blocks.1.mlp.linear_fc1.bias": "model-00002-of-00004.safetensors",
423
+ "model.visual.blocks.1.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
424
+ "model.visual.blocks.1.mlp.linear_fc2.bias": "model-00004-of-00004.safetensors",
425
+ "model.visual.blocks.1.mlp.linear_fc2.weight": "model-00004-of-00004.safetensors",
426
+ "model.visual.blocks.1.norm1.bias": "model-00003-of-00004.safetensors",
427
+ "model.visual.blocks.1.norm1.weight": "model-00003-of-00004.safetensors",
428
+ "model.visual.blocks.1.norm2.bias": "model-00003-of-00004.safetensors",
429
+ "model.visual.blocks.1.norm2.weight": "model-00003-of-00004.safetensors",
430
+ "model.visual.blocks.10.attn.proj.bias": "model-00001-of-00004.safetensors",
431
+ "model.visual.blocks.10.attn.proj.weight": "model-00003-of-00004.safetensors",
432
+ "model.visual.blocks.10.attn.qkv.bias": "model-00002-of-00004.safetensors",
433
+ "model.visual.blocks.10.attn.qkv.weight": "model-00001-of-00004.safetensors",
434
+ "model.visual.blocks.10.mlp.linear_fc1.bias": "model-00002-of-00004.safetensors",
435
+ "model.visual.blocks.10.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors",
436
+ "model.visual.blocks.10.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
437
+ "model.visual.blocks.10.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
438
+ "model.visual.blocks.10.norm1.bias": "model-00001-of-00004.safetensors",
439
+ "model.visual.blocks.10.norm1.weight": "model-00003-of-00004.safetensors",
440
+ "model.visual.blocks.10.norm2.bias": "model-00001-of-00004.safetensors",
441
+ "model.visual.blocks.10.norm2.weight": "model-00002-of-00004.safetensors",
442
+ "model.visual.blocks.11.attn.proj.bias": "model-00001-of-00004.safetensors",
443
+ "model.visual.blocks.11.attn.proj.weight": "model-00002-of-00004.safetensors",
444
+ "model.visual.blocks.11.attn.qkv.bias": "model-00001-of-00004.safetensors",
445
+ "model.visual.blocks.11.attn.qkv.weight": "model-00001-of-00004.safetensors",
446
+ "model.visual.blocks.11.mlp.linear_fc1.bias": "model-00002-of-00004.safetensors",
447
+ "model.visual.blocks.11.mlp.linear_fc1.weight": "model-00004-of-00004.safetensors",
448
+ "model.visual.blocks.11.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
449
+ "model.visual.blocks.11.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
450
+ "model.visual.blocks.11.norm1.bias": "model-00002-of-00004.safetensors",
451
+ "model.visual.blocks.11.norm1.weight": "model-00003-of-00004.safetensors",
452
+ "model.visual.blocks.11.norm2.bias": "model-00002-of-00004.safetensors",
453
+ "model.visual.blocks.11.norm2.weight": "model-00002-of-00004.safetensors",
454
+ "model.visual.blocks.12.attn.proj.bias": "model-00002-of-00004.safetensors",
455
+ "model.visual.blocks.12.attn.proj.weight": "model-00002-of-00004.safetensors",
456
+ "model.visual.blocks.12.attn.qkv.bias": "model-00001-of-00004.safetensors",
457
+ "model.visual.blocks.12.attn.qkv.weight": "model-00003-of-00004.safetensors",
458
+ "model.visual.blocks.12.mlp.linear_fc1.bias": "model-00003-of-00004.safetensors",
459
+ "model.visual.blocks.12.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
460
+ "model.visual.blocks.12.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
461
+ "model.visual.blocks.12.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
462
+ "model.visual.blocks.12.norm1.bias": "model-00001-of-00004.safetensors",
463
+ "model.visual.blocks.12.norm1.weight": "model-00001-of-00004.safetensors",
464
+ "model.visual.blocks.12.norm2.bias": "model-00001-of-00004.safetensors",
465
+ "model.visual.blocks.12.norm2.weight": "model-00001-of-00004.safetensors",
466
+ "model.visual.blocks.13.attn.proj.bias": "model-00003-of-00004.safetensors",
467
+ "model.visual.blocks.13.attn.proj.weight": "model-00002-of-00004.safetensors",
468
+ "model.visual.blocks.13.attn.qkv.bias": "model-00003-of-00004.safetensors",
469
+ "model.visual.blocks.13.attn.qkv.weight": "model-00001-of-00004.safetensors",
470
+ "model.visual.blocks.13.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
471
+ "model.visual.blocks.13.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors",
472
+ "model.visual.blocks.13.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors",
473
+ "model.visual.blocks.13.mlp.linear_fc2.weight": "model-00003-of-00004.safetensors",
474
+ "model.visual.blocks.13.norm1.bias": "model-00001-of-00004.safetensors",
475
+ "model.visual.blocks.13.norm1.weight": "model-00001-of-00004.safetensors",
476
+ "model.visual.blocks.13.norm2.bias": "model-00001-of-00004.safetensors",
477
+ "model.visual.blocks.13.norm2.weight": "model-00003-of-00004.safetensors",
478
+ "model.visual.blocks.14.attn.proj.bias": "model-00002-of-00004.safetensors",
479
+ "model.visual.blocks.14.attn.proj.weight": "model-00001-of-00004.safetensors",
480
+ "model.visual.blocks.14.attn.qkv.bias": "model-00004-of-00004.safetensors",
481
+ "model.visual.blocks.14.attn.qkv.weight": "model-00001-of-00004.safetensors",
482
+ "model.visual.blocks.14.mlp.linear_fc1.bias": "model-00004-of-00004.safetensors",
483
+ "model.visual.blocks.14.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
484
+ "model.visual.blocks.14.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
485
+ "model.visual.blocks.14.mlp.linear_fc2.weight": "model-00002-of-00004.safetensors",
486
+ "model.visual.blocks.14.norm1.bias": "model-00003-of-00004.safetensors",
487
+ "model.visual.blocks.14.norm1.weight": "model-00003-of-00004.safetensors",
488
+ "model.visual.blocks.14.norm2.bias": "model-00001-of-00004.safetensors",
489
+ "model.visual.blocks.14.norm2.weight": "model-00003-of-00004.safetensors",
490
+ "model.visual.blocks.15.attn.proj.bias": "model-00003-of-00004.safetensors",
491
+ "model.visual.blocks.15.attn.proj.weight": "model-00003-of-00004.safetensors",
492
+ "model.visual.blocks.15.attn.qkv.bias": "model-00004-of-00004.safetensors",
493
+ "model.visual.blocks.15.attn.qkv.weight": "model-00002-of-00004.safetensors",
494
+ "model.visual.blocks.15.mlp.linear_fc1.bias": "model-00002-of-00004.safetensors",
495
+ "model.visual.blocks.15.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
496
+ "model.visual.blocks.15.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
497
+ "model.visual.blocks.15.mlp.linear_fc2.weight": "model-00004-of-00004.safetensors",
498
+ "model.visual.blocks.15.norm1.bias": "model-00002-of-00004.safetensors",
499
+ "model.visual.blocks.15.norm1.weight": "model-00001-of-00004.safetensors",
500
+ "model.visual.blocks.15.norm2.bias": "model-00002-of-00004.safetensors",
501
+ "model.visual.blocks.15.norm2.weight": "model-00001-of-00004.safetensors",
502
+ "model.visual.blocks.16.attn.proj.bias": "model-00002-of-00004.safetensors",
503
+ "model.visual.blocks.16.attn.proj.weight": "model-00002-of-00004.safetensors",
504
+ "model.visual.blocks.16.attn.qkv.bias": "model-00002-of-00004.safetensors",
505
+ "model.visual.blocks.16.attn.qkv.weight": "model-00002-of-00004.safetensors",
506
+ "model.visual.blocks.16.mlp.linear_fc1.bias": "model-00002-of-00004.safetensors",
507
+ "model.visual.blocks.16.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
508
+ "model.visual.blocks.16.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
509
+ "model.visual.blocks.16.mlp.linear_fc2.weight": "model-00004-of-00004.safetensors",
510
+ "model.visual.blocks.16.norm1.bias": "model-00002-of-00004.safetensors",
511
+ "model.visual.blocks.16.norm1.weight": "model-00003-of-00004.safetensors",
512
+ "model.visual.blocks.16.norm2.bias": "model-00001-of-00004.safetensors",
513
+ "model.visual.blocks.16.norm2.weight": "model-00001-of-00004.safetensors",
514
+ "model.visual.blocks.17.attn.proj.bias": "model-00003-of-00004.safetensors",
515
+ "model.visual.blocks.17.attn.proj.weight": "model-00003-of-00004.safetensors",
516
+ "model.visual.blocks.17.attn.qkv.bias": "model-00002-of-00004.safetensors",
517
+ "model.visual.blocks.17.attn.qkv.weight": "model-00001-of-00004.safetensors",
518
+ "model.visual.blocks.17.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
519
+ "model.visual.blocks.17.mlp.linear_fc1.weight": "model-00002-of-00004.safetensors",
520
+ "model.visual.blocks.17.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors",
521
+ "model.visual.blocks.17.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
522
+ "model.visual.blocks.17.norm1.bias": "model-00003-of-00004.safetensors",
523
+ "model.visual.blocks.17.norm1.weight": "model-00001-of-00004.safetensors",
524
+ "model.visual.blocks.17.norm2.bias": "model-00003-of-00004.safetensors",
525
+ "model.visual.blocks.17.norm2.weight": "model-00002-of-00004.safetensors",
526
+ "model.visual.blocks.18.attn.proj.bias": "model-00003-of-00004.safetensors",
527
+ "model.visual.blocks.18.attn.proj.weight": "model-00003-of-00004.safetensors",
528
+ "model.visual.blocks.18.attn.qkv.bias": "model-00001-of-00004.safetensors",
529
+ "model.visual.blocks.18.attn.qkv.weight": "model-00002-of-00004.safetensors",
530
+ "model.visual.blocks.18.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
531
+ "model.visual.blocks.18.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
532
+ "model.visual.blocks.18.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors",
533
+ "model.visual.blocks.18.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
534
+ "model.visual.blocks.18.norm1.bias": "model-00003-of-00004.safetensors",
535
+ "model.visual.blocks.18.norm1.weight": "model-00002-of-00004.safetensors",
536
+ "model.visual.blocks.18.norm2.bias": "model-00003-of-00004.safetensors",
537
+ "model.visual.blocks.18.norm2.weight": "model-00001-of-00004.safetensors",
538
+ "model.visual.blocks.19.attn.proj.bias": "model-00003-of-00004.safetensors",
539
+ "model.visual.blocks.19.attn.proj.weight": "model-00001-of-00004.safetensors",
540
+ "model.visual.blocks.19.attn.qkv.bias": "model-00001-of-00004.safetensors",
541
+ "model.visual.blocks.19.attn.qkv.weight": "model-00002-of-00004.safetensors",
542
+ "model.visual.blocks.19.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
543
+ "model.visual.blocks.19.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors",
544
+ "model.visual.blocks.19.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
545
+ "model.visual.blocks.19.mlp.linear_fc2.weight": "model-00003-of-00004.safetensors",
546
+ "model.visual.blocks.19.norm1.bias": "model-00003-of-00004.safetensors",
547
+ "model.visual.blocks.19.norm1.weight": "model-00002-of-00004.safetensors",
548
+ "model.visual.blocks.19.norm2.bias": "model-00004-of-00004.safetensors",
549
+ "model.visual.blocks.19.norm2.weight": "model-00004-of-00004.safetensors",
550
+ "model.visual.blocks.2.attn.proj.bias": "model-00003-of-00004.safetensors",
551
+ "model.visual.blocks.2.attn.proj.weight": "model-00001-of-00004.safetensors",
552
+ "model.visual.blocks.2.attn.qkv.bias": "model-00001-of-00004.safetensors",
553
+ "model.visual.blocks.2.attn.qkv.weight": "model-00003-of-00004.safetensors",
554
+ "model.visual.blocks.2.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
555
+ "model.visual.blocks.2.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors",
556
+ "model.visual.blocks.2.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
557
+ "model.visual.blocks.2.mlp.linear_fc2.weight": "model-00003-of-00004.safetensors",
558
+ "model.visual.blocks.2.norm1.bias": "model-00003-of-00004.safetensors",
559
+ "model.visual.blocks.2.norm1.weight": "model-00002-of-00004.safetensors",
560
+ "model.visual.blocks.2.norm2.bias": "model-00002-of-00004.safetensors",
561
+ "model.visual.blocks.2.norm2.weight": "model-00003-of-00004.safetensors",
562
+ "model.visual.blocks.20.attn.proj.bias": "model-00002-of-00004.safetensors",
563
+ "model.visual.blocks.20.attn.proj.weight": "model-00004-of-00004.safetensors",
564
+ "model.visual.blocks.20.attn.qkv.bias": "model-00002-of-00004.safetensors",
565
+ "model.visual.blocks.20.attn.qkv.weight": "model-00004-of-00004.safetensors",
566
+ "model.visual.blocks.20.mlp.linear_fc1.bias": "model-00003-of-00004.safetensors",
567
+ "model.visual.blocks.20.mlp.linear_fc1.weight": "model-00002-of-00004.safetensors",
568
+ "model.visual.blocks.20.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors",
569
+ "model.visual.blocks.20.mlp.linear_fc2.weight": "model-00002-of-00004.safetensors",
570
+ "model.visual.blocks.20.norm1.bias": "model-00003-of-00004.safetensors",
571
+ "model.visual.blocks.20.norm1.weight": "model-00003-of-00004.safetensors",
572
+ "model.visual.blocks.20.norm2.bias": "model-00004-of-00004.safetensors",
573
+ "model.visual.blocks.20.norm2.weight": "model-00003-of-00004.safetensors",
574
+ "model.visual.blocks.21.attn.proj.bias": "model-00003-of-00004.safetensors",
575
+ "model.visual.blocks.21.attn.proj.weight": "model-00001-of-00004.safetensors",
576
+ "model.visual.blocks.21.attn.qkv.bias": "model-00003-of-00004.safetensors",
577
+ "model.visual.blocks.21.attn.qkv.weight": "model-00004-of-00004.safetensors",
578
+ "model.visual.blocks.21.mlp.linear_fc1.bias": "model-00002-of-00004.safetensors",
579
+ "model.visual.blocks.21.mlp.linear_fc1.weight": "model-00002-of-00004.safetensors",
580
+ "model.visual.blocks.21.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors",
581
+ "model.visual.blocks.21.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
582
+ "model.visual.blocks.21.norm1.bias": "model-00001-of-00004.safetensors",
583
+ "model.visual.blocks.21.norm1.weight": "model-00003-of-00004.safetensors",
584
+ "model.visual.blocks.21.norm2.bias": "model-00003-of-00004.safetensors",
585
+ "model.visual.blocks.21.norm2.weight": "model-00003-of-00004.safetensors",
586
+ "model.visual.blocks.22.attn.proj.bias": "model-00003-of-00004.safetensors",
587
+ "model.visual.blocks.22.attn.proj.weight": "model-00001-of-00004.safetensors",
588
+ "model.visual.blocks.22.attn.qkv.bias": "model-00002-of-00004.safetensors",
589
+ "model.visual.blocks.22.attn.qkv.weight": "model-00004-of-00004.safetensors",
590
+ "model.visual.blocks.22.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
591
+ "model.visual.blocks.22.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
592
+ "model.visual.blocks.22.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors",
593
+ "model.visual.blocks.22.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
594
+ "model.visual.blocks.22.norm1.bias": "model-00001-of-00004.safetensors",
595
+ "model.visual.blocks.22.norm1.weight": "model-00001-of-00004.safetensors",
596
+ "model.visual.blocks.22.norm2.bias": "model-00001-of-00004.safetensors",
597
+ "model.visual.blocks.22.norm2.weight": "model-00001-of-00004.safetensors",
598
+ "model.visual.blocks.23.attn.proj.bias": "model-00001-of-00004.safetensors",
599
+ "model.visual.blocks.23.attn.proj.weight": "model-00003-of-00004.safetensors",
600
+ "model.visual.blocks.23.attn.qkv.bias": "model-00003-of-00004.safetensors",
601
+ "model.visual.blocks.23.attn.qkv.weight": "model-00001-of-00004.safetensors",
602
+ "model.visual.blocks.23.mlp.linear_fc1.bias": "model-00002-of-00004.safetensors",
603
+ "model.visual.blocks.23.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
604
+ "model.visual.blocks.23.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
605
+ "model.visual.blocks.23.mlp.linear_fc2.weight": "model-00002-of-00004.safetensors",
606
+ "model.visual.blocks.23.norm1.bias": "model-00003-of-00004.safetensors",
607
+ "model.visual.blocks.23.norm1.weight": "model-00001-of-00004.safetensors",
608
+ "model.visual.blocks.23.norm2.bias": "model-00003-of-00004.safetensors",
609
+ "model.visual.blocks.23.norm2.weight": "model-00003-of-00004.safetensors",
610
+ "model.visual.blocks.24.attn.proj.bias": "model-00003-of-00004.safetensors",
611
+ "model.visual.blocks.24.attn.proj.weight": "model-00002-of-00004.safetensors",
612
+ "model.visual.blocks.24.attn.qkv.bias": "model-00001-of-00004.safetensors",
613
+ "model.visual.blocks.24.attn.qkv.weight": "model-00003-of-00004.safetensors",
614
+ "model.visual.blocks.24.mlp.linear_fc1.bias": "model-00003-of-00004.safetensors",
615
+ "model.visual.blocks.24.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
616
+ "model.visual.blocks.24.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors",
617
+ "model.visual.blocks.24.mlp.linear_fc2.weight": "model-00002-of-00004.safetensors",
618
+ "model.visual.blocks.24.norm1.bias": "model-00003-of-00004.safetensors",
619
+ "model.visual.blocks.24.norm1.weight": "model-00002-of-00004.safetensors",
620
+ "model.visual.blocks.24.norm2.bias": "model-00003-of-00004.safetensors",
621
+ "model.visual.blocks.24.norm2.weight": "model-00003-of-00004.safetensors",
622
+ "model.visual.blocks.25.attn.proj.bias": "model-00001-of-00004.safetensors",
623
+ "model.visual.blocks.25.attn.proj.weight": "model-00004-of-00004.safetensors",
624
+ "model.visual.blocks.25.attn.qkv.bias": "model-00003-of-00004.safetensors",
625
+ "model.visual.blocks.25.attn.qkv.weight": "model-00002-of-00004.safetensors",
626
+ "model.visual.blocks.25.mlp.linear_fc1.bias": "model-00002-of-00004.safetensors",
627
+ "model.visual.blocks.25.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors",
628
+ "model.visual.blocks.25.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
629
+ "model.visual.blocks.25.mlp.linear_fc2.weight": "model-00003-of-00004.safetensors",
630
+ "model.visual.blocks.25.norm1.bias": "model-00001-of-00004.safetensors",
631
+ "model.visual.blocks.25.norm1.weight": "model-00004-of-00004.safetensors",
632
+ "model.visual.blocks.25.norm2.bias": "model-00001-of-00004.safetensors",
633
+ "model.visual.blocks.25.norm2.weight": "model-00003-of-00004.safetensors",
634
+ "model.visual.blocks.26.attn.proj.bias": "model-00001-of-00004.safetensors",
635
+ "model.visual.blocks.26.attn.proj.weight": "model-00001-of-00004.safetensors",
636
+ "model.visual.blocks.26.attn.qkv.bias": "model-00001-of-00004.safetensors",
637
+ "model.visual.blocks.26.attn.qkv.weight": "model-00001-of-00004.safetensors",
638
+ "model.visual.blocks.26.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
639
+ "model.visual.blocks.26.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors",
640
+ "model.visual.blocks.26.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors",
641
+ "model.visual.blocks.26.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
642
+ "model.visual.blocks.26.norm1.bias": "model-00002-of-00004.safetensors",
643
+ "model.visual.blocks.26.norm1.weight": "model-00002-of-00004.safetensors",
644
+ "model.visual.blocks.26.norm2.bias": "model-00003-of-00004.safetensors",
645
+ "model.visual.blocks.26.norm2.weight": "model-00003-of-00004.safetensors",
646
+ "model.visual.blocks.3.attn.proj.bias": "model-00004-of-00004.safetensors",
647
+ "model.visual.blocks.3.attn.proj.weight": "model-00002-of-00004.safetensors",
648
+ "model.visual.blocks.3.attn.qkv.bias": "model-00002-of-00004.safetensors",
649
+ "model.visual.blocks.3.attn.qkv.weight": "model-00004-of-00004.safetensors",
650
+ "model.visual.blocks.3.mlp.linear_fc1.bias": "model-00003-of-00004.safetensors",
651
+ "model.visual.blocks.3.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
652
+ "model.visual.blocks.3.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
653
+ "model.visual.blocks.3.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
654
+ "model.visual.blocks.3.norm1.bias": "model-00003-of-00004.safetensors",
655
+ "model.visual.blocks.3.norm1.weight": "model-00002-of-00004.safetensors",
656
+ "model.visual.blocks.3.norm2.bias": "model-00003-of-00004.safetensors",
657
+ "model.visual.blocks.3.norm2.weight": "model-00004-of-00004.safetensors",
658
+ "model.visual.blocks.4.attn.proj.bias": "model-00001-of-00004.safetensors",
659
+ "model.visual.blocks.4.attn.proj.weight": "model-00001-of-00004.safetensors",
660
+ "model.visual.blocks.4.attn.qkv.bias": "model-00004-of-00004.safetensors",
661
+ "model.visual.blocks.4.attn.qkv.weight": "model-00003-of-00004.safetensors",
662
+ "model.visual.blocks.4.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
663
+ "model.visual.blocks.4.mlp.linear_fc1.weight": "model-00002-of-00004.safetensors",
664
+ "model.visual.blocks.4.mlp.linear_fc2.bias": "model-00004-of-00004.safetensors",
665
+ "model.visual.blocks.4.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors",
666
+ "model.visual.blocks.4.norm1.bias": "model-00001-of-00004.safetensors",
667
+ "model.visual.blocks.4.norm1.weight": "model-00001-of-00004.safetensors",
668
+ "model.visual.blocks.4.norm2.bias": "model-00001-of-00004.safetensors",
669
+ "model.visual.blocks.4.norm2.weight": "model-00001-of-00004.safetensors",
670
+ "model.visual.blocks.5.attn.proj.bias": "model-00003-of-00004.safetensors",
671
+ "model.visual.blocks.5.attn.proj.weight": "model-00001-of-00004.safetensors",
672
+ "model.visual.blocks.5.attn.qkv.bias": "model-00001-of-00004.safetensors",
673
+ "model.visual.blocks.5.attn.qkv.weight": "model-00003-of-00004.safetensors",
674
+ "model.visual.blocks.5.mlp.linear_fc1.bias": "model-00003-of-00004.safetensors",
675
+ "model.visual.blocks.5.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
676
+ "model.visual.blocks.5.mlp.linear_fc2.bias": "model-00004-of-00004.safetensors",
677
+ "model.visual.blocks.5.mlp.linear_fc2.weight": "model-00002-of-00004.safetensors",
678
+ "model.visual.blocks.5.norm1.bias": "model-00002-of-00004.safetensors",
679
+ "model.visual.blocks.5.norm1.weight": "model-00003-of-00004.safetensors",
680
+ "model.visual.blocks.5.norm2.bias": "model-00001-of-00004.safetensors",
681
+ "model.visual.blocks.5.norm2.weight": "model-00001-of-00004.safetensors",
682
+ "model.visual.blocks.6.attn.proj.bias": "model-00002-of-00004.safetensors",
683
+ "model.visual.blocks.6.attn.proj.weight": "model-00001-of-00004.safetensors",
684
+ "model.visual.blocks.6.attn.qkv.bias": "model-00003-of-00004.safetensors",
685
+ "model.visual.blocks.6.attn.qkv.weight": "model-00003-of-00004.safetensors",
686
+ "model.visual.blocks.6.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
687
+ "model.visual.blocks.6.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
688
+ "model.visual.blocks.6.mlp.linear_fc2.bias": "model-00004-of-00004.safetensors",
689
+ "model.visual.blocks.6.mlp.linear_fc2.weight": "model-00003-of-00004.safetensors",
690
+ "model.visual.blocks.6.norm1.bias": "model-00001-of-00004.safetensors",
691
+ "model.visual.blocks.6.norm1.weight": "model-00001-of-00004.safetensors",
692
+ "model.visual.blocks.6.norm2.bias": "model-00001-of-00004.safetensors",
693
+ "model.visual.blocks.6.norm2.weight": "model-00002-of-00004.safetensors",
694
+ "model.visual.blocks.7.attn.proj.bias": "model-00001-of-00004.safetensors",
695
+ "model.visual.blocks.7.attn.proj.weight": "model-00002-of-00004.safetensors",
696
+ "model.visual.blocks.7.attn.qkv.bias": "model-00001-of-00004.safetensors",
697
+ "model.visual.blocks.7.attn.qkv.weight": "model-00002-of-00004.safetensors",
698
+ "model.visual.blocks.7.mlp.linear_fc1.bias": "model-00003-of-00004.safetensors",
699
+ "model.visual.blocks.7.mlp.linear_fc1.weight": "model-00002-of-00004.safetensors",
700
+ "model.visual.blocks.7.mlp.linear_fc2.bias": "model-00002-of-00004.safetensors",
701
+ "model.visual.blocks.7.mlp.linear_fc2.weight": "model-00002-of-00004.safetensors",
702
+ "model.visual.blocks.7.norm1.bias": "model-00002-of-00004.safetensors",
703
+ "model.visual.blocks.7.norm1.weight": "model-00001-of-00004.safetensors",
704
+ "model.visual.blocks.7.norm2.bias": "model-00002-of-00004.safetensors",
705
+ "model.visual.blocks.7.norm2.weight": "model-00003-of-00004.safetensors",
706
+ "model.visual.blocks.8.attn.proj.bias": "model-00001-of-00004.safetensors",
707
+ "model.visual.blocks.8.attn.proj.weight": "model-00001-of-00004.safetensors",
708
+ "model.visual.blocks.8.attn.qkv.bias": "model-00001-of-00004.safetensors",
709
+ "model.visual.blocks.8.attn.qkv.weight": "model-00002-of-00004.safetensors",
710
+ "model.visual.blocks.8.mlp.linear_fc1.bias": "model-00002-of-00004.safetensors",
711
+ "model.visual.blocks.8.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
712
+ "model.visual.blocks.8.mlp.linear_fc2.bias": "model-00003-of-00004.safetensors",
713
+ "model.visual.blocks.8.mlp.linear_fc2.weight": "model-00003-of-00004.safetensors",
714
+ "model.visual.blocks.8.norm1.bias": "model-00003-of-00004.safetensors",
715
+ "model.visual.blocks.8.norm1.weight": "model-00001-of-00004.safetensors",
716
+ "model.visual.blocks.8.norm2.bias": "model-00002-of-00004.safetensors",
717
+ "model.visual.blocks.8.norm2.weight": "model-00003-of-00004.safetensors",
718
+ "model.visual.blocks.9.attn.proj.bias": "model-00002-of-00004.safetensors",
719
+ "model.visual.blocks.9.attn.proj.weight": "model-00003-of-00004.safetensors",
720
+ "model.visual.blocks.9.attn.qkv.bias": "model-00001-of-00004.safetensors",
721
+ "model.visual.blocks.9.attn.qkv.weight": "model-00004-of-00004.safetensors",
722
+ "model.visual.blocks.9.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors",
723
+ "model.visual.blocks.9.mlp.linear_fc1.weight": "model-00003-of-00004.safetensors",
724
+ "model.visual.blocks.9.mlp.linear_fc2.bias": "model-00002-of-00004.safetensors",
725
+ "model.visual.blocks.9.mlp.linear_fc2.weight": "model-00003-of-00004.safetensors",
726
+ "model.visual.blocks.9.norm1.bias": "model-00002-of-00004.safetensors",
727
+ "model.visual.blocks.9.norm1.weight": "model-00001-of-00004.safetensors",
728
+ "model.visual.blocks.9.norm2.bias": "model-00002-of-00004.safetensors",
729
+ "model.visual.blocks.9.norm2.weight": "model-00004-of-00004.safetensors",
730
+ "model.visual.deepstack_merger_list.0.linear_fc1.bias": "model-00001-of-00004.safetensors",
731
+ "model.visual.deepstack_merger_list.0.linear_fc1.weight": "model-00002-of-00004.safetensors",
732
+ "model.visual.deepstack_merger_list.0.linear_fc2.bias": "model-00003-of-00004.safetensors",
733
+ "model.visual.deepstack_merger_list.0.linear_fc2.weight": "model-00001-of-00004.safetensors",
734
+ "model.visual.deepstack_merger_list.0.norm.bias": "model-00003-of-00004.safetensors",
735
+ "model.visual.deepstack_merger_list.0.norm.weight": "model-00001-of-00004.safetensors",
736
+ "model.visual.deepstack_merger_list.1.linear_fc1.bias": "model-00001-of-00004.safetensors",
737
+ "model.visual.deepstack_merger_list.1.linear_fc1.weight": "model-00003-of-00004.safetensors",
738
+ "model.visual.deepstack_merger_list.1.linear_fc2.bias": "model-00004-of-00004.safetensors",
739
+ "model.visual.deepstack_merger_list.1.linear_fc2.weight": "model-00003-of-00004.safetensors",
740
+ "model.visual.deepstack_merger_list.1.norm.bias": "model-00003-of-00004.safetensors",
741
+ "model.visual.deepstack_merger_list.1.norm.weight": "model-00003-of-00004.safetensors",
742
+ "model.visual.deepstack_merger_list.2.linear_fc1.bias": "model-00002-of-00004.safetensors",
743
+ "model.visual.deepstack_merger_list.2.linear_fc1.weight": "model-00002-of-00004.safetensors",
744
+ "model.visual.deepstack_merger_list.2.linear_fc2.bias": "model-00002-of-00004.safetensors",
745
+ "model.visual.deepstack_merger_list.2.linear_fc2.weight": "model-00001-of-00004.safetensors",
746
+ "model.visual.deepstack_merger_list.2.norm.bias": "model-00002-of-00004.safetensors",
747
+ "model.visual.deepstack_merger_list.2.norm.weight": "model-00001-of-00004.safetensors",
748
+ "model.visual.merger.linear_fc1.bias": "model-00001-of-00004.safetensors",
749
+ "model.visual.merger.linear_fc1.weight": "model-00002-of-00004.safetensors",
750
+ "model.visual.merger.linear_fc2.bias": "model-00003-of-00004.safetensors",
751
+ "model.visual.merger.linear_fc2.weight": "model-00001-of-00004.safetensors",
752
+ "model.visual.merger.norm.bias": "model-00001-of-00004.safetensors",
753
+ "model.visual.merger.norm.weight": "model-00003-of-00004.safetensors",
754
+ "model.visual.patch_embed.proj.bias": "model-00003-of-00004.safetensors",
755
+ "model.visual.patch_embed.proj.weight": "model-00001-of-00004.safetensors",
756
+ "model.visual.pos_embed.weight": "model-00004-of-00004.safetensors"
757
+ }
758
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": null,
3
+ "data_format": "channels_first",
4
+ "default_to_square": true,
5
+ "device": null,
6
+ "disable_grouping": null,
7
+ "do_center_crop": null,
8
+ "do_convert_rgb": true,
9
+ "do_normalize": true,
10
+ "do_pad": null,
11
+ "do_rescale": true,
12
+ "do_resize": true,
13
+ "image_mean": [
14
+ 0.5,
15
+ 0.5,
16
+ 0.5
17
+ ],
18
+ "image_processor_type": "Qwen2VLImageProcessorFast",
19
+ "image_std": [
20
+ 0.5,
21
+ 0.5,
22
+ 0.5
23
+ ],
24
+ "input_data_format": null,
25
+ "max_pixels": null,
26
+ "merge_size": 2,
27
+ "min_pixels": null,
28
+ "pad_size": null,
29
+ "patch_size": 16,
30
+ "processor_class": "Qwen3VLProcessor",
31
+ "resample": 3,
32
+ "rescale_factor": 0.00392156862745098,
33
+ "return_tensors": null,
34
+ "size": {
35
+ "longest_edge": 16777216,
36
+ "shortest_edge": 65536
37
+ },
38
+ "temporal_patch_size": 2
39
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,1024 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<action>",
4
+ "</action>",
5
+ "<FWD>",
6
+ "<LEFT>",
7
+ "<RIGHT>",
8
+ "<STOP>",
9
+ "<0>",
10
+ "<1>",
11
+ "<2>",
12
+ "<3>",
13
+ "<4>",
14
+ "<5>",
15
+ "<6>",
16
+ "<7>",
17
+ "<8>",
18
+ "<9>",
19
+ "<10>",
20
+ "<11>",
21
+ "<12>",
22
+ "<13>",
23
+ "<14>",
24
+ "<15>",
25
+ "<16>",
26
+ "<17>",
27
+ "<18>",
28
+ "<19>",
29
+ "<20>",
30
+ "<21>",
31
+ "<22>",
32
+ "<23>",
33
+ "<24>",
34
+ "<25>",
35
+ "<26>",
36
+ "<27>",
37
+ "<28>",
38
+ "<29>",
39
+ "<30>",
40
+ "<31>",
41
+ "<32>",
42
+ "<33>",
43
+ "<34>",
44
+ "<35>",
45
+ "<36>",
46
+ "<37>",
47
+ "<38>",
48
+ "<39>",
49
+ "<40>",
50
+ "<41>",
51
+ "<42>",
52
+ "<43>",
53
+ "<44>",
54
+ "<45>",
55
+ "<46>",
56
+ "<47>",
57
+ "<48>",
58
+ "<49>",
59
+ "<50>",
60
+ "<51>",
61
+ "<52>",
62
+ "<53>",
63
+ "<54>",
64
+ "<55>",
65
+ "<56>",
66
+ "<57>",
67
+ "<58>",
68
+ "<59>",
69
+ "<60>",
70
+ "<61>",
71
+ "<62>",
72
+ "<63>",
73
+ "<64>",
74
+ "<65>",
75
+ "<66>",
76
+ "<67>",
77
+ "<68>",
78
+ "<69>",
79
+ "<70>",
80
+ "<71>",
81
+ "<72>",
82
+ "<73>",
83
+ "<74>",
84
+ "<75>",
85
+ "<76>",
86
+ "<77>",
87
+ "<78>",
88
+ "<79>",
89
+ "<80>",
90
+ "<81>",
91
+ "<82>",
92
+ "<83>",
93
+ "<84>",
94
+ "<85>",
95
+ "<86>",
96
+ "<87>",
97
+ "<88>",
98
+ "<89>",
99
+ "<90>",
100
+ "<91>",
101
+ "<92>",
102
+ "<93>",
103
+ "<94>",
104
+ "<95>",
105
+ "<96>",
106
+ "<97>",
107
+ "<98>",
108
+ "<99>",
109
+ "<100>",
110
+ "<101>",
111
+ "<102>",
112
+ "<103>",
113
+ "<104>",
114
+ "<105>",
115
+ "<106>",
116
+ "<107>",
117
+ "<108>",
118
+ "<109>",
119
+ "<110>",
120
+ "<111>",
121
+ "<112>",
122
+ "<113>",
123
+ "<114>",
124
+ "<115>",
125
+ "<116>",
126
+ "<117>",
127
+ "<118>",
128
+ "<119>",
129
+ "<120>",
130
+ "<121>",
131
+ "<122>",
132
+ "<123>",
133
+ "<124>",
134
+ "<125>",
135
+ "<126>",
136
+ "<127>",
137
+ "<128>",
138
+ "<129>",
139
+ "<130>",
140
+ "<131>",
141
+ "<132>",
142
+ "<133>",
143
+ "<134>",
144
+ "<135>",
145
+ "<136>",
146
+ "<137>",
147
+ "<138>",
148
+ "<139>",
149
+ "<140>",
150
+ "<141>",
151
+ "<142>",
152
+ "<143>",
153
+ "<144>",
154
+ "<145>",
155
+ "<146>",
156
+ "<147>",
157
+ "<148>",
158
+ "<149>",
159
+ "<150>",
160
+ "<151>",
161
+ "<152>",
162
+ "<153>",
163
+ "<154>",
164
+ "<155>",
165
+ "<156>",
166
+ "<157>",
167
+ "<158>",
168
+ "<159>",
169
+ "<160>",
170
+ "<161>",
171
+ "<162>",
172
+ "<163>",
173
+ "<164>",
174
+ "<165>",
175
+ "<166>",
176
+ "<167>",
177
+ "<168>",
178
+ "<169>",
179
+ "<170>",
180
+ "<171>",
181
+ "<172>",
182
+ "<173>",
183
+ "<174>",
184
+ "<175>",
185
+ "<176>",
186
+ "<177>",
187
+ "<178>",
188
+ "<179>",
189
+ "<180>",
190
+ "<181>",
191
+ "<182>",
192
+ "<183>",
193
+ "<184>",
194
+ "<185>",
195
+ "<186>",
196
+ "<187>",
197
+ "<188>",
198
+ "<189>",
199
+ "<190>",
200
+ "<191>",
201
+ "<192>",
202
+ "<193>",
203
+ "<194>",
204
+ "<195>",
205
+ "<196>",
206
+ "<197>",
207
+ "<198>",
208
+ "<199>",
209
+ "<200>",
210
+ "<201>",
211
+ "<202>",
212
+ "<203>",
213
+ "<204>",
214
+ "<205>",
215
+ "<206>",
216
+ "<207>",
217
+ "<208>",
218
+ "<209>",
219
+ "<210>",
220
+ "<211>",
221
+ "<212>",
222
+ "<213>",
223
+ "<214>",
224
+ "<215>",
225
+ "<216>",
226
+ "<217>",
227
+ "<218>",
228
+ "<219>",
229
+ "<220>",
230
+ "<221>",
231
+ "<222>",
232
+ "<223>",
233
+ "<224>",
234
+ "<225>",
235
+ "<226>",
236
+ "<227>",
237
+ "<228>",
238
+ "<229>",
239
+ "<230>",
240
+ "<231>",
241
+ "<232>",
242
+ "<233>",
243
+ "<234>",
244
+ "<235>",
245
+ "<236>",
246
+ "<237>",
247
+ "<238>",
248
+ "<239>",
249
+ "<240>",
250
+ "<241>",
251
+ "<242>",
252
+ "<243>",
253
+ "<244>",
254
+ "<245>",
255
+ "<246>",
256
+ "<247>",
257
+ "<248>",
258
+ "<249>",
259
+ "<250>",
260
+ "<251>",
261
+ "<252>",
262
+ "<253>",
263
+ "<254>",
264
+ "<255>",
265
+ "<256>",
266
+ "<257>",
267
+ "<258>",
268
+ "<259>",
269
+ "<260>",
270
+ "<261>",
271
+ "<262>",
272
+ "<263>",
273
+ "<264>",
274
+ "<265>",
275
+ "<266>",
276
+ "<267>",
277
+ "<268>",
278
+ "<269>",
279
+ "<270>",
280
+ "<271>",
281
+ "<272>",
282
+ "<273>",
283
+ "<274>",
284
+ "<275>",
285
+ "<276>",
286
+ "<277>",
287
+ "<278>",
288
+ "<279>",
289
+ "<280>",
290
+ "<281>",
291
+ "<282>",
292
+ "<283>",
293
+ "<284>",
294
+ "<285>",
295
+ "<286>",
296
+ "<287>",
297
+ "<288>",
298
+ "<289>",
299
+ "<290>",
300
+ "<291>",
301
+ "<292>",
302
+ "<293>",
303
+ "<294>",
304
+ "<295>",
305
+ "<296>",
306
+ "<297>",
307
+ "<298>",
308
+ "<299>",
309
+ "<300>",
310
+ "<301>",
311
+ "<302>",
312
+ "<303>",
313
+ "<304>",
314
+ "<305>",
315
+ "<306>",
316
+ "<307>",
317
+ "<308>",
318
+ "<309>",
319
+ "<310>",
320
+ "<311>",
321
+ "<312>",
322
+ "<313>",
323
+ "<314>",
324
+ "<315>",
325
+ "<316>",
326
+ "<317>",
327
+ "<318>",
328
+ "<319>",
329
+ "<320>",
330
+ "<321>",
331
+ "<322>",
332
+ "<323>",
333
+ "<324>",
334
+ "<325>",
335
+ "<326>",
336
+ "<327>",
337
+ "<328>",
338
+ "<329>",
339
+ "<330>",
340
+ "<331>",
341
+ "<332>",
342
+ "<333>",
343
+ "<334>",
344
+ "<335>",
345
+ "<336>",
346
+ "<337>",
347
+ "<338>",
348
+ "<339>",
349
+ "<340>",
350
+ "<341>",
351
+ "<342>",
352
+ "<343>",
353
+ "<344>",
354
+ "<345>",
355
+ "<346>",
356
+ "<347>",
357
+ "<348>",
358
+ "<349>",
359
+ "<350>",
360
+ "<351>",
361
+ "<352>",
362
+ "<353>",
363
+ "<354>",
364
+ "<355>",
365
+ "<356>",
366
+ "<357>",
367
+ "<358>",
368
+ "<359>",
369
+ "<360>",
370
+ "<361>",
371
+ "<362>",
372
+ "<363>",
373
+ "<364>",
374
+ "<365>",
375
+ "<366>",
376
+ "<367>",
377
+ "<368>",
378
+ "<369>",
379
+ "<370>",
380
+ "<371>",
381
+ "<372>",
382
+ "<373>",
383
+ "<374>",
384
+ "<375>",
385
+ "<376>",
386
+ "<377>",
387
+ "<378>",
388
+ "<379>",
389
+ "<380>",
390
+ "<381>",
391
+ "<382>",
392
+ "<383>",
393
+ "<384>",
394
+ "<385>",
395
+ "<386>",
396
+ "<387>",
397
+ "<388>",
398
+ "<389>",
399
+ "<390>",
400
+ "<391>",
401
+ "<392>",
402
+ "<393>",
403
+ "<394>",
404
+ "<395>",
405
+ "<396>",
406
+ "<397>",
407
+ "<398>",
408
+ "<399>",
409
+ "<400>",
410
+ "<401>",
411
+ "<402>",
412
+ "<403>",
413
+ "<404>",
414
+ "<405>",
415
+ "<406>",
416
+ "<407>",
417
+ "<408>",
418
+ "<409>",
419
+ "<410>",
420
+ "<411>",
421
+ "<412>",
422
+ "<413>",
423
+ "<414>",
424
+ "<415>",
425
+ "<416>",
426
+ "<417>",
427
+ "<418>",
428
+ "<419>",
429
+ "<420>",
430
+ "<421>",
431
+ "<422>",
432
+ "<423>",
433
+ "<424>",
434
+ "<425>",
435
+ "<426>",
436
+ "<427>",
437
+ "<428>",
438
+ "<429>",
439
+ "<430>",
440
+ "<431>",
441
+ "<432>",
442
+ "<433>",
443
+ "<434>",
444
+ "<435>",
445
+ "<436>",
446
+ "<437>",
447
+ "<438>",
448
+ "<439>",
449
+ "<440>",
450
+ "<441>",
451
+ "<442>",
452
+ "<443>",
453
+ "<444>",
454
+ "<445>",
455
+ "<446>",
456
+ "<447>",
457
+ "<448>",
458
+ "<449>",
459
+ "<450>",
460
+ "<451>",
461
+ "<452>",
462
+ "<453>",
463
+ "<454>",
464
+ "<455>",
465
+ "<456>",
466
+ "<457>",
467
+ "<458>",
468
+ "<459>",
469
+ "<460>",
470
+ "<461>",
471
+ "<462>",
472
+ "<463>",
473
+ "<464>",
474
+ "<465>",
475
+ "<466>",
476
+ "<467>",
477
+ "<468>",
478
+ "<469>",
479
+ "<470>",
480
+ "<471>",
481
+ "<472>",
482
+ "<473>",
483
+ "<474>",
484
+ "<475>",
485
+ "<476>",
486
+ "<477>",
487
+ "<478>",
488
+ "<479>",
489
+ "<480>",
490
+ "<481>",
491
+ "<482>",
492
+ "<483>",
493
+ "<484>",
494
+ "<485>",
495
+ "<486>",
496
+ "<487>",
497
+ "<488>",
498
+ "<489>",
499
+ "<490>",
500
+ "<491>",
501
+ "<492>",
502
+ "<493>",
503
+ "<494>",
504
+ "<495>",
505
+ "<496>",
506
+ "<497>",
507
+ "<498>",
508
+ "<499>",
509
+ "<500>",
510
+ "<501>",
511
+ "<502>",
512
+ "<503>",
513
+ "<504>",
514
+ "<505>",
515
+ "<506>",
516
+ "<507>",
517
+ "<508>",
518
+ "<509>",
519
+ "<510>",
520
+ "<511>",
521
+ "<512>",
522
+ "<513>",
523
+ "<514>",
524
+ "<515>",
525
+ "<516>",
526
+ "<517>",
527
+ "<518>",
528
+ "<519>",
529
+ "<520>",
530
+ "<521>",
531
+ "<522>",
532
+ "<523>",
533
+ "<524>",
534
+ "<525>",
535
+ "<526>",
536
+ "<527>",
537
+ "<528>",
538
+ "<529>",
539
+ "<530>",
540
+ "<531>",
541
+ "<532>",
542
+ "<533>",
543
+ "<534>",
544
+ "<535>",
545
+ "<536>",
546
+ "<537>",
547
+ "<538>",
548
+ "<539>",
549
+ "<540>",
550
+ "<541>",
551
+ "<542>",
552
+ "<543>",
553
+ "<544>",
554
+ "<545>",
555
+ "<546>",
556
+ "<547>",
557
+ "<548>",
558
+ "<549>",
559
+ "<550>",
560
+ "<551>",
561
+ "<552>",
562
+ "<553>",
563
+ "<554>",
564
+ "<555>",
565
+ "<556>",
566
+ "<557>",
567
+ "<558>",
568
+ "<559>",
569
+ "<560>",
570
+ "<561>",
571
+ "<562>",
572
+ "<563>",
573
+ "<564>",
574
+ "<565>",
575
+ "<566>",
576
+ "<567>",
577
+ "<568>",
578
+ "<569>",
579
+ "<570>",
580
+ "<571>",
581
+ "<572>",
582
+ "<573>",
583
+ "<574>",
584
+ "<575>",
585
+ "<576>",
586
+ "<577>",
587
+ "<578>",
588
+ "<579>",
589
+ "<580>",
590
+ "<581>",
591
+ "<582>",
592
+ "<583>",
593
+ "<584>",
594
+ "<585>",
595
+ "<586>",
596
+ "<587>",
597
+ "<588>",
598
+ "<589>",
599
+ "<590>",
600
+ "<591>",
601
+ "<592>",
602
+ "<593>",
603
+ "<594>",
604
+ "<595>",
605
+ "<596>",
606
+ "<597>",
607
+ "<598>",
608
+ "<599>",
609
+ "<600>",
610
+ "<601>",
611
+ "<602>",
612
+ "<603>",
613
+ "<604>",
614
+ "<605>",
615
+ "<606>",
616
+ "<607>",
617
+ "<608>",
618
+ "<609>",
619
+ "<610>",
620
+ "<611>",
621
+ "<612>",
622
+ "<613>",
623
+ "<614>",
624
+ "<615>",
625
+ "<616>",
626
+ "<617>",
627
+ "<618>",
628
+ "<619>",
629
+ "<620>",
630
+ "<621>",
631
+ "<622>",
632
+ "<623>",
633
+ "<624>",
634
+ "<625>",
635
+ "<626>",
636
+ "<627>",
637
+ "<628>",
638
+ "<629>",
639
+ "<630>",
640
+ "<631>",
641
+ "<632>",
642
+ "<633>",
643
+ "<634>",
644
+ "<635>",
645
+ "<636>",
646
+ "<637>",
647
+ "<638>",
648
+ "<639>",
649
+ "<640>",
650
+ "<641>",
651
+ "<642>",
652
+ "<643>",
653
+ "<644>",
654
+ "<645>",
655
+ "<646>",
656
+ "<647>",
657
+ "<648>",
658
+ "<649>",
659
+ "<650>",
660
+ "<651>",
661
+ "<652>",
662
+ "<653>",
663
+ "<654>",
664
+ "<655>",
665
+ "<656>",
666
+ "<657>",
667
+ "<658>",
668
+ "<659>",
669
+ "<660>",
670
+ "<661>",
671
+ "<662>",
672
+ "<663>",
673
+ "<664>",
674
+ "<665>",
675
+ "<666>",
676
+ "<667>",
677
+ "<668>",
678
+ "<669>",
679
+ "<670>",
680
+ "<671>",
681
+ "<672>",
682
+ "<673>",
683
+ "<674>",
684
+ "<675>",
685
+ "<676>",
686
+ "<677>",
687
+ "<678>",
688
+ "<679>",
689
+ "<680>",
690
+ "<681>",
691
+ "<682>",
692
+ "<683>",
693
+ "<684>",
694
+ "<685>",
695
+ "<686>",
696
+ "<687>",
697
+ "<688>",
698
+ "<689>",
699
+ "<690>",
700
+ "<691>",
701
+ "<692>",
702
+ "<693>",
703
+ "<694>",
704
+ "<695>",
705
+ "<696>",
706
+ "<697>",
707
+ "<698>",
708
+ "<699>",
709
+ "<700>",
710
+ "<701>",
711
+ "<702>",
712
+ "<703>",
713
+ "<704>",
714
+ "<705>",
715
+ "<706>",
716
+ "<707>",
717
+ "<708>",
718
+ "<709>",
719
+ "<710>",
720
+ "<711>",
721
+ "<712>",
722
+ "<713>",
723
+ "<714>",
724
+ "<715>",
725
+ "<716>",
726
+ "<717>",
727
+ "<718>",
728
+ "<719>",
729
+ "<720>",
730
+ "<721>",
731
+ "<722>",
732
+ "<723>",
733
+ "<724>",
734
+ "<725>",
735
+ "<726>",
736
+ "<727>",
737
+ "<728>",
738
+ "<729>",
739
+ "<730>",
740
+ "<731>",
741
+ "<732>",
742
+ "<733>",
743
+ "<734>",
744
+ "<735>",
745
+ "<736>",
746
+ "<737>",
747
+ "<738>",
748
+ "<739>",
749
+ "<740>",
750
+ "<741>",
751
+ "<742>",
752
+ "<743>",
753
+ "<744>",
754
+ "<745>",
755
+ "<746>",
756
+ "<747>",
757
+ "<748>",
758
+ "<749>",
759
+ "<750>",
760
+ "<751>",
761
+ "<752>",
762
+ "<753>",
763
+ "<754>",
764
+ "<755>",
765
+ "<756>",
766
+ "<757>",
767
+ "<758>",
768
+ "<759>",
769
+ "<760>",
770
+ "<761>",
771
+ "<762>",
772
+ "<763>",
773
+ "<764>",
774
+ "<765>",
775
+ "<766>",
776
+ "<767>",
777
+ "<768>",
778
+ "<769>",
779
+ "<770>",
780
+ "<771>",
781
+ "<772>",
782
+ "<773>",
783
+ "<774>",
784
+ "<775>",
785
+ "<776>",
786
+ "<777>",
787
+ "<778>",
788
+ "<779>",
789
+ "<780>",
790
+ "<781>",
791
+ "<782>",
792
+ "<783>",
793
+ "<784>",
794
+ "<785>",
795
+ "<786>",
796
+ "<787>",
797
+ "<788>",
798
+ "<789>",
799
+ "<790>",
800
+ "<791>",
801
+ "<792>",
802
+ "<793>",
803
+ "<794>",
804
+ "<795>",
805
+ "<796>",
806
+ "<797>",
807
+ "<798>",
808
+ "<799>",
809
+ "<800>",
810
+ "<801>",
811
+ "<802>",
812
+ "<803>",
813
+ "<804>",
814
+ "<805>",
815
+ "<806>",
816
+ "<807>",
817
+ "<808>",
818
+ "<809>",
819
+ "<810>",
820
+ "<811>",
821
+ "<812>",
822
+ "<813>",
823
+ "<814>",
824
+ "<815>",
825
+ "<816>",
826
+ "<817>",
827
+ "<818>",
828
+ "<819>",
829
+ "<820>",
830
+ "<821>",
831
+ "<822>",
832
+ "<823>",
833
+ "<824>",
834
+ "<825>",
835
+ "<826>",
836
+ "<827>",
837
+ "<828>",
838
+ "<829>",
839
+ "<830>",
840
+ "<831>",
841
+ "<832>",
842
+ "<833>",
843
+ "<834>",
844
+ "<835>",
845
+ "<836>",
846
+ "<837>",
847
+ "<838>",
848
+ "<839>",
849
+ "<840>",
850
+ "<841>",
851
+ "<842>",
852
+ "<843>",
853
+ "<844>",
854
+ "<845>",
855
+ "<846>",
856
+ "<847>",
857
+ "<848>",
858
+ "<849>",
859
+ "<850>",
860
+ "<851>",
861
+ "<852>",
862
+ "<853>",
863
+ "<854>",
864
+ "<855>",
865
+ "<856>",
866
+ "<857>",
867
+ "<858>",
868
+ "<859>",
869
+ "<860>",
870
+ "<861>",
871
+ "<862>",
872
+ "<863>",
873
+ "<864>",
874
+ "<865>",
875
+ "<866>",
876
+ "<867>",
877
+ "<868>",
878
+ "<869>",
879
+ "<870>",
880
+ "<871>",
881
+ "<872>",
882
+ "<873>",
883
+ "<874>",
884
+ "<875>",
885
+ "<876>",
886
+ "<877>",
887
+ "<878>",
888
+ "<879>",
889
+ "<880>",
890
+ "<881>",
891
+ "<882>",
892
+ "<883>",
893
+ "<884>",
894
+ "<885>",
895
+ "<886>",
896
+ "<887>",
897
+ "<888>",
898
+ "<889>",
899
+ "<890>",
900
+ "<891>",
901
+ "<892>",
902
+ "<893>",
903
+ "<894>",
904
+ "<895>",
905
+ "<896>",
906
+ "<897>",
907
+ "<898>",
908
+ "<899>",
909
+ "<900>",
910
+ "<901>",
911
+ "<902>",
912
+ "<903>",
913
+ "<904>",
914
+ "<905>",
915
+ "<906>",
916
+ "<907>",
917
+ "<908>",
918
+ "<909>",
919
+ "<910>",
920
+ "<911>",
921
+ "<912>",
922
+ "<913>",
923
+ "<914>",
924
+ "<915>",
925
+ "<916>",
926
+ "<917>",
927
+ "<918>",
928
+ "<919>",
929
+ "<920>",
930
+ "<921>",
931
+ "<922>",
932
+ "<923>",
933
+ "<924>",
934
+ "<925>",
935
+ "<926>",
936
+ "<927>",
937
+ "<928>",
938
+ "<929>",
939
+ "<930>",
940
+ "<931>",
941
+ "<932>",
942
+ "<933>",
943
+ "<934>",
944
+ "<935>",
945
+ "<936>",
946
+ "<937>",
947
+ "<938>",
948
+ "<939>",
949
+ "<940>",
950
+ "<941>",
951
+ "<942>",
952
+ "<943>",
953
+ "<944>",
954
+ "<945>",
955
+ "<946>",
956
+ "<947>",
957
+ "<948>",
958
+ "<949>",
959
+ "<950>",
960
+ "<951>",
961
+ "<952>",
962
+ "<953>",
963
+ "<954>",
964
+ "<955>",
965
+ "<956>",
966
+ "<957>",
967
+ "<958>",
968
+ "<959>",
969
+ "<960>",
970
+ "<961>",
971
+ "<962>",
972
+ "<963>",
973
+ "<964>",
974
+ "<965>",
975
+ "<966>",
976
+ "<967>",
977
+ "<968>",
978
+ "<969>",
979
+ "<970>",
980
+ "<971>",
981
+ "<972>",
982
+ "<973>",
983
+ "<974>",
984
+ "<975>",
985
+ "<976>",
986
+ "<977>",
987
+ "<978>",
988
+ "<979>",
989
+ "<980>",
990
+ "<981>",
991
+ "<982>",
992
+ "<983>",
993
+ "<984>",
994
+ "<985>",
995
+ "<986>",
996
+ "<987>",
997
+ "<988>",
998
+ "<989>",
999
+ "<990>",
1000
+ "<991>",
1001
+ "<992>",
1002
+ "<993>",
1003
+ "<994>",
1004
+ "<995>",
1005
+ "<996>",
1006
+ "<997>",
1007
+ "<998>",
1008
+ "<999>"
1009
+ ],
1010
+ "eos_token": {
1011
+ "content": "<|im_end|>",
1012
+ "lstrip": false,
1013
+ "normalized": false,
1014
+ "rstrip": false,
1015
+ "single_word": false
1016
+ },
1017
+ "pad_token": {
1018
+ "content": "<|endoftext|>",
1019
+ "lstrip": false,
1020
+ "normalized": false,
1021
+ "rstrip": false,
1022
+ "single_word": false
1023
+ }
1024
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99d80062929e8d36f4ea40ec5527e22cd9a929267a21b3c414a2f4fc4b28a6f2
3
+ size 11605647
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff
 
video_preprocessor_config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": null,
3
+ "data_format": "channels_first",
4
+ "default_to_square": true,
5
+ "device": null,
6
+ "do_center_crop": null,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "do_sample_frames": true,
12
+ "fps": 2,
13
+ "image_mean": [
14
+ 0.5,
15
+ 0.5,
16
+ 0.5
17
+ ],
18
+ "image_std": [
19
+ 0.5,
20
+ 0.5,
21
+ 0.5
22
+ ],
23
+ "input_data_format": null,
24
+ "max_frames": 768,
25
+ "merge_size": 2,
26
+ "min_frames": 4,
27
+ "num_frames": null,
28
+ "pad_size": null,
29
+ "patch_size": 16,
30
+ "processor_class": "Qwen3VLProcessor",
31
+ "resample": 3,
32
+ "rescale_factor": 0.00392156862745098,
33
+ "return_metadata": false,
34
+ "size": {
35
+ "longest_edge": 25165824,
36
+ "shortest_edge": 4096
37
+ },
38
+ "temporal_patch_size": 2,
39
+ "video_metadata": null,
40
+ "video_processor_type": "Qwen3VLVideoProcessor"
41
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff