eustlb HF Staff committed on
Commit
8fffe09
·
verified ·
1 Parent(s): 3348205

Upload model

Browse files
Files changed (2) hide show
  1. config.json +1301 -72
  2. model.safetensors +2 -2
config.json CHANGED
@@ -1,78 +1,1307 @@
1
  {
2
- "model_type": "pe_audio_video",
3
- "audio_video_config": {
4
- "audio_config": {
5
- "dac_config": {
6
- "encoder_hidden_size": 64,
7
- "downsampling_ratios": [
8
- 2,
9
- 8,
10
- 10,
11
- 12
12
- ],
13
- "decoder_hidden_size": 1536,
14
- "n_codebooks": 16,
15
- "codebook_size": 1024,
16
- "codebook_dim": 128,
17
- "quantizer_dropout": 0,
18
- "sampling_rate": 48000
19
- },
20
- "hidden_size": 768,
21
- "intermediate_size": 2048,
22
- "num_hidden_layers": 12,
23
- "num_attention_heads": 6,
24
- "head_dim": 128,
25
- "num_key_value_heads": null,
26
- "hidden_act": "silu",
27
- "max_position_embeddings": 10000,
28
- "initializer_range": 0.02,
29
- "rms_norm_eps": 1e-05,
30
- "rope_parameters": {
31
- "rope_theta": 20000
32
- },
33
- "attention_bias": false,
34
- "attention_dropout": 0.0
 
 
 
 
 
 
 
 
 
 
35
  },
36
- "video_config": {
37
- "vision_config": {
38
- "architecture": "vit_pe_core_large_patch14_336",
39
- "do_pooling": true,
40
- "global_pool": "map",
41
- "initializer_range": 0.02,
42
- "model_args": {},
43
- "num_labels": 1024,
44
- "model_type": "timm_wrapper"
45
- },
46
- "hidden_size": 768,
47
- "intermediate_size": 2048,
48
- "num_hidden_layers": 4,
49
- "num_attention_heads": 6,
50
- "head_dim": 128,
51
- "num_key_value_heads": null,
52
- "hidden_act": "silu",
53
- "max_position_embeddings": 10000,
54
- "initializer_range": 0.02,
55
- "rms_norm_eps": 1e-05,
56
- "rope_parameters": {
57
- "rope_theta": 20000
58
- },
59
- "attention_bias": false,
60
- "attention_dropout": 0.0
61
  },
62
- "hidden_size": 768,
63
- "intermediate_size": 2048,
64
- "num_hidden_layers": 6,
65
- "num_attention_heads": 6,
66
- "head_dim": 128,
67
- "num_key_value_heads": null,
68
- "hidden_act": "silu",
69
- "max_position_embeddings": 10000,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
  "initializer_range": 0.02,
71
- "rms_norm_eps": 1e-05,
72
- "rope_parameters": {
73
- "rope_theta": 20000
74
- },
75
- "attention_bias": false,
76
- "attention_dropout": 0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
77
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
78
  }
 
1
  {
2
+ "architectures": [
3
+ "PeAudioVideoModel"
4
+ ],
5
+ "audio_video_config": {
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "audio_config": {
9
+ "_name_or_path": "",
10
+ "add_cross_attention": false,
11
+ "architectures": null,
12
+ "attention_bias": false,
13
+ "attention_dropout": 0.0,
14
+ "bos_token_id": null,
15
+ "chunk_size_feed_forward": 0,
16
+ "cross_attention_hidden_size": null,
17
+ "dac_config": {
18
+ "_name_or_path": "",
19
+ "add_cross_attention": false,
20
+ "architectures": null,
21
+ "bos_token_id": null,
22
+ "chunk_size_feed_forward": 0,
23
+ "codebook_dim": 128,
24
+ "codebook_loss_weight": 1.0,
25
+ "codebook_size": 1024,
26
+ "commitment_loss_weight": 0.25,
27
+ "cross_attention_hidden_size": null,
28
+ "decoder_hidden_size": 1536,
29
+ "decoder_start_token_id": null,
30
+ "downsampling_ratios": [
31
+ 2,
32
+ 8,
33
+ 10,
34
+ 12
35
+ ],
36
+ "dtype": null,
37
+ "encoder_hidden_size": 64,
38
+ "eos_token_id": null,
39
+ "finetuning_task": null,
40
+ "hidden_size": 1024,
41
+ "hop_length": 1920,
42
+ "id2label": {
43
+ "0": "LABEL_0",
44
+ "1": "LABEL_1"
45
  },
46
+ "is_decoder": false,
47
+ "is_encoder_decoder": false,
48
+ "label2id": {
49
+ "LABEL_0": 0,
50
+ "LABEL_1": 1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  },
52
+ "model_type": "dac",
53
+ "n_codebooks": 16,
54
+ "output_attentions": false,
55
+ "output_hidden_states": false,
56
+ "pad_token_id": null,
57
+ "prefix": null,
58
+ "problem_type": null,
59
+ "quantizer_dropout": 0,
60
+ "return_dict": true,
61
+ "sampling_rate": 48000,
62
+ "sep_token_id": null,
63
+ "task_specific_params": null,
64
+ "tie_encoder_decoder": false,
65
+ "tie_word_embeddings": true,
66
+ "tokenizer_class": null,
67
+ "upsampling_ratios": [
68
+ 12,
69
+ 10,
70
+ 8,
71
+ 2
72
+ ]
73
+ },
74
+ "decoder_start_token_id": null,
75
+ "dtype": null,
76
+ "eos_token_id": null,
77
+ "finetuning_task": null,
78
+ "head_dim": 128,
79
+ "hidden_act": "silu",
80
+ "hidden_size": 768,
81
+ "id2label": {
82
+ "0": "LABEL_0",
83
+ "1": "LABEL_1"
84
+ },
85
+ "initializer_range": 0.02,
86
+ "intermediate_size": 2048,
87
+ "is_decoder": false,
88
+ "is_encoder_decoder": false,
89
+ "label2id": {
90
+ "LABEL_0": 0,
91
+ "LABEL_1": 1
92
+ },
93
+ "max_position_embeddings": 10000,
94
+ "model_type": "pe_audio_encoder",
95
+ "num_attention_heads": 6,
96
+ "num_hidden_layers": 12,
97
+ "num_key_value_heads": 6,
98
+ "output_attentions": false,
99
+ "output_hidden_states": false,
100
+ "pad_token_id": null,
101
+ "prefix": null,
102
+ "problem_type": null,
103
+ "return_dict": true,
104
+ "rms_norm_eps": 1e-05,
105
+ "rope_parameters": {
106
+ "rope_theta": 20000,
107
+ "rope_type": "default"
108
+ },
109
+ "sep_token_id": null,
110
+ "task_specific_params": null,
111
+ "tie_encoder_decoder": false,
112
+ "tie_word_embeddings": true,
113
+ "tokenizer_class": null
114
+ },
115
+ "head_dim": 128,
116
+ "hidden_act": "silu",
117
+ "hidden_size": 768,
118
+ "initializer_range": 0.02,
119
+ "intermediate_size": 2048,
120
+ "max_position_embeddings": 10000,
121
+ "model_type": "pe_audio_video_encoder",
122
+ "num_attention_heads": 6,
123
+ "num_hidden_layers": 6,
124
+ "num_key_value_heads": 6,
125
+ "rms_norm_eps": 1e-05,
126
+ "rope_parameters": {
127
+ "rope_theta": 20000,
128
+ "rope_type": "default"
129
+ },
130
+ "video_config": {
131
+ "_name_or_path": "",
132
+ "add_cross_attention": false,
133
+ "architectures": null,
134
+ "attention_bias": false,
135
+ "attention_dropout": 0.0,
136
+ "bos_token_id": null,
137
+ "chunk_size_feed_forward": 0,
138
+ "cross_attention_hidden_size": null,
139
+ "decoder_start_token_id": null,
140
+ "dtype": null,
141
+ "eos_token_id": null,
142
+ "finetuning_task": null,
143
+ "head_dim": 128,
144
+ "hidden_act": "silu",
145
+ "hidden_size": 768,
146
+ "id2label": {
147
+ "0": "LABEL_0",
148
+ "1": "LABEL_1"
149
+ },
150
+ "initializer_range": 0.02,
151
+ "intermediate_size": 2048,
152
+ "is_decoder": false,
153
+ "is_encoder_decoder": false,
154
+ "label2id": {
155
+ "LABEL_0": 0,
156
+ "LABEL_1": 1
157
+ },
158
+ "max_position_embeddings": 10000,
159
+ "model_type": "pe_video_encoder",
160
+ "num_attention_heads": 6,
161
+ "num_hidden_layers": 4,
162
+ "num_key_value_heads": 6,
163
+ "output_attentions": false,
164
+ "output_hidden_states": false,
165
+ "pad_token_id": null,
166
+ "prefix": null,
167
+ "problem_type": null,
168
+ "return_dict": true,
169
+ "rms_norm_eps": 1e-05,
170
+ "rope_parameters": {
171
+ "rope_theta": 20000,
172
+ "rope_type": "default"
173
+ },
174
+ "sep_token_id": null,
175
+ "task_specific_params": null,
176
+ "tie_encoder_decoder": false,
177
+ "tie_word_embeddings": true,
178
+ "tokenizer_class": null,
179
+ "vision_config": {
180
+ "_name_or_path": "",
181
+ "add_cross_attention": false,
182
+ "architecture": "vit_pe_core_large_patch14_336",
183
+ "architectures": null,
184
+ "bos_token_id": null,
185
+ "chunk_size_feed_forward": 0,
186
+ "cross_attention_hidden_size": null,
187
+ "decoder_start_token_id": null,
188
+ "do_pooling": true,
189
+ "dtype": null,
190
+ "eos_token_id": null,
191
+ "finetuning_task": null,
192
+ "global_pool": "map",
193
  "initializer_range": 0.02,
194
+ "is_decoder": false,
195
+ "is_encoder_decoder": false,
196
+ "label_names": [
197
+ "LABEL_0",
198
+ "LABEL_1",
199
+ "LABEL_2",
200
+ "LABEL_3",
201
+ "LABEL_4",
202
+ "LABEL_5",
203
+ "LABEL_6",
204
+ "LABEL_7",
205
+ "LABEL_8",
206
+ "LABEL_9",
207
+ "LABEL_10",
208
+ "LABEL_11",
209
+ "LABEL_12",
210
+ "LABEL_13",
211
+ "LABEL_14",
212
+ "LABEL_15",
213
+ "LABEL_16",
214
+ "LABEL_17",
215
+ "LABEL_18",
216
+ "LABEL_19",
217
+ "LABEL_20",
218
+ "LABEL_21",
219
+ "LABEL_22",
220
+ "LABEL_23",
221
+ "LABEL_24",
222
+ "LABEL_25",
223
+ "LABEL_26",
224
+ "LABEL_27",
225
+ "LABEL_28",
226
+ "LABEL_29",
227
+ "LABEL_30",
228
+ "LABEL_31",
229
+ "LABEL_32",
230
+ "LABEL_33",
231
+ "LABEL_34",
232
+ "LABEL_35",
233
+ "LABEL_36",
234
+ "LABEL_37",
235
+ "LABEL_38",
236
+ "LABEL_39",
237
+ "LABEL_40",
238
+ "LABEL_41",
239
+ "LABEL_42",
240
+ "LABEL_43",
241
+ "LABEL_44",
242
+ "LABEL_45",
243
+ "LABEL_46",
244
+ "LABEL_47",
245
+ "LABEL_48",
246
+ "LABEL_49",
247
+ "LABEL_50",
248
+ "LABEL_51",
249
+ "LABEL_52",
250
+ "LABEL_53",
251
+ "LABEL_54",
252
+ "LABEL_55",
253
+ "LABEL_56",
254
+ "LABEL_57",
255
+ "LABEL_58",
256
+ "LABEL_59",
257
+ "LABEL_60",
258
+ "LABEL_61",
259
+ "LABEL_62",
260
+ "LABEL_63",
261
+ "LABEL_64",
262
+ "LABEL_65",
263
+ "LABEL_66",
264
+ "LABEL_67",
265
+ "LABEL_68",
266
+ "LABEL_69",
267
+ "LABEL_70",
268
+ "LABEL_71",
269
+ "LABEL_72",
270
+ "LABEL_73",
271
+ "LABEL_74",
272
+ "LABEL_75",
273
+ "LABEL_76",
274
+ "LABEL_77",
275
+ "LABEL_78",
276
+ "LABEL_79",
277
+ "LABEL_80",
278
+ "LABEL_81",
279
+ "LABEL_82",
280
+ "LABEL_83",
281
+ "LABEL_84",
282
+ "LABEL_85",
283
+ "LABEL_86",
284
+ "LABEL_87",
285
+ "LABEL_88",
286
+ "LABEL_89",
287
+ "LABEL_90",
288
+ "LABEL_91",
289
+ "LABEL_92",
290
+ "LABEL_93",
291
+ "LABEL_94",
292
+ "LABEL_95",
293
+ "LABEL_96",
294
+ "LABEL_97",
295
+ "LABEL_98",
296
+ "LABEL_99",
297
+ "LABEL_100",
298
+ "LABEL_101",
299
+ "LABEL_102",
300
+ "LABEL_103",
301
+ "LABEL_104",
302
+ "LABEL_105",
303
+ "LABEL_106",
304
+ "LABEL_107",
305
+ "LABEL_108",
306
+ "LABEL_109",
307
+ "LABEL_110",
308
+ "LABEL_111",
309
+ "LABEL_112",
310
+ "LABEL_113",
311
+ "LABEL_114",
312
+ "LABEL_115",
313
+ "LABEL_116",
314
+ "LABEL_117",
315
+ "LABEL_118",
316
+ "LABEL_119",
317
+ "LABEL_120",
318
+ "LABEL_121",
319
+ "LABEL_122",
320
+ "LABEL_123",
321
+ "LABEL_124",
322
+ "LABEL_125",
323
+ "LABEL_126",
324
+ "LABEL_127",
325
+ "LABEL_128",
326
+ "LABEL_129",
327
+ "LABEL_130",
328
+ "LABEL_131",
329
+ "LABEL_132",
330
+ "LABEL_133",
331
+ "LABEL_134",
332
+ "LABEL_135",
333
+ "LABEL_136",
334
+ "LABEL_137",
335
+ "LABEL_138",
336
+ "LABEL_139",
337
+ "LABEL_140",
338
+ "LABEL_141",
339
+ "LABEL_142",
340
+ "LABEL_143",
341
+ "LABEL_144",
342
+ "LABEL_145",
343
+ "LABEL_146",
344
+ "LABEL_147",
345
+ "LABEL_148",
346
+ "LABEL_149",
347
+ "LABEL_150",
348
+ "LABEL_151",
349
+ "LABEL_152",
350
+ "LABEL_153",
351
+ "LABEL_154",
352
+ "LABEL_155",
353
+ "LABEL_156",
354
+ "LABEL_157",
355
+ "LABEL_158",
356
+ "LABEL_159",
357
+ "LABEL_160",
358
+ "LABEL_161",
359
+ "LABEL_162",
360
+ "LABEL_163",
361
+ "LABEL_164",
362
+ "LABEL_165",
363
+ "LABEL_166",
364
+ "LABEL_167",
365
+ "LABEL_168",
366
+ "LABEL_169",
367
+ "LABEL_170",
368
+ "LABEL_171",
369
+ "LABEL_172",
370
+ "LABEL_173",
371
+ "LABEL_174",
372
+ "LABEL_175",
373
+ "LABEL_176",
374
+ "LABEL_177",
375
+ "LABEL_178",
376
+ "LABEL_179",
377
+ "LABEL_180",
378
+ "LABEL_181",
379
+ "LABEL_182",
380
+ "LABEL_183",
381
+ "LABEL_184",
382
+ "LABEL_185",
383
+ "LABEL_186",
384
+ "LABEL_187",
385
+ "LABEL_188",
386
+ "LABEL_189",
387
+ "LABEL_190",
388
+ "LABEL_191",
389
+ "LABEL_192",
390
+ "LABEL_193",
391
+ "LABEL_194",
392
+ "LABEL_195",
393
+ "LABEL_196",
394
+ "LABEL_197",
395
+ "LABEL_198",
396
+ "LABEL_199",
397
+ "LABEL_200",
398
+ "LABEL_201",
399
+ "LABEL_202",
400
+ "LABEL_203",
401
+ "LABEL_204",
402
+ "LABEL_205",
403
+ "LABEL_206",
404
+ "LABEL_207",
405
+ "LABEL_208",
406
+ "LABEL_209",
407
+ "LABEL_210",
408
+ "LABEL_211",
409
+ "LABEL_212",
410
+ "LABEL_213",
411
+ "LABEL_214",
412
+ "LABEL_215",
413
+ "LABEL_216",
414
+ "LABEL_217",
415
+ "LABEL_218",
416
+ "LABEL_219",
417
+ "LABEL_220",
418
+ "LABEL_221",
419
+ "LABEL_222",
420
+ "LABEL_223",
421
+ "LABEL_224",
422
+ "LABEL_225",
423
+ "LABEL_226",
424
+ "LABEL_227",
425
+ "LABEL_228",
426
+ "LABEL_229",
427
+ "LABEL_230",
428
+ "LABEL_231",
429
+ "LABEL_232",
430
+ "LABEL_233",
431
+ "LABEL_234",
432
+ "LABEL_235",
433
+ "LABEL_236",
434
+ "LABEL_237",
435
+ "LABEL_238",
436
+ "LABEL_239",
437
+ "LABEL_240",
438
+ "LABEL_241",
439
+ "LABEL_242",
440
+ "LABEL_243",
441
+ "LABEL_244",
442
+ "LABEL_245",
443
+ "LABEL_246",
444
+ "LABEL_247",
445
+ "LABEL_248",
446
+ "LABEL_249",
447
+ "LABEL_250",
448
+ "LABEL_251",
449
+ "LABEL_252",
450
+ "LABEL_253",
451
+ "LABEL_254",
452
+ "LABEL_255",
453
+ "LABEL_256",
454
+ "LABEL_257",
455
+ "LABEL_258",
456
+ "LABEL_259",
457
+ "LABEL_260",
458
+ "LABEL_261",
459
+ "LABEL_262",
460
+ "LABEL_263",
461
+ "LABEL_264",
462
+ "LABEL_265",
463
+ "LABEL_266",
464
+ "LABEL_267",
465
+ "LABEL_268",
466
+ "LABEL_269",
467
+ "LABEL_270",
468
+ "LABEL_271",
469
+ "LABEL_272",
470
+ "LABEL_273",
471
+ "LABEL_274",
472
+ "LABEL_275",
473
+ "LABEL_276",
474
+ "LABEL_277",
475
+ "LABEL_278",
476
+ "LABEL_279",
477
+ "LABEL_280",
478
+ "LABEL_281",
479
+ "LABEL_282",
480
+ "LABEL_283",
481
+ "LABEL_284",
482
+ "LABEL_285",
483
+ "LABEL_286",
484
+ "LABEL_287",
485
+ "LABEL_288",
486
+ "LABEL_289",
487
+ "LABEL_290",
488
+ "LABEL_291",
489
+ "LABEL_292",
490
+ "LABEL_293",
491
+ "LABEL_294",
492
+ "LABEL_295",
493
+ "LABEL_296",
494
+ "LABEL_297",
495
+ "LABEL_298",
496
+ "LABEL_299",
497
+ "LABEL_300",
498
+ "LABEL_301",
499
+ "LABEL_302",
500
+ "LABEL_303",
501
+ "LABEL_304",
502
+ "LABEL_305",
503
+ "LABEL_306",
504
+ "LABEL_307",
505
+ "LABEL_308",
506
+ "LABEL_309",
507
+ "LABEL_310",
508
+ "LABEL_311",
509
+ "LABEL_312",
510
+ "LABEL_313",
511
+ "LABEL_314",
512
+ "LABEL_315",
513
+ "LABEL_316",
514
+ "LABEL_317",
515
+ "LABEL_318",
516
+ "LABEL_319",
517
+ "LABEL_320",
518
+ "LABEL_321",
519
+ "LABEL_322",
520
+ "LABEL_323",
521
+ "LABEL_324",
522
+ "LABEL_325",
523
+ "LABEL_326",
524
+ "LABEL_327",
525
+ "LABEL_328",
526
+ "LABEL_329",
527
+ "LABEL_330",
528
+ "LABEL_331",
529
+ "LABEL_332",
530
+ "LABEL_333",
531
+ "LABEL_334",
532
+ "LABEL_335",
533
+ "LABEL_336",
534
+ "LABEL_337",
535
+ "LABEL_338",
536
+ "LABEL_339",
537
+ "LABEL_340",
538
+ "LABEL_341",
539
+ "LABEL_342",
540
+ "LABEL_343",
541
+ "LABEL_344",
542
+ "LABEL_345",
543
+ "LABEL_346",
544
+ "LABEL_347",
545
+ "LABEL_348",
546
+ "LABEL_349",
547
+ "LABEL_350",
548
+ "LABEL_351",
549
+ "LABEL_352",
550
+ "LABEL_353",
551
+ "LABEL_354",
552
+ "LABEL_355",
553
+ "LABEL_356",
554
+ "LABEL_357",
555
+ "LABEL_358",
556
+ "LABEL_359",
557
+ "LABEL_360",
558
+ "LABEL_361",
559
+ "LABEL_362",
560
+ "LABEL_363",
561
+ "LABEL_364",
562
+ "LABEL_365",
563
+ "LABEL_366",
564
+ "LABEL_367",
565
+ "LABEL_368",
566
+ "LABEL_369",
567
+ "LABEL_370",
568
+ "LABEL_371",
569
+ "LABEL_372",
570
+ "LABEL_373",
571
+ "LABEL_374",
572
+ "LABEL_375",
573
+ "LABEL_376",
574
+ "LABEL_377",
575
+ "LABEL_378",
576
+ "LABEL_379",
577
+ "LABEL_380",
578
+ "LABEL_381",
579
+ "LABEL_382",
580
+ "LABEL_383",
581
+ "LABEL_384",
582
+ "LABEL_385",
583
+ "LABEL_386",
584
+ "LABEL_387",
585
+ "LABEL_388",
586
+ "LABEL_389",
587
+ "LABEL_390",
588
+ "LABEL_391",
589
+ "LABEL_392",
590
+ "LABEL_393",
591
+ "LABEL_394",
592
+ "LABEL_395",
593
+ "LABEL_396",
594
+ "LABEL_397",
595
+ "LABEL_398",
596
+ "LABEL_399",
597
+ "LABEL_400",
598
+ "LABEL_401",
599
+ "LABEL_402",
600
+ "LABEL_403",
601
+ "LABEL_404",
602
+ "LABEL_405",
603
+ "LABEL_406",
604
+ "LABEL_407",
605
+ "LABEL_408",
606
+ "LABEL_409",
607
+ "LABEL_410",
608
+ "LABEL_411",
609
+ "LABEL_412",
610
+ "LABEL_413",
611
+ "LABEL_414",
612
+ "LABEL_415",
613
+ "LABEL_416",
614
+ "LABEL_417",
615
+ "LABEL_418",
616
+ "LABEL_419",
617
+ "LABEL_420",
618
+ "LABEL_421",
619
+ "LABEL_422",
620
+ "LABEL_423",
621
+ "LABEL_424",
622
+ "LABEL_425",
623
+ "LABEL_426",
624
+ "LABEL_427",
625
+ "LABEL_428",
626
+ "LABEL_429",
627
+ "LABEL_430",
628
+ "LABEL_431",
629
+ "LABEL_432",
630
+ "LABEL_433",
631
+ "LABEL_434",
632
+ "LABEL_435",
633
+ "LABEL_436",
634
+ "LABEL_437",
635
+ "LABEL_438",
636
+ "LABEL_439",
637
+ "LABEL_440",
638
+ "LABEL_441",
639
+ "LABEL_442",
640
+ "LABEL_443",
641
+ "LABEL_444",
642
+ "LABEL_445",
643
+ "LABEL_446",
644
+ "LABEL_447",
645
+ "LABEL_448",
646
+ "LABEL_449",
647
+ "LABEL_450",
648
+ "LABEL_451",
649
+ "LABEL_452",
650
+ "LABEL_453",
651
+ "LABEL_454",
652
+ "LABEL_455",
653
+ "LABEL_456",
654
+ "LABEL_457",
655
+ "LABEL_458",
656
+ "LABEL_459",
657
+ "LABEL_460",
658
+ "LABEL_461",
659
+ "LABEL_462",
660
+ "LABEL_463",
661
+ "LABEL_464",
662
+ "LABEL_465",
663
+ "LABEL_466",
664
+ "LABEL_467",
665
+ "LABEL_468",
666
+ "LABEL_469",
667
+ "LABEL_470",
668
+ "LABEL_471",
669
+ "LABEL_472",
670
+ "LABEL_473",
671
+ "LABEL_474",
672
+ "LABEL_475",
673
+ "LABEL_476",
674
+ "LABEL_477",
675
+ "LABEL_478",
676
+ "LABEL_479",
677
+ "LABEL_480",
678
+ "LABEL_481",
679
+ "LABEL_482",
680
+ "LABEL_483",
681
+ "LABEL_484",
682
+ "LABEL_485",
683
+ "LABEL_486",
684
+ "LABEL_487",
685
+ "LABEL_488",
686
+ "LABEL_489",
687
+ "LABEL_490",
688
+ "LABEL_491",
689
+ "LABEL_492",
690
+ "LABEL_493",
691
+ "LABEL_494",
692
+ "LABEL_495",
693
+ "LABEL_496",
694
+ "LABEL_497",
695
+ "LABEL_498",
696
+ "LABEL_499",
697
+ "LABEL_500",
698
+ "LABEL_501",
699
+ "LABEL_502",
700
+ "LABEL_503",
701
+ "LABEL_504",
702
+ "LABEL_505",
703
+ "LABEL_506",
704
+ "LABEL_507",
705
+ "LABEL_508",
706
+ "LABEL_509",
707
+ "LABEL_510",
708
+ "LABEL_511",
709
+ "LABEL_512",
710
+ "LABEL_513",
711
+ "LABEL_514",
712
+ "LABEL_515",
713
+ "LABEL_516",
714
+ "LABEL_517",
715
+ "LABEL_518",
716
+ "LABEL_519",
717
+ "LABEL_520",
718
+ "LABEL_521",
719
+ "LABEL_522",
720
+ "LABEL_523",
721
+ "LABEL_524",
722
+ "LABEL_525",
723
+ "LABEL_526",
724
+ "LABEL_527",
725
+ "LABEL_528",
726
+ "LABEL_529",
727
+ "LABEL_530",
728
+ "LABEL_531",
729
+ "LABEL_532",
730
+ "LABEL_533",
731
+ "LABEL_534",
732
+ "LABEL_535",
733
+ "LABEL_536",
734
+ "LABEL_537",
735
+ "LABEL_538",
736
+ "LABEL_539",
737
+ "LABEL_540",
738
+ "LABEL_541",
739
+ "LABEL_542",
740
+ "LABEL_543",
741
+ "LABEL_544",
742
+ "LABEL_545",
743
+ "LABEL_546",
744
+ "LABEL_547",
745
+ "LABEL_548",
746
+ "LABEL_549",
747
+ "LABEL_550",
748
+ "LABEL_551",
749
+ "LABEL_552",
750
+ "LABEL_553",
751
+ "LABEL_554",
752
+ "LABEL_555",
753
+ "LABEL_556",
754
+ "LABEL_557",
755
+ "LABEL_558",
756
+ "LABEL_559",
757
+ "LABEL_560",
758
+ "LABEL_561",
759
+ "LABEL_562",
760
+ "LABEL_563",
761
+ "LABEL_564",
762
+ "LABEL_565",
763
+ "LABEL_566",
764
+ "LABEL_567",
765
+ "LABEL_568",
766
+ "LABEL_569",
767
+ "LABEL_570",
768
+ "LABEL_571",
769
+ "LABEL_572",
770
+ "LABEL_573",
771
+ "LABEL_574",
772
+ "LABEL_575",
773
+ "LABEL_576",
774
+ "LABEL_577",
775
+ "LABEL_578",
776
+ "LABEL_579",
777
+ "LABEL_580",
778
+ "LABEL_581",
779
+ "LABEL_582",
780
+ "LABEL_583",
781
+ "LABEL_584",
782
+ "LABEL_585",
783
+ "LABEL_586",
784
+ "LABEL_587",
785
+ "LABEL_588",
786
+ "LABEL_589",
787
+ "LABEL_590",
788
+ "LABEL_591",
789
+ "LABEL_592",
790
+ "LABEL_593",
791
+ "LABEL_594",
792
+ "LABEL_595",
793
+ "LABEL_596",
794
+ "LABEL_597",
795
+ "LABEL_598",
796
+ "LABEL_599",
797
+ "LABEL_600",
798
+ "LABEL_601",
799
+ "LABEL_602",
800
+ "LABEL_603",
801
+ "LABEL_604",
802
+ "LABEL_605",
803
+ "LABEL_606",
804
+ "LABEL_607",
805
+ "LABEL_608",
806
+ "LABEL_609",
807
+ "LABEL_610",
808
+ "LABEL_611",
809
+ "LABEL_612",
810
+ "LABEL_613",
811
+ "LABEL_614",
812
+ "LABEL_615",
813
+ "LABEL_616",
814
+ "LABEL_617",
815
+ "LABEL_618",
816
+ "LABEL_619",
817
+ "LABEL_620",
818
+ "LABEL_621",
819
+ "LABEL_622",
820
+ "LABEL_623",
821
+ "LABEL_624",
822
+ "LABEL_625",
823
+ "LABEL_626",
824
+ "LABEL_627",
825
+ "LABEL_628",
826
+ "LABEL_629",
827
+ "LABEL_630",
828
+ "LABEL_631",
829
+ "LABEL_632",
830
+ "LABEL_633",
831
+ "LABEL_634",
832
+ "LABEL_635",
833
+ "LABEL_636",
834
+ "LABEL_637",
835
+ "LABEL_638",
836
+ "LABEL_639",
837
+ "LABEL_640",
838
+ "LABEL_641",
839
+ "LABEL_642",
840
+ "LABEL_643",
841
+ "LABEL_644",
842
+ "LABEL_645",
843
+ "LABEL_646",
844
+ "LABEL_647",
845
+ "LABEL_648",
846
+ "LABEL_649",
847
+ "LABEL_650",
848
+ "LABEL_651",
849
+ "LABEL_652",
850
+ "LABEL_653",
851
+ "LABEL_654",
852
+ "LABEL_655",
853
+ "LABEL_656",
854
+ "LABEL_657",
855
+ "LABEL_658",
856
+ "LABEL_659",
857
+ "LABEL_660",
858
+ "LABEL_661",
859
+ "LABEL_662",
860
+ "LABEL_663",
861
+ "LABEL_664",
862
+ "LABEL_665",
863
+ "LABEL_666",
864
+ "LABEL_667",
865
+ "LABEL_668",
866
+ "LABEL_669",
867
+ "LABEL_670",
868
+ "LABEL_671",
869
+ "LABEL_672",
870
+ "LABEL_673",
871
+ "LABEL_674",
872
+ "LABEL_675",
873
+ "LABEL_676",
874
+ "LABEL_677",
875
+ "LABEL_678",
876
+ "LABEL_679",
877
+ "LABEL_680",
878
+ "LABEL_681",
879
+ "LABEL_682",
880
+ "LABEL_683",
881
+ "LABEL_684",
882
+ "LABEL_685",
883
+ "LABEL_686",
884
+ "LABEL_687",
885
+ "LABEL_688",
886
+ "LABEL_689",
887
+ "LABEL_690",
888
+ "LABEL_691",
889
+ "LABEL_692",
890
+ "LABEL_693",
891
+ "LABEL_694",
892
+ "LABEL_695",
893
+ "LABEL_696",
894
+ "LABEL_697",
895
+ "LABEL_698",
896
+ "LABEL_699",
897
+ "LABEL_700",
898
+ "LABEL_701",
899
+ "LABEL_702",
900
+ "LABEL_703",
901
+ "LABEL_704",
902
+ "LABEL_705",
903
+ "LABEL_706",
904
+ "LABEL_707",
905
+ "LABEL_708",
906
+ "LABEL_709",
907
+ "LABEL_710",
908
+ "LABEL_711",
909
+ "LABEL_712",
910
+ "LABEL_713",
911
+ "LABEL_714",
912
+ "LABEL_715",
913
+ "LABEL_716",
914
+ "LABEL_717",
915
+ "LABEL_718",
916
+ "LABEL_719",
917
+ "LABEL_720",
918
+ "LABEL_721",
919
+ "LABEL_722",
920
+ "LABEL_723",
921
+ "LABEL_724",
922
+ "LABEL_725",
923
+ "LABEL_726",
924
+ "LABEL_727",
925
+ "LABEL_728",
926
+ "LABEL_729",
927
+ "LABEL_730",
928
+ "LABEL_731",
929
+ "LABEL_732",
930
+ "LABEL_733",
931
+ "LABEL_734",
932
+ "LABEL_735",
933
+ "LABEL_736",
934
+ "LABEL_737",
935
+ "LABEL_738",
936
+ "LABEL_739",
937
+ "LABEL_740",
938
+ "LABEL_741",
939
+ "LABEL_742",
940
+ "LABEL_743",
941
+ "LABEL_744",
942
+ "LABEL_745",
943
+ "LABEL_746",
944
+ "LABEL_747",
945
+ "LABEL_748",
946
+ "LABEL_749",
947
+ "LABEL_750",
948
+ "LABEL_751",
949
+ "LABEL_752",
950
+ "LABEL_753",
951
+ "LABEL_754",
952
+ "LABEL_755",
953
+ "LABEL_756",
954
+ "LABEL_757",
955
+ "LABEL_758",
956
+ "LABEL_759",
957
+ "LABEL_760",
958
+ "LABEL_761",
959
+ "LABEL_762",
960
+ "LABEL_763",
961
+ "LABEL_764",
962
+ "LABEL_765",
963
+ "LABEL_766",
964
+ "LABEL_767",
965
+ "LABEL_768",
966
+ "LABEL_769",
967
+ "LABEL_770",
968
+ "LABEL_771",
969
+ "LABEL_772",
970
+ "LABEL_773",
971
+ "LABEL_774",
972
+ "LABEL_775",
973
+ "LABEL_776",
974
+ "LABEL_777",
975
+ "LABEL_778",
976
+ "LABEL_779",
977
+ "LABEL_780",
978
+ "LABEL_781",
979
+ "LABEL_782",
980
+ "LABEL_783",
981
+ "LABEL_784",
982
+ "LABEL_785",
983
+ "LABEL_786",
984
+ "LABEL_787",
985
+ "LABEL_788",
986
+ "LABEL_789",
987
+ "LABEL_790",
988
+ "LABEL_791",
989
+ "LABEL_792",
990
+ "LABEL_793",
991
+ "LABEL_794",
992
+ "LABEL_795",
993
+ "LABEL_796",
994
+ "LABEL_797",
995
+ "LABEL_798",
996
+ "LABEL_799",
997
+ "LABEL_800",
998
+ "LABEL_801",
999
+ "LABEL_802",
1000
+ "LABEL_803",
1001
+ "LABEL_804",
1002
+ "LABEL_805",
1003
+ "LABEL_806",
1004
+ "LABEL_807",
1005
+ "LABEL_808",
1006
+ "LABEL_809",
1007
+ "LABEL_810",
1008
+ "LABEL_811",
1009
+ "LABEL_812",
1010
+ "LABEL_813",
1011
+ "LABEL_814",
1012
+ "LABEL_815",
1013
+ "LABEL_816",
1014
+ "LABEL_817",
1015
+ "LABEL_818",
1016
+ "LABEL_819",
1017
+ "LABEL_820",
1018
+ "LABEL_821",
1019
+ "LABEL_822",
1020
+ "LABEL_823",
1021
+ "LABEL_824",
1022
+ "LABEL_825",
1023
+ "LABEL_826",
1024
+ "LABEL_827",
1025
+ "LABEL_828",
1026
+ "LABEL_829",
1027
+ "LABEL_830",
1028
+ "LABEL_831",
1029
+ "LABEL_832",
1030
+ "LABEL_833",
1031
+ "LABEL_834",
1032
+ "LABEL_835",
1033
+ "LABEL_836",
1034
+ "LABEL_837",
1035
+ "LABEL_838",
1036
+ "LABEL_839",
1037
+ "LABEL_840",
1038
+ "LABEL_841",
1039
+ "LABEL_842",
1040
+ "LABEL_843",
1041
+ "LABEL_844",
1042
+ "LABEL_845",
1043
+ "LABEL_846",
1044
+ "LABEL_847",
1045
+ "LABEL_848",
1046
+ "LABEL_849",
1047
+ "LABEL_850",
1048
+ "LABEL_851",
1049
+ "LABEL_852",
1050
+ "LABEL_853",
1051
+ "LABEL_854",
1052
+ "LABEL_855",
1053
+ "LABEL_856",
1054
+ "LABEL_857",
1055
+ "LABEL_858",
1056
+ "LABEL_859",
1057
+ "LABEL_860",
1058
+ "LABEL_861",
1059
+ "LABEL_862",
1060
+ "LABEL_863",
1061
+ "LABEL_864",
1062
+ "LABEL_865",
1063
+ "LABEL_866",
1064
+ "LABEL_867",
1065
+ "LABEL_868",
1066
+ "LABEL_869",
1067
+ "LABEL_870",
1068
+ "LABEL_871",
1069
+ "LABEL_872",
1070
+ "LABEL_873",
1071
+ "LABEL_874",
1072
+ "LABEL_875",
1073
+ "LABEL_876",
1074
+ "LABEL_877",
1075
+ "LABEL_878",
1076
+ "LABEL_879",
1077
+ "LABEL_880",
1078
+ "LABEL_881",
1079
+ "LABEL_882",
1080
+ "LABEL_883",
1081
+ "LABEL_884",
1082
+ "LABEL_885",
1083
+ "LABEL_886",
1084
+ "LABEL_887",
1085
+ "LABEL_888",
1086
+ "LABEL_889",
1087
+ "LABEL_890",
1088
+ "LABEL_891",
1089
+ "LABEL_892",
1090
+ "LABEL_893",
1091
+ "LABEL_894",
1092
+ "LABEL_895",
1093
+ "LABEL_896",
1094
+ "LABEL_897",
1095
+ "LABEL_898",
1096
+ "LABEL_899",
1097
+ "LABEL_900",
1098
+ "LABEL_901",
1099
+ "LABEL_902",
1100
+ "LABEL_903",
1101
+ "LABEL_904",
1102
+ "LABEL_905",
1103
+ "LABEL_906",
1104
+ "LABEL_907",
1105
+ "LABEL_908",
1106
+ "LABEL_909",
1107
+ "LABEL_910",
1108
+ "LABEL_911",
1109
+ "LABEL_912",
1110
+ "LABEL_913",
1111
+ "LABEL_914",
1112
+ "LABEL_915",
1113
+ "LABEL_916",
1114
+ "LABEL_917",
1115
+ "LABEL_918",
1116
+ "LABEL_919",
1117
+ "LABEL_920",
1118
+ "LABEL_921",
1119
+ "LABEL_922",
1120
+ "LABEL_923",
1121
+ "LABEL_924",
1122
+ "LABEL_925",
1123
+ "LABEL_926",
1124
+ "LABEL_927",
1125
+ "LABEL_928",
1126
+ "LABEL_929",
1127
+ "LABEL_930",
1128
+ "LABEL_931",
1129
+ "LABEL_932",
1130
+ "LABEL_933",
1131
+ "LABEL_934",
1132
+ "LABEL_935",
1133
+ "LABEL_936",
1134
+ "LABEL_937",
1135
+ "LABEL_938",
1136
+ "LABEL_939",
1137
+ "LABEL_940",
1138
+ "LABEL_941",
1139
+ "LABEL_942",
1140
+ "LABEL_943",
1141
+ "LABEL_944",
1142
+ "LABEL_945",
1143
+ "LABEL_946",
1144
+ "LABEL_947",
1145
+ "LABEL_948",
1146
+ "LABEL_949",
1147
+ "LABEL_950",
1148
+ "LABEL_951",
1149
+ "LABEL_952",
1150
+ "LABEL_953",
1151
+ "LABEL_954",
1152
+ "LABEL_955",
1153
+ "LABEL_956",
1154
+ "LABEL_957",
1155
+ "LABEL_958",
1156
+ "LABEL_959",
1157
+ "LABEL_960",
1158
+ "LABEL_961",
1159
+ "LABEL_962",
1160
+ "LABEL_963",
1161
+ "LABEL_964",
1162
+ "LABEL_965",
1163
+ "LABEL_966",
1164
+ "LABEL_967",
1165
+ "LABEL_968",
1166
+ "LABEL_969",
1167
+ "LABEL_970",
1168
+ "LABEL_971",
1169
+ "LABEL_972",
1170
+ "LABEL_973",
1171
+ "LABEL_974",
1172
+ "LABEL_975",
1173
+ "LABEL_976",
1174
+ "LABEL_977",
1175
+ "LABEL_978",
1176
+ "LABEL_979",
1177
+ "LABEL_980",
1178
+ "LABEL_981",
1179
+ "LABEL_982",
1180
+ "LABEL_983",
1181
+ "LABEL_984",
1182
+ "LABEL_985",
1183
+ "LABEL_986",
1184
+ "LABEL_987",
1185
+ "LABEL_988",
1186
+ "LABEL_989",
1187
+ "LABEL_990",
1188
+ "LABEL_991",
1189
+ "LABEL_992",
1190
+ "LABEL_993",
1191
+ "LABEL_994",
1192
+ "LABEL_995",
1193
+ "LABEL_996",
1194
+ "LABEL_997",
1195
+ "LABEL_998",
1196
+ "LABEL_999",
1197
+ "LABEL_1000",
1198
+ "LABEL_1001",
1199
+ "LABEL_1002",
1200
+ "LABEL_1003",
1201
+ "LABEL_1004",
1202
+ "LABEL_1005",
1203
+ "LABEL_1006",
1204
+ "LABEL_1007",
1205
+ "LABEL_1008",
1206
+ "LABEL_1009",
1207
+ "LABEL_1010",
1208
+ "LABEL_1011",
1209
+ "LABEL_1012",
1210
+ "LABEL_1013",
1211
+ "LABEL_1014",
1212
+ "LABEL_1015",
1213
+ "LABEL_1016",
1214
+ "LABEL_1017",
1215
+ "LABEL_1018",
1216
+ "LABEL_1019",
1217
+ "LABEL_1020",
1218
+ "LABEL_1021",
1219
+ "LABEL_1022",
1220
+ "LABEL_1023"
1221
+ ],
1222
+ "model_args": {},
1223
+ "model_type": "timm_wrapper",
1224
+ "num_classes": 1024,
1225
+ "output_attentions": false,
1226
+ "output_hidden_states": false,
1227
+ "pad_token_id": null,
1228
+ "prefix": null,
1229
+ "problem_type": null,
1230
+ "return_dict": true,
1231
+ "sep_token_id": null,
1232
+ "task_specific_params": null,
1233
+ "tie_encoder_decoder": false,
1234
+ "tie_word_embeddings": true,
1235
+ "tokenizer_class": null
1236
+ }
1237
  }
1238
+ },
1239
+ "dtype": "float32",
1240
+ "model_type": "pe_audio_video",
1241
+ "text_config": {
1242
+ "attention_bias": false,
1243
+ "attention_dropout": 0.0,
1244
+ "classifier_activation": "gelu",
1245
+ "classifier_bias": false,
1246
+ "classifier_dropout": 0.0,
1247
+ "classifier_pooling": "cls",
1248
+ "cls_token_id": 50281,
1249
+ "decoder_bias": true,
1250
+ "deterministic_flash_attn": false,
1251
+ "embedding_dropout": 0.0,
1252
+ "global_attn_every_n_layers": 3,
1253
+ "hidden_activation": "gelu",
1254
+ "hidden_size": 1024,
1255
+ "initializer_cutoff_factor": 2.0,
1256
+ "initializer_range": 0.02,
1257
+ "intermediate_size": 2624,
1258
+ "layer_types": [
1259
+ "full_attention",
1260
+ "sliding_attention",
1261
+ "sliding_attention",
1262
+ "full_attention",
1263
+ "sliding_attention",
1264
+ "sliding_attention",
1265
+ "full_attention",
1266
+ "sliding_attention",
1267
+ "sliding_attention",
1268
+ "full_attention",
1269
+ "sliding_attention",
1270
+ "sliding_attention",
1271
+ "full_attention",
1272
+ "sliding_attention",
1273
+ "sliding_attention",
1274
+ "full_attention",
1275
+ "sliding_attention",
1276
+ "sliding_attention",
1277
+ "full_attention",
1278
+ "sliding_attention",
1279
+ "sliding_attention",
1280
+ "full_attention"
1281
+ ],
1282
+ "local_attention": 128,
1283
+ "max_position_embeddings": 8192,
1284
+ "mlp_bias": false,
1285
+ "mlp_dropout": 0.0,
1286
+ "model_type": "modernbert",
1287
+ "norm_bias": false,
1288
+ "norm_eps": 1e-05,
1289
+ "num_attention_heads": 16,
1290
+ "num_hidden_layers": 22,
1291
+ "repad_logits_with_grad": false,
1292
+ "rope_parameters": {
1293
+ "full_attention": {
1294
+ "rope_theta": 160000.0,
1295
+ "rope_type": "default"
1296
+ },
1297
+ "sliding_attention": {
1298
+ "rope_theta": 10000.0,
1299
+ "rope_type": "default"
1300
+ }
1301
+ },
1302
+ "sparse_pred_ignore_index": -100,
1303
+ "sparse_prediction": false,
1304
+ "vocab_size": 50368
1305
+ },
1306
+ "transformers_version": "5.0.0.dev0"
1307
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd492748b94339c873b0d5795cf85a2262f21118f7d57bfb9abc8d61adefa682
3
- size 3388617568
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:522159f858ee6a01ce333ab9f41b317f6565b4ad4137e021905f262e046be66d
3
+ size 3388082648