xiaoyi1734 committed on
Commit
85d4bbf
·
verified ·
1 Parent(s): fcf3e04

Upload merged_model_separated_gemini_90_2000/config.json with huggingface_hub

Browse files
merged_model_separated_gemini_90_2000/config.json ADDED
@@ -0,0 +1,627 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen2_5OmniForConditionalGeneration"
4
+ ],
5
+ "enable_audio_output": true,
6
+ "enable_talker": true,
7
+ "model_type": "qwen2_5_omni",
8
+ "talker_config": {
9
+ "_attn_implementation_autoset": true,
10
+ "_name_or_path": "Qwen2.5-Omni-7B/talker",
11
+ "architectures": [
12
+ "Qwen2OmniTalkerForConditionalGeneration"
13
+ ],
14
+ "attention_dropout": 0.0,
15
+ "audio_end_token_id": 151648,
16
+ "audio_start_token_id": 151647,
17
+ "audio_token_index": 151646,
18
+ "embedding_size": 3584,
19
+ "head_dim": 128,
20
+ "hidden_act": "silu",
21
+ "hidden_size": 896,
22
+ "image_token_index": 151655,
23
+ "init_std": 0.02,
24
+ "initializer_range": 0.02,
25
+ "intermediate_size": 18944,
26
+ "layer_types": [
27
+ "full_attention",
28
+ "full_attention",
29
+ "full_attention",
30
+ "full_attention",
31
+ "full_attention",
32
+ "full_attention",
33
+ "full_attention",
34
+ "full_attention",
35
+ "full_attention",
36
+ "full_attention",
37
+ "full_attention",
38
+ "full_attention",
39
+ "full_attention",
40
+ "full_attention",
41
+ "full_attention",
42
+ "full_attention",
43
+ "full_attention",
44
+ "full_attention",
45
+ "full_attention",
46
+ "full_attention",
47
+ "full_attention",
48
+ "full_attention",
49
+ "full_attention",
50
+ "full_attention"
51
+ ],
52
+ "max_position_embeddings": 32768,
53
+ "max_window_layers": 28,
54
+ "model_type": "qwen2_5_omni_talker",
55
+ "num_attention_heads": 12,
56
+ "num_hidden_layers": 24,
57
+ "num_key_value_heads": 4,
58
+ "position_id_per_seconds": 25,
59
+ "rms_norm_eps": 1e-06,
60
+ "rope_scaling": {
61
+ "mrope_section": [
62
+ 16,
63
+ 24,
64
+ 24
65
+ ],
66
+ "rope_type": "default",
67
+ "type": "default"
68
+ },
69
+ "rope_theta": 1000000.0,
70
+ "seconds_per_chunk": 2,
71
+ "sliding_window": null,
72
+ "spatial_merge_size": 2,
73
+ "torch_dtype": "bfloat16",
74
+ "tts_codec_end_token_id": 8294,
75
+ "tts_codec_mask_token_id": 8296,
76
+ "tts_codec_pad_token_id": 8292,
77
+ "tts_codec_start_token_id": 8293,
78
+ "tts_text_end_token_id": 151861,
79
+ "tts_text_pad_token_id": 151859,
80
+ "tts_text_start_token_id": 151860,
81
+ "use_cache": true,
82
+ "use_sliding_window": false,
83
+ "video_token_index": 151656,
84
+ "vision_end_token_id": 151653,
85
+ "vision_start_token_id": 151652,
86
+ "vocab_size": 8448
87
+ },
88
+ "thinker_config": {
89
+ "_attn_implementation_autoset": true,
90
+ "_name_or_path": "Qwen2.5-Omni-7B/thinker",
91
+ "architectures": [
92
+ "Qwen2OmniNaViTThinkerForConditionalGeneration"
93
+ ],
94
+ "audio_config": {
95
+ "_attn_implementation_autoset": true,
96
+ "_name_or_path": "",
97
+ "activation_dropout": 0.0,
98
+ "activation_function": "gelu",
99
+ "add_cross_attention": false,
100
+ "architectures": null,
101
+ "attention_dropout": 0.0,
102
+ "bad_words_ids": null,
103
+ "begin_suppress_tokens": null,
104
+ "bos_token_id": null,
105
+ "chunk_size_feed_forward": 0,
106
+ "cross_attention_hidden_size": null,
107
+ "d_model": 1280,
108
+ "decoder_start_token_id": null,
109
+ "diversity_penalty": 0.0,
110
+ "do_sample": false,
111
+ "dropout": 0.0,
112
+ "early_stopping": false,
113
+ "encoder_attention_heads": 20,
114
+ "encoder_ffn_dim": 5120,
115
+ "encoder_layerdrop": 0.0,
116
+ "encoder_layers": 32,
117
+ "encoder_no_repeat_ngram_size": 0,
118
+ "eos_token_id": null,
119
+ "exponential_decay_length_penalty": null,
120
+ "finetuning_task": null,
121
+ "forced_bos_token_id": null,
122
+ "forced_eos_token_id": null,
123
+ "id2label": {
124
+ "0": "LABEL_0",
125
+ "1": "LABEL_1"
126
+ },
127
+ "init_std": 0.02,
128
+ "initializer_range": 0.02,
129
+ "is_decoder": false,
130
+ "is_encoder_decoder": false,
131
+ "label2id": {
132
+ "LABEL_0": 0,
133
+ "LABEL_1": 1
134
+ },
135
+ "length_penalty": 1.0,
136
+ "max_length": 20,
137
+ "max_source_positions": 1500,
138
+ "min_length": 0,
139
+ "model_type": "qwen2_5_omni_audio_encoder",
140
+ "n_window": 100,
141
+ "no_repeat_ngram_size": 0,
142
+ "num_beam_groups": 1,
143
+ "num_beams": 1,
144
+ "num_hidden_layers": 32,
145
+ "num_mel_bins": 128,
146
+ "num_return_sequences": 1,
147
+ "output_attentions": false,
148
+ "output_dim": 3584,
149
+ "output_hidden_states": false,
150
+ "output_scores": false,
151
+ "pad_token_id": null,
152
+ "prefix": null,
153
+ "problem_type": null,
154
+ "pruned_heads": {},
155
+ "remove_invalid_values": false,
156
+ "repetition_penalty": 1.0,
157
+ "return_dict": true,
158
+ "return_dict_in_generate": false,
159
+ "scale_embedding": false,
160
+ "sep_token_id": null,
161
+ "suppress_tokens": null,
162
+ "task_specific_params": null,
163
+ "temperature": 1.0,
164
+ "tf_legacy_loss": false,
165
+ "tie_encoder_decoder": false,
166
+ "tie_word_embeddings": true,
167
+ "tokenizer_class": null,
168
+ "top_k": 50,
169
+ "top_p": 1.0,
170
+ "torch_dtype": null,
171
+ "torchscript": false,
172
+ "typical_p": 1.0,
173
+ "use_bfloat16": false
174
+ },
175
+ "audio_end_token_id": 151648,
176
+ "audio_start_token_id": 151647,
177
+ "audio_token_index": 151646,
178
+ "bos_token_id": 151644,
179
+ "eos_token_id": 151645,
180
+ "ignore_index": -100,
181
+ "image_token_index": 151655,
182
+ "init_std": 0.02,
183
+ "initializer_range": 0.02,
184
+ "model_type": "qwen2_5_omni_thinker",
185
+ "pad_token_id": 151643,
186
+ "position_id_per_seconds": 25,
187
+ "seconds_per_chunk": 2,
188
+ "text_config": {
189
+ "_name_or_path": "",
190
+ "add_cross_attention": false,
191
+ "architectures": null,
192
+ "attention_dropout": 0.0,
193
+ "bad_words_ids": null,
194
+ "begin_suppress_tokens": null,
195
+ "bos_token_id": null,
196
+ "chunk_size_feed_forward": 0,
197
+ "cross_attention_hidden_size": null,
198
+ "decoder_start_token_id": null,
199
+ "diversity_penalty": 0.0,
200
+ "do_sample": false,
201
+ "early_stopping": false,
202
+ "encoder_no_repeat_ngram_size": 0,
203
+ "eos_token_id": null,
204
+ "exponential_decay_length_penalty": null,
205
+ "finetuning_task": null,
206
+ "forced_bos_token_id": null,
207
+ "forced_eos_token_id": null,
208
+ "hidden_act": "silu",
209
+ "hidden_size": 3584,
210
+ "id2label": {
211
+ "0": "LABEL_0",
212
+ "1": "LABEL_1"
213
+ },
214
+ "init_std": 0.02,
215
+ "initializer_range": 0.02,
216
+ "intermediate_size": 18944,
217
+ "is_decoder": false,
218
+ "is_encoder_decoder": false,
219
+ "label2id": {
220
+ "LABEL_0": 0,
221
+ "LABEL_1": 1
222
+ },
223
+ "layer_types": [
224
+ "full_attention",
225
+ "full_attention",
226
+ "full_attention",
227
+ "full_attention",
228
+ "full_attention",
229
+ "full_attention",
230
+ "full_attention",
231
+ "full_attention",
232
+ "full_attention",
233
+ "full_attention",
234
+ "full_attention",
235
+ "full_attention",
236
+ "full_attention",
237
+ "full_attention",
238
+ "full_attention",
239
+ "full_attention",
240
+ "full_attention",
241
+ "full_attention",
242
+ "full_attention",
243
+ "full_attention",
244
+ "full_attention",
245
+ "full_attention",
246
+ "full_attention",
247
+ "full_attention",
248
+ "full_attention",
249
+ "full_attention",
250
+ "full_attention",
251
+ "full_attention"
252
+ ],
253
+ "length_penalty": 1.0,
254
+ "max_length": 20,
255
+ "max_position_embeddings": 32768,
256
+ "max_window_layers": 28,
257
+ "min_length": 0,
258
+ "model_type": "qwen2_5_omni_text",
259
+ "no_repeat_ngram_size": 0,
260
+ "num_attention_heads": 28,
261
+ "num_beam_groups": 1,
262
+ "num_beams": 1,
263
+ "num_hidden_layers": 28,
264
+ "num_key_value_heads": 4,
265
+ "num_return_sequences": 1,
266
+ "output_attentions": false,
267
+ "output_hidden_states": false,
268
+ "output_scores": false,
269
+ "pad_token_id": null,
270
+ "prefix": null,
271
+ "problem_type": null,
272
+ "pruned_heads": {},
273
+ "remove_invalid_values": false,
274
+ "repetition_penalty": 1.0,
275
+ "return_dict": true,
276
+ "return_dict_in_generate": false,
277
+ "rms_norm_eps": 1e-06,
278
+ "rope_scaling": {
279
+ "mrope_section": [
280
+ 16,
281
+ 24,
282
+ 24
283
+ ],
284
+ "rope_type": "default",
285
+ "type": "default"
286
+ },
287
+ "rope_theta": 1000000.0,
288
+ "sep_token_id": null,
289
+ "sliding_window": null,
290
+ "suppress_tokens": null,
291
+ "task_specific_params": null,
292
+ "temperature": 1.0,
293
+ "tf_legacy_loss": false,
294
+ "tie_encoder_decoder": false,
295
+ "tie_word_embeddings": false,
296
+ "tokenizer_class": null,
297
+ "top_k": 50,
298
+ "top_p": 1.0,
299
+ "torch_dtype": null,
300
+ "torchscript": false,
301
+ "typical_p": 1.0,
302
+ "use_bfloat16": false,
303
+ "use_cache": true,
304
+ "use_sliding_window": false,
305
+ "vocab_size": 152064
306
+ },
307
+ "torch_dtype": "bfloat16",
308
+ "user_token_id": 872,
309
+ "video_token_index": 151656,
310
+ "vision_config": {
311
+ "_attn_implementation_autoset": true,
312
+ "_name_or_path": "",
313
+ "add_cross_attention": false,
314
+ "architectures": null,
315
+ "bad_words_ids": null,
316
+ "begin_suppress_tokens": null,
317
+ "bos_token_id": null,
318
+ "chunk_size_feed_forward": 0,
319
+ "cross_attention_hidden_size": null,
320
+ "decoder_start_token_id": null,
321
+ "depth": 32,
322
+ "diversity_penalty": 0.0,
323
+ "do_sample": false,
324
+ "early_stopping": false,
325
+ "embed_dim": 1280,
326
+ "encoder_no_repeat_ngram_size": 0,
327
+ "eos_token_id": null,
328
+ "exponential_decay_length_penalty": null,
329
+ "finetuning_task": null,
330
+ "forced_bos_token_id": null,
331
+ "forced_eos_token_id": null,
332
+ "fullatt_block_indexes": [
333
+ 7,
334
+ 15,
335
+ 23,
336
+ 31
337
+ ],
338
+ "hidden_act": "silu",
339
+ "hidden_size": 1280,
340
+ "id2label": {
341
+ "0": "LABEL_0",
342
+ "1": "LABEL_1"
343
+ },
344
+ "in_channels": 3,
345
+ "in_chans": 3,
346
+ "init_std": 0.02,
347
+ "initializer_range": 0.02,
348
+ "intermediate_size": 3420,
349
+ "is_decoder": false,
350
+ "is_encoder_decoder": false,
351
+ "label2id": {
352
+ "LABEL_0": 0,
353
+ "LABEL_1": 1
354
+ },
355
+ "length_penalty": 1.0,
356
+ "max_length": 20,
357
+ "min_length": 0,
358
+ "model_type": "qwen2_5_omni_vision_encoder",
359
+ "no_repeat_ngram_size": 0,
360
+ "num_beam_groups": 1,
361
+ "num_beams": 1,
362
+ "num_heads": 16,
363
+ "num_return_sequences": 1,
364
+ "out_hidden_size": 3584,
365
+ "output_attentions": false,
366
+ "output_hidden_states": false,
367
+ "output_scores": false,
368
+ "pad_token_id": null,
369
+ "patch_size": 14,
370
+ "prefix": null,
371
+ "problem_type": null,
372
+ "pruned_heads": {},
373
+ "remove_invalid_values": false,
374
+ "repetition_penalty": 1.0,
375
+ "return_dict": true,
376
+ "return_dict_in_generate": false,
377
+ "sep_token_id": null,
378
+ "spatial_merge_size": 2,
379
+ "spatial_patch_size": 14,
380
+ "suppress_tokens": null,
381
+ "task_specific_params": null,
382
+ "temperature": 1.0,
383
+ "temporal_patch_size": 2,
384
+ "tf_legacy_loss": false,
385
+ "tie_encoder_decoder": false,
386
+ "tie_word_embeddings": true,
387
+ "tokenizer_class": null,
388
+ "tokens_per_second": 25,
389
+ "top_k": 50,
390
+ "top_p": 1.0,
391
+ "torch_dtype": null,
392
+ "torchscript": false,
393
+ "typical_p": 1.0,
394
+ "use_bfloat16": false,
395
+ "window_size": 112
396
+ },
397
+ "vision_end_token_id": 151653,
398
+ "vision_start_token_id": 151652,
399
+ "vision_token_id": 151654
400
+ },
401
+ "token2wav_config": {
402
+ "_attn_implementation_autoset": true,
403
+ "bigvgan_config": {
404
+ "_attn_implementation_autoset": true,
405
+ "_name_or_path": "",
406
+ "add_cross_attention": false,
407
+ "architectures": null,
408
+ "bad_words_ids": null,
409
+ "begin_suppress_tokens": null,
410
+ "bos_token_id": null,
411
+ "chunk_size_feed_forward": 0,
412
+ "cross_attention_hidden_size": null,
413
+ "decoder_start_token_id": null,
414
+ "diversity_penalty": 0.0,
415
+ "do_sample": false,
416
+ "early_stopping": false,
417
+ "encoder_no_repeat_ngram_size": 0,
418
+ "eos_token_id": null,
419
+ "exponential_decay_length_penalty": null,
420
+ "finetuning_task": null,
421
+ "forced_bos_token_id": null,
422
+ "forced_eos_token_id": null,
423
+ "id2label": {
424
+ "0": "LABEL_0",
425
+ "1": "LABEL_1"
426
+ },
427
+ "is_decoder": false,
428
+ "is_encoder_decoder": false,
429
+ "label2id": {
430
+ "LABEL_0": 0,
431
+ "LABEL_1": 1
432
+ },
433
+ "length_penalty": 1.0,
434
+ "max_length": 20,
435
+ "mel_dim": 80,
436
+ "min_length": 0,
437
+ "model_type": "qwen2_5_omni_bigvgan",
438
+ "no_repeat_ngram_size": 0,
439
+ "num_beam_groups": 1,
440
+ "num_beams": 1,
441
+ "num_return_sequences": 1,
442
+ "output_attentions": false,
443
+ "output_hidden_states": false,
444
+ "output_scores": false,
445
+ "pad_token_id": null,
446
+ "prefix": null,
447
+ "problem_type": null,
448
+ "pruned_heads": {},
449
+ "remove_invalid_values": false,
450
+ "repetition_penalty": 1.0,
451
+ "resblock_dilation_sizes": [
452
+ [
453
+ 1,
454
+ 3,
455
+ 5
456
+ ],
457
+ [
458
+ 1,
459
+ 3,
460
+ 5
461
+ ],
462
+ [
463
+ 1,
464
+ 3,
465
+ 5
466
+ ]
467
+ ],
468
+ "resblock_kernel_sizes": [
469
+ 3,
470
+ 7,
471
+ 11
472
+ ],
473
+ "return_dict": true,
474
+ "return_dict_in_generate": false,
475
+ "sep_token_id": null,
476
+ "suppress_tokens": null,
477
+ "task_specific_params": null,
478
+ "temperature": 1.0,
479
+ "tf_legacy_loss": false,
480
+ "tie_encoder_decoder": false,
481
+ "tie_word_embeddings": true,
482
+ "tokenizer_class": null,
483
+ "top_k": 50,
484
+ "top_p": 1.0,
485
+ "torch_dtype": null,
486
+ "torchscript": false,
487
+ "typical_p": 1.0,
488
+ "upsample_initial_channel": 1536,
489
+ "upsample_kernel_sizes": [
490
+ 11,
491
+ 7,
492
+ 4,
493
+ 4,
494
+ 4,
495
+ 4
496
+ ],
497
+ "upsample_rates": [
498
+ 5,
499
+ 3,
500
+ 2,
501
+ 2,
502
+ 2,
503
+ 2
504
+ ],
505
+ "use_bfloat16": false,
506
+ "use_bias_at_final": false
507
+ },
508
+ "dit_config": {
509
+ "_attn_implementation_autoset": true,
510
+ "_name_or_path": "",
511
+ "add_cross_attention": false,
512
+ "architectures": null,
513
+ "bad_words_ids": null,
514
+ "begin_suppress_tokens": null,
515
+ "block_size": 24,
516
+ "bos_token_id": null,
517
+ "chunk_size_feed_forward": 0,
518
+ "cross_attention_hidden_size": null,
519
+ "decoder_start_token_id": null,
520
+ "depth": 22,
521
+ "dim": 1024,
522
+ "diversity_penalty": 0.0,
523
+ "do_sample": false,
524
+ "dropout": 0.1,
525
+ "early_stopping": false,
526
+ "emb_dim": 512,
527
+ "enc_attention_channels": 64,
528
+ "enc_channels": [
529
+ 256,
530
+ 256,
531
+ 256,
532
+ 256,
533
+ 768
534
+ ],
535
+ "enc_dilations": [
536
+ 1,
537
+ 2,
538
+ 3,
539
+ 4,
540
+ 1
541
+ ],
542
+ "enc_dim": 128,
543
+ "enc_emb_dim": 192,
544
+ "enc_global_context": true,
545
+ "enc_kernel_sizes": [
546
+ 5,
547
+ 3,
548
+ 3,
549
+ 3,
550
+ 1
551
+ ],
552
+ "enc_lin_neurons": 192,
553
+ "enc_res2net_scale": 2,
554
+ "enc_se_channels": 64,
555
+ "encoder_no_repeat_ngram_size": 0,
556
+ "eos_token_id": null,
557
+ "exponential_decay_length_penalty": null,
558
+ "ff_mult": 2,
559
+ "finetuning_task": null,
560
+ "forced_bos_token_id": null,
561
+ "forced_eos_token_id": null,
562
+ "head_dim": 64,
563
+ "heads": 16,
564
+ "hidden_size": 1024,
565
+ "id2label": {
566
+ "0": "LABEL_0",
567
+ "1": "LABEL_1"
568
+ },
569
+ "is_decoder": false,
570
+ "is_encoder_decoder": false,
571
+ "label2id": {
572
+ "LABEL_0": 0,
573
+ "LABEL_1": 1
574
+ },
575
+ "length_penalty": 1.0,
576
+ "look_ahead_layers": [
577
+ 10
578
+ ],
579
+ "look_backward_layers": [
580
+ 0,
581
+ 20
582
+ ],
583
+ "max_length": 20,
584
+ "max_position_embeddings": 32768,
585
+ "mel_dim": 80,
586
+ "min_length": 0,
587
+ "model_type": "qwen2_5_omni_dit",
588
+ "no_repeat_ngram_size": 0,
589
+ "num_attention_heads": 16,
590
+ "num_beam_groups": 1,
591
+ "num_beams": 1,
592
+ "num_embeds": 8193,
593
+ "num_hidden_layers": 22,
594
+ "num_return_sequences": 1,
595
+ "output_attentions": false,
596
+ "output_hidden_states": false,
597
+ "output_scores": false,
598
+ "pad_token_id": null,
599
+ "prefix": null,
600
+ "problem_type": null,
601
+ "pruned_heads": {},
602
+ "remove_invalid_values": false,
603
+ "repeats": 2,
604
+ "repetition_penalty": 1.0,
605
+ "return_dict": true,
606
+ "return_dict_in_generate": false,
607
+ "rope_theta": 10000.0,
608
+ "sep_token_id": null,
609
+ "suppress_tokens": null,
610
+ "task_specific_params": null,
611
+ "temperature": 1.0,
612
+ "tf_legacy_loss": false,
613
+ "tie_encoder_decoder": false,
614
+ "tie_word_embeddings": true,
615
+ "tokenizer_class": null,
616
+ "top_k": 50,
617
+ "top_p": 1.0,
618
+ "torch_dtype": "float32",
619
+ "torchscript": false,
620
+ "typical_p": 1.0,
621
+ "use_bfloat16": false
622
+ },
623
+ "model_type": "qwen2_5_omni_token2wav"
624
+ },
625
+ "torch_dtype": "bfloat16",
626
+ "transformers_version": "4.55.4"
627
+ }