{
  "architectures": [
    "EncoderTuningModel"
  ],
  "audio_encoder_name": "models/flamingo_qwen/flamingo_qwen2_moe.py",
  "audio_encoder_params": {
    "adapter_dropout": 0.1,
    "adapter_type": "adapter",
    "cls_task_ids": "None",
    "fusion_mode": "moe_swiglu",
    "num_tasks": 12,
    "qformer_d_model": 1024,
    "qformer_drop_path": 0.05,
    "qformer_dropout": 0.1,
    "qformer_heads": 16,
    "qformer_layers": 6,
    "qformer_num_global_queries": 32,
    "qformer_num_local_queries": 96,
    "qformer_pool_stride": 4,
    "task_cond": false
  },
  "decoder_type": "/private/models/SmolLM2-135M",
  "dtype": "float32",
  "lora_alpha": 32,
  "lora_dropout": 0.1,
  "lora_r": 8,
  "lora_target_modules": "all-linear",
  "model_type": "encoder_tuning_model",
  "train_encoder_stage1": false,
  "train_encoder_stage2": false,
  "transformers_version": "5.0.0"
}