{
  "audio_llama_proj_model": "",
  "beats_cfg": {
    "activation_dropout": 0.0,
    "activation_fn": "gelu",
    "attention_dropout": 0.0,
    "conv_bias": false,
    "conv_pos": 128,
    "conv_pos_groups": 16,
    "deep_norm": true,
    "dropout": 0.0,
    "dropout_input": 0.0,
    "embed_dim": 512,
    "encoder_attention_heads": 12,
    "encoder_embed_dim": 768,
    "encoder_ffn_embed_dim": 3072,
    "encoder_layerdrop": 0.05,
    "encoder_layers": 12,
    "finetuned_model": true,
    "gru_rel_pos": true,
    "input_patch_size": 16,
    "layer_norm_first": false,
    "layer_wise_gradient_decay_ratio": 0.6,
    "max_distance": 800,
    "num_buckets": 320,
    "predictor_class": 527,
    "predictor_dropout": 0.0,
    "relative_position_embedding": true
  },
  "downsample_factor": 8,
  "end_sym": "<|end_of_text|>",
  "freeze_audio_QFormer": false,
  "freeze_audio_llama_proj": false,
  "freeze_beats": true,
  "llama_path": "meta-llama/Meta-Llama-3.1-8B-Instruct",
  "lora": true,
  "lora_alpha": 32,
  "lora_dropout": 0.1,
  "lora_rank": 32,
  "max_pooling": false,
  "max_txt_len": 160,
  "num_audio_query_token": 1,
  "prompt_template": "<|start_header_id|>user<|end_header_id|>\n\n{}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n",
  "second_per_window": 0.333333,
  "second_stride": 0.333333,
  "use_audio_Qformer": true,
  "window_level_Qformer": true
}