File size: 726 Bytes
a96a421 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 |
{
"audio_encoder": {
"embed_dim_audio": 1024,
"joint_dim": 512,
"audio_cfg": {
"audio_length": 1024,
"clip_samples": 480000,
"mel_bins": 64,
"sample_rate": 48000,
"window_size": 1024,
"hop_size": 480,
"fmin": 50,
"fmax": 14000,
"class_num": 527,
"model_type": "HTSAT",
"model_name": "base"
}
},
"LLM": {
"t5_model": "google/flan-t5-xl",
"repetition_penalty": 10.0
},
"num_query_tokens": 16,
"embed_dim": 256,
"max_txt_len": 120,
"prompt": "Caption this data:",
"apply_lemmatizer": false,
"atRandom": true
} |