{ "whisper_model": "openai/whisper-small", "xcodec_model": "HKUSTAudio/xcodec2", "whisper_dim": 768, "hidden_size": 2048, "u_start_id": 128262, "u_end_id": 128263, "g_start_id": 128260, "g_end_id": 128261, "pad_id": 128009, "instruction_prefix": "Convert ", "instruction_middle": " into speech using this speaker: " }