---
# Pipeline configuration: model selection, runtime options, and evaluators.
# NOTE(review): the per-key notes below are inferred from key names and
# values only; confirm each against the code that loads this file.

# Model identifiers (presumably ASR = speech recognition, LLM = language
# model, SVS = singing voice synthesis -- TODO confirm with the consumer).
asr_model: openai/whisper-medium
llm_model: gemini-2.5-flash
svs_model: espnet/aceopencpop_svs_visinger2_40singer_pretrain

# Generation settings.
melody_source: sample-lyric-kising
language: mandarin
character: Limei

# Runtime options. `.cache` looks like a relative path -- verify which
# directory the consumer resolves it against.
cache_dir: .cache
track_latency: true

# Evaluators, grouped by the component they apply to.
evaluators:
  svs:
    - singmos
    - per
    - melody
    - aesthetic