S2ST-SubjectiveTest / samples.json
Mia11939's picture
swap models: drop seamless-medium/large, add stepaudio2-notrain (now 8 models per sample)
90675c1 verified
Raw
History Blame Contribute Delete
15.8 kB
{
"en2zh": {
"model_order": [
"qwen2.5-omni",
"kimi-audio",
"seamless-m4t-v2-large",
"uniss",
"stepaudio2-notrain",
"our-stage1-wocot",
"our-wostage2",
"our1"
],
"tokens": {
"qwen2.5-omni": "m8",
"kimi-audio": "m5",
"seamless-m4t-v2-large": "m1",
"uniss": "m7",
"stepaudio2-notrain": "m6",
"our-stage1-wocot": "m2",
"our-wostage2": "m4",
"our1": "m3"
},
"samples": [
{
"sample_idx": 1,
"id": "common_voice_zh-CN_18670722.mp3",
"source_text": "stationed in kakeromajima of amami islands",
"source_audio": "s1_en2zh_source.wav",
"models": {
"qwen2.5-omni": {
"text": "驻扎在奄美群岛的鹿儿岛。如果还有类似的翻译需求,欢迎随时告诉我哦。",
"audio": "s1_en2zh_m8.wav"
},
"kimi-audio": {
"text": "驻扎在奄美大岛",
"audio": "s1_en2zh_m5.wav"
},
"seamless-m4t-v2-large": {
"text": "站点在卡卡罗米吉马阿马米岛",
"audio": "s1_en2zh_m1.wav"
},
"uniss": {
"text": "驻扎在波科拉诺岛的卡卡罗米群岛。",
"audio": "s1_en2zh_m7.wav"
},
"stepaudio2-notrain": {
"text": "位于奄美群岛的卡卡拉梅吉马。",
"audio": "s1_en2zh_m6.wav"
},
"our-stage1-wocot": {
"text": "驻扎在奄美诸岛的嘉麻罗岛。",
"audio": "s1_en2zh_m2.wav"
},
"our-wostage2": {
"text": "驻扎在奄美群岛的加克罗马岛。",
"audio": "s1_en2zh_m4.wav"
},
"our1": {
"text": "驻扎在奄美群岛的嘉罗马岛上。",
"audio": "s1_en2zh_m3.wav"
}
}
},
{
"sample_idx": 2,
"id": "common_voice_zh-CN_18598178.mp3",
"source_text": "after the uprising of the five barbarians northern chinese rushed into wuyue region in mass",
"source_audio": "s2_en2zh_source.wav",
"models": {
"qwen2.5-omni": {
"text": "五胡乱华之后,北方汉人大量涌入关中地区。如果还有类似的翻译需求,你可以随时告诉我哦。",
"audio": "s2_en2zh_m8.wav"
},
"kimi-audio": {
"text": "在五胡乱华之后,北方的中国人大量涌入了河西走廊地区。",
"audio": "s2_en2zh_m5.wav"
},
"seamless-m4t-v2-large": {
"text": "在五个野蛮人起义后,北方中国人大规模冲进威威地区",
"audio": "s2_en2zh_m1.wav"
},
"uniss": {
"text": "五蛮族起义后,北方的中国人蜂拥而至涌入武夷地区。",
"audio": "s2_en2zh_m7.wav"
},
"stepaudio2-notrain": {
"text": "五胡乱华后,中国北方人蜂拥涌入吴越地区。",
"audio": "s2_en2zh_m6.wav"
},
"our-stage1-wocot": {
"text": "在五胡乱起之后,大量北方人涌入了吴越地区。",
"audio": "s2_en2zh_m2.wav"
},
"our-wostage2": {
"text": "五胡起义后,北方中国人大量涌入吴越地区。",
"audio": "s2_en2zh_m4.wav"
},
"our1": {
"text": "在五胡乱华之后,北方人大量涌入了吴越地区。",
"audio": "s2_en2zh_m3.wav"
}
}
},
{
"sample_idx": 3,
"id": "common_voice_zh-CN_18774434.mp3",
"source_text": "filipinos in singapore refer to filipino citizens living in singapore",
"source_audio": "s3_en2zh_source.wav",
"models": {
"qwen2.5-omni": {
"text": "新加坡的菲律宾人指的是居住在新加坡的菲律宾公民。如果还有类似的翻译需求,你可以随时告诉我哦。",
"audio": "s3_en2zh_m8.wav"
},
"kimi-audio": {
"text": "新加坡的菲律宾人,指的是居住在新加坡的菲律宾公民。",
"audio": "s3_en2zh_m5.wav"
},
"seamless-m4t-v2-large": {
"text": "菲律宾人和新加坡人,指的是菲律宾公民生活在新加坡",
"audio": "s3_en2zh_m1.wav"
},
"uniss": {
"text": "菲律宾人和新加坡人指的是居住在新加坡的菲律宾公民。",
"audio": "s3_en2zh_m7.wav"
},
"stepaudio2-notrain": {
"text": "新加坡的菲律宾人指的是住在新加坡的菲律宾公民。",
"audio": "s3_en2zh_m6.wav"
},
"our-stage1-wocot": {
"text": "新加坡的菲律宾人指的是住在新加坡的菲律宾公民。",
"audio": "s3_en2zh_m2.wav"
},
"our-wostage2": {
"text": "新加坡的菲律宾人指的是在新加坡的菲律宾公民。",
"audio": "s3_en2zh_m4.wav"
},
"our1": {
"text": "新加坡的菲律宾人指的是居住在新加坡的菲律宾公民。",
"audio": "s3_en2zh_m3.wav"
}
}
},
{
"sample_idx": 4,
"id": "common_voice_zh-CN_18715326.mp3",
"source_text": "henrique the fourth",
"source_audio": "s4_en2zh_source.wav",
"models": {
"qwen2.5-omni": {
"text": "亨利四世。如果还有其他翻译需求,随时告诉我哦。",
"audio": "s4_en2zh_m8.wav"
},
"kimi-audio": {
"text": "亨利四世",
"audio": "s4_en2zh_m5.wav"
},
"seamless-m4t-v2-large": {
"text": "亨利四世",
"audio": "s4_en2zh_m1.wav"
},
"uniss": {
"text": "亨利四世。",
"audio": "s4_en2zh_m7.wav"
},
"stepaudio2-notrain": {
"text": "亨利四世",
"audio": "s4_en2zh_m6.wav"
},
"our-stage1-wocot": {
"text": "亨利四世。",
"audio": "s4_en2zh_m2.wav"
},
"our-wostage2": {
"text": "亨利四世",
"audio": "s4_en2zh_m4.wav"
},
"our1": {
"text": "亨里克四世",
"audio": "s4_en2zh_m3.wav"
}
}
},
{
"sample_idx": 5,
"id": "common_voice_zh-CN_18977934.mp3",
"source_text": "clefmont",
"source_audio": "s5_en2zh_source.wav",
"models": {
"qwen2.5-omni": {
"text": "克莱蒙特。如果还有其他翻译需求,随时告诉我哦。",
"audio": "s5_en2zh_m8.wav"
},
"kimi-audio": {
"text": "对不起,我无法直接翻译音频内容。请提供音频的文本内容,我将很乐意帮助您翻译成中文。",
"audio": "s5_en2zh_m5.wav"
},
"seamless-m4t-v2-large": {
"text": "克莱蒙特",
"audio": "s5_en2zh_m1.wav"
},
"uniss": {
"text": "克莱蒙特。",
"audio": "s5_en2zh_m7.wav"
},
"stepaudio2-notrain": {
"text": "克莱蒙。",
"audio": "s5_en2zh_m6.wav"
},
"our-stage1-wocot": {
"text": "克莱蒙特。",
"audio": "s5_en2zh_m2.wav"
},
"our-wostage2": {
"text": "克莱蒙特",
"audio": "s5_en2zh_m4.wav"
},
"our1": {
"text": "克莱蒙",
"audio": "s5_en2zh_m3.wav"
}
}
}
]
},
"zh2en": {
"model_order": [
"qwen2.5-omni",
"kimi-audio",
"seamless-m4t-v2-large",
"uniss",
"stepaudio2-notrain",
"our-stage1-wocot",
"our-wostage2",
"our1"
],
"tokens": {
"qwen2.5-omni": "m5",
"kimi-audio": "m4",
"seamless-m4t-v2-large": "m2",
"uniss": "m7",
"stepaudio2-notrain": "m8",
"our-stage1-wocot": "m1",
"our-wostage2": "m6",
"our1": "m3"
},
"samples": [
{
"sample_idx": 1,
"id": "common_voice_zh-CN_18662485.mp3",
"source_text": "总部位于利雅得,在科威特、约旦和马来西亚有分行。",
"source_audio": "s1_zh2en_source.mp3",
"models": {
"qwen2.5-omni": {
"text": "The headquarters are in Riyadh. It has branches in Kuwait, Jordan and Malaysia.",
"audio": "s1_zh2en_m5.wav"
},
"kimi-audio": {
"text": "Headquartered in Riyadh, it has branches in Kuwait, Jordan, and Malaysia.",
"audio": "s1_zh2en_m4.wav"
},
"seamless-m4t-v2-large": {
"text": "Headquartered in Riyadh, it has branches in Kuwait, Vietnam and Malaysia.",
"audio": "s1_zh2en_m2.wav"
},
"uniss": {
"text": "the headquarter is located in leia and it also has branches in Kuwait jordan and malaysia",
"audio": "s1_zh2en_m7.wav"
},
"stepaudio2-notrain": {
"text": "Headquartered in Riyadh, branches are also found in Kuwait, Jordan and Malaysia.",
"audio": "s1_zh2en_m8.wav"
},
"our-stage1-wocot": {
"text": "Headquartered in Riyadh, it has branches in Kuwait, Jordan, and Malaysia.",
"audio": "s1_zh2en_m1.wav"
},
"our-wostage2": {
"text": "Headquarters are based in Riyadh and have branches in Kuwait, Jordan, and Malaysia.",
"audio": "s1_zh2en_m6.wav"
},
"our1": {
"text": "headquartered in riyadh it has branches in kuwait jordan and malaysia",
"audio": "s1_zh2en_m3.wav"
}
}
},
{
"sample_idx": 2,
"id": "common_voice_zh-CN_18978243.mp3",
"source_text": "电子浩室是浩室音乐的一个类型。",
"source_audio": "s2_zh2en_source.mp3",
"models": {
"qwen2.5-omni": {
"text": "Electronic post - 44 - 44 music is a type of music.",
"audio": "s2_zh2en_m5.wav"
},
"kimi-audio": {
"text": "Electronic house is a type of house music.",
"audio": "s2_zh2en_m4.wav"
},
"seamless-m4t-v2-large": {
"text": "Electronic noise is a type of noise music.",
"audio": "s2_zh2en_m2.wav"
},
"uniss": {
"text": "electronic浩室is a type of music in the浩室",
"audio": "s2_zh2en_m7.wav"
},
"stepaudio2-notrain": {
"text": "Electronic Heisei is a type of Heisei music.",
"audio": "s2_zh2en_m8.wav"
},
"our-stage1-wocot": {
"text": "Electronic house music is a type of house music.",
"audio": "s2_zh2en_m1.wav"
},
"our-wostage2": {
"text": "So, electronic house is just one type of house music.",
"audio": "s2_zh2en_m6.wav"
},
"our1": {
"text": "electronic house is a type of house music",
"audio": "s2_zh2en_m3.wav"
}
}
},
{
"sample_idx": 3,
"id": "common_voice_zh-CN_18664928.mp3",
"source_text": "纳什梅德是位于美国加利福尼亚州门多西诺县的一个非建制地区。",
"source_audio": "s3_zh2en_source.mp3",
"models": {
"qwen2.5-omni": {
"text": "Nashmead is an unincorporated community in Mendocino County, California, USA.",
"audio": "s3_zh2en_m5.wav"
},
"kimi-audio": {
"text": "纳什梅德是位于美国加利福尼亚州门多西诺县的一个非建制地区。",
"audio": "s3_zh2en_m4.wav"
},
"seamless-m4t-v2-large": {
"text": "Nashville is an unincorporated area located in Mendocino County, California, USA.",
"audio": "s3_zh2en_m2.wav"
},
"uniss": {
"text": "Nash Meade is an unincorporated community located in Mendocino County, California, United States.",
"audio": "s3_zh2en_m7.wav"
},
"stepaudio2-notrain": {
"text": "Nashmeid is an unincorporated area in Mendocino County, California, USA.",
"audio": "s3_zh2en_m8.wav"
},
"our-stage1-wocot": {
"text": "Nashmed is an unincorporated community situated in Mendocino County, located in the United States of America.",
"audio": "s3_zh2en_m1.wav"
},
"our-wostage2": {
"text": "Nashmead is an unincorporated area in Mendocino County, California, USA.",
"audio": "s3_zh2en_m6.wav"
},
"our1": {
"text": "nashmead is an unincorporated community in mendocino county california united states",
"audio": "s3_zh2en_m3.wav"
}
}
},
{
"sample_idx": 4,
"id": "common_voice_zh-CN_18979384.mp3",
"source_text": "出身于高知县。",
"source_audio": "s4_zh2en_source.mp3",
"models": {
"qwen2.5-omni": {
"text": "Born in Kochi Prefecture.",
"audio": "s4_zh2en_m5.wav"
},
"kimi-audio": {
"text": "Chushengyigao Zixian.",
"audio": "s4_zh2en_m4.wav"
},
"seamless-m4t-v2-large": {
"text": "Born in Kaohsiung County.",
"audio": "s4_zh2en_m2.wav"
},
"uniss": {
"text": "born in kochi county",
"audio": "s4_zh2en_m7.wav"
},
"stepaudio2-notrain": {
"text": "Born in Kōchi Prefecture.",
"audio": "s4_zh2en_m8.wav"
},
"our-stage1-wocot": {
"text": "Born in the city of Takahama Prefecture.",
"audio": "s4_zh2en_m1.wav"
},
"our-wostage2": {
"text": "Born in Kochi Prefecture.",
"audio": "s4_zh2en_m6.wav"
},
"our1": {
"text": "born in kochi prefecture",
"audio": "s4_zh2en_m3.wav"
}
}
},
{
"sample_idx": 5,
"id": "common_voice_zh-CN_18669987.mp3",
"source_text": "湖岛可以指:",
"source_audio": "s5_zh2en_source.mp3",
"models": {
"qwen2.5-omni": {
"text": "Fudao can refer to.",
"audio": "s5_zh2en_m5.wav"
},
"kimi-audio": {
"text": "Huda can refer to:",
"audio": "s5_zh2en_m4.wav"
},
"seamless-m4t-v2-large": {
"text": "Lake Island can refer to:",
"audio": "s5_zh2en_m2.wav"
},
"uniss": {
"text": "hu island can refer to",
"audio": "s5_zh2en_m7.wav"
},
"stepaudio2-notrain": {
"text": "Hu Island could refer to:",
"audio": "s5_zh2en_m8.wav"
},
"our-stage1-wocot": {
"text": "The term 'Lake Island' can denote.",
"audio": "s5_zh2en_m1.wav"
},
"our-wostage2": {
"text": "Hu Island could mean several things.",
"audio": "s5_zh2en_m6.wav"
},
"our1": {
"text": "lake island may refer to",
"audio": "s5_zh2en_m3.wav"
}
}
}
]
}
}