Spaces:
Running
Running
Anonymous committed on
Commit ·
a4e61d9
1
Parent(s): f69c8ff
Adjust demo layout and restore contexts
Browse files- index.html +15 -11
- static/css/index.css +26 -1
- static/task/emo/CosyVoice3/manifest.jsonl +18 -18
- static/task/emo/IndexTTS2/manifest.jsonl +18 -18
- static/task/emo/MiMo-V2.5/manifest.jsonl +18 -18
- static/task/emo/Ours/manifest.jsonl +18 -18
- static/task/emo/Qwen3/manifest.jsonl +18 -18
- static/task/punct/MiMo-V2.5/manifest.jsonl +13 -13
- static/task/punct/Ours/manifest.jsonl +13 -13
- static/task/punct/SoulX-Podcast/manifest.jsonl +13 -13
index.html
CHANGED
|
@@ -34,14 +34,18 @@
|
|
| 34 |
<p>PromptDialog task demos.</p>
|
| 35 |
</div>
|
| 36 |
|
| 37 |
-
<
|
| 38 |
-
<
|
| 39 |
-
|
| 40 |
-
|
| 41 |
-
|
| 42 |
-
|
| 43 |
-
<
|
| 44 |
</div>
|
|
|
|
|
|
|
|
|
|
|
|
|
| 45 |
</div>
|
| 46 |
</div>
|
| 47 |
</section>
|
|
@@ -128,10 +132,10 @@
|
|
| 128 |
target.innerHTML = formatScriptText(item.target_text, highlightParalinguistic);
|
| 129 |
wrapper.appendChild(target);
|
| 130 |
|
| 131 |
-
item.variants.forEach((variant) => {
|
| 132 |
const context = document.createElement("p");
|
| 133 |
context.className = "variant-context";
|
| 134 |
-
context.innerHTML = `<strong>${
|
| 135 |
wrapper.appendChild(context);
|
| 136 |
});
|
| 137 |
|
|
@@ -214,12 +218,12 @@
|
|
| 214 |
return wrapper;
|
| 215 |
}
|
| 216 |
|
| 217 |
-
modelItem.variants.forEach((variant) => {
|
| 218 |
const row = document.createElement("div");
|
| 219 |
row.className = "variant-audio-row";
|
| 220 |
|
| 221 |
const label = document.createElement("span");
|
| 222 |
-
label.textContent =
|
| 223 |
|
| 224 |
row.appendChild(label);
|
| 225 |
row.appendChild(createAudio(`${taskRoot}/${model}/${variant.output_audio}`));
|
|
|
|
| 34 |
<p>PromptDialog task demos.</p>
|
| 35 |
</div>
|
| 36 |
|
| 37 |
+
<div class="demo-layout">
|
| 38 |
+
<div class="demo-main">
|
| 39 |
+
<div class="task-list" id="task-list" aria-live="polite">
|
| 40 |
+
<div class="task-card">
|
| 41 |
+
<p class="loading">Loading audio demos...</p>
|
| 42 |
+
</div>
|
| 43 |
+
</div>
|
| 44 |
</div>
|
| 45 |
+
|
| 46 |
+
<nav class="task-directory" id="task-directory" aria-label="Audio demo tasks">
|
| 47 |
+
<p class="loading">Loading task directory...</p>
|
| 48 |
+
</nav>
|
| 49 |
</div>
|
| 50 |
</div>
|
| 51 |
</section>
|
|
|
|
| 132 |
target.innerHTML = formatScriptText(item.target_text, highlightParalinguistic);
|
| 133 |
wrapper.appendChild(target);
|
| 134 |
|
| 135 |
+
item.variants.forEach((variant, index) => {
|
| 136 |
const context = document.createElement("p");
|
| 137 |
context.className = "variant-context";
|
| 138 |
+
context.innerHTML = `<strong>instruction${index + 1}</strong> <span class="context-cue">${escapeHtml(variant.context)}</span>`;
|
| 139 |
wrapper.appendChild(context);
|
| 140 |
});
|
| 141 |
|
|
|
|
| 218 |
return wrapper;
|
| 219 |
}
|
| 220 |
|
| 221 |
+
modelItem.variants.forEach((variant, index) => {
|
| 222 |
const row = document.createElement("div");
|
| 223 |
row.className = "variant-audio-row";
|
| 224 |
|
| 225 |
const label = document.createElement("span");
|
| 226 |
+
label.textContent = `instruction${index + 1}`;
|
| 227 |
|
| 228 |
row.appendChild(label);
|
| 229 |
row.appendChild(createAudio(`${taskRoot}/${model}/${variant.output_audio}`));
|
static/css/index.css
CHANGED
|
@@ -101,15 +101,28 @@ body {
|
|
| 101 |
line-height: 1.55;
|
| 102 |
}
|
| 103 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 104 |
.task-directory {
|
| 105 |
display: grid;
|
| 106 |
grid-template-columns: 8rem minmax(0, 1fr);
|
| 107 |
gap: 0.9rem;
|
| 108 |
align-items: start;
|
| 109 |
-
margin: 0
|
| 110 |
border: 1px solid var(--line);
|
| 111 |
background: var(--soft);
|
| 112 |
padding: 0.9rem;
|
|
|
|
|
|
|
| 113 |
}
|
| 114 |
|
| 115 |
.task-directory-title {
|
|
@@ -149,6 +162,9 @@ body {
|
|
| 149 |
border-bottom: 1px solid var(--line);
|
| 150 |
background: var(--soft);
|
| 151 |
padding: 1rem 1.15rem;
|
|
|
|
|
|
|
|
|
|
| 152 |
}
|
| 153 |
|
| 154 |
.task-card-heading h3 {
|
|
@@ -301,11 +317,20 @@ audio {
|
|
| 301 |
width: min(100% - 1rem, 1640px);
|
| 302 |
}
|
| 303 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 304 |
.task-directory {
|
| 305 |
grid-template-columns: 1fr;
|
|
|
|
| 306 |
}
|
| 307 |
|
| 308 |
.audio-grid {
|
| 309 |
grid-template-columns: repeat(2, minmax(0, 1fr));
|
| 310 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
| 311 |
}
|
|
|
|
| 101 |
line-height: 1.55;
|
| 102 |
}
|
| 103 |
|
| 104 |
+
.demo-layout {
|
| 105 |
+
display: grid;
|
| 106 |
+
grid-template-columns: minmax(0, 1fr) 17rem;
|
| 107 |
+
gap: 1.5rem;
|
| 108 |
+
align-items: start;
|
| 109 |
+
}
|
| 110 |
+
|
| 111 |
+
.demo-main {
|
| 112 |
+
min-width: 0;
|
| 113 |
+
}
|
| 114 |
+
|
| 115 |
.task-directory {
|
| 116 |
display: grid;
|
| 117 |
grid-template-columns: 8rem minmax(0, 1fr);
|
| 118 |
gap: 0.9rem;
|
| 119 |
align-items: start;
|
| 120 |
+
margin: 0;
|
| 121 |
border: 1px solid var(--line);
|
| 122 |
background: var(--soft);
|
| 123 |
padding: 0.9rem;
|
| 124 |
+
position: sticky;
|
| 125 |
+
top: 1rem;
|
| 126 |
}
|
| 127 |
|
| 128 |
.task-directory-title {
|
|
|
|
| 162 |
border-bottom: 1px solid var(--line);
|
| 163 |
background: var(--soft);
|
| 164 |
padding: 1rem 1.15rem;
|
| 165 |
+
position: sticky;
|
| 166 |
+
top: 0;
|
| 167 |
+
z-index: 5;
|
| 168 |
}
|
| 169 |
|
| 170 |
.task-card-heading h3 {
|
|
|
|
| 317 |
width: min(100% - 1rem, 1640px);
|
| 318 |
}
|
| 319 |
|
| 320 |
+
.demo-layout {
|
| 321 |
+
grid-template-columns: 1fr;
|
| 322 |
+
}
|
| 323 |
+
|
| 324 |
.task-directory {
|
| 325 |
grid-template-columns: 1fr;
|
| 326 |
+
position: static;
|
| 327 |
}
|
| 328 |
|
| 329 |
.audio-grid {
|
| 330 |
grid-template-columns: repeat(2, minmax(0, 1fr));
|
| 331 |
}
|
| 332 |
+
|
| 333 |
+
.task-card-heading {
|
| 334 |
+
position: static;
|
| 335 |
+
}
|
| 336 |
}
|
static/task/emo/CosyVoice3/manifest.jsonl
CHANGED
|
@@ -1,18 +1,18 @@
|
|
| 1 |
-
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "", "output_audio": "sample/utt_0001_fear.wav"}
|
| 2 |
-
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "", "output_audio": "sample/utt_0002_nervous.wav"}
|
| 3 |
-
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "", "output_audio": "sample/utt_0003_tired.wav"}
|
| 4 |
-
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "", "output_audio": "sample/utt_0004_peaceful.wav"}
|
| 5 |
-
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "", "output_audio": "sample/utt_0005_enthusiastic.wav"}
|
| 6 |
-
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "", "output_audio": "sample/utt_0006_proud.wav"}
|
| 7 |
-
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "", "output_audio": "sample/utt_0007_happy.wav"}
|
| 8 |
-
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "", "output_audio": "sample/utt_0008_confused.wav"}
|
| 9 |
-
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "", "output_audio": "sample/utt_0009_surprise.wav"}
|
| 10 |
-
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "", "output_audio": "sample/utt_0010_worried.wav"}
|
| 11 |
-
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "", "output_audio": "sample/utt_0011_sadness.wav"}
|
| 12 |
-
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "", "output_audio": "sample/utt_0012_frustration.wav"}
|
| 13 |
-
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "", "output_audio": "sample/utt_0013_shameful.wav"}
|
| 14 |
-
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "", "output_audio": "sample/utt_0014_disappointed.wav"}
|
| 15 |
-
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "", "output_audio": "sample/utt_0015_anger.wav"}
|
| 16 |
-
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "", "output_audio": "sample/utt_0016_disgust.wav"}
|
| 17 |
-
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "", "output_audio": "sample/utt_0017_contempt.wav"}
|
| 18 |
-
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "", "output_audio": "sample/utt_0018_pity.wav"}
|
|
|
|
| 1 |
+
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "", "output_audio": "sample/utt_0001_fear.wav", "context": "害怕"}
|
| 2 |
+
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "", "output_audio": "sample/utt_0002_nervous.wav", "context": "紧张"}
|
| 3 |
+
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "", "output_audio": "sample/utt_0003_tired.wav", "context": "疲惫"}
|
| 4 |
+
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "", "output_audio": "sample/utt_0004_peaceful.wav", "context": "平静"}
|
| 5 |
+
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "", "output_audio": "sample/utt_0005_enthusiastic.wav", "context": "热情"}
|
| 6 |
+
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "", "output_audio": "sample/utt_0006_proud.wav", "context": "自信"}
|
| 7 |
+
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "", "output_audio": "sample/utt_0007_happy.wav", "context": "开心"}
|
| 8 |
+
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "", "output_audio": "sample/utt_0008_confused.wav", "context": "困惑"}
|
| 9 |
+
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "", "output_audio": "sample/utt_0009_surprise.wav", "context": "惊讶"}
|
| 10 |
+
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "", "output_audio": "sample/utt_0010_worried.wav", "context": "担忧"}
|
| 11 |
+
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "", "output_audio": "sample/utt_0011_sadness.wav", "context": "悲伤"}
|
| 12 |
+
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "", "output_audio": "sample/utt_0012_frustration.wav", "context": "沮丧"}
|
| 13 |
+
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "", "output_audio": "sample/utt_0013_shameful.wav", "context": "害羞"}
|
| 14 |
+
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "", "output_audio": "sample/utt_0014_disappointed.wav", "context": "失望"}
|
| 15 |
+
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "", "output_audio": "sample/utt_0015_anger.wav", "context": "愤怒"}
|
| 16 |
+
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "", "output_audio": "sample/utt_0016_disgust.wav", "context": "不快"}
|
| 17 |
+
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "", "output_audio": "sample/utt_0017_contempt.wav", "context": "鄙视"}
|
| 18 |
+
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "", "output_audio": "sample/utt_0018_pity.wav", "context": "同情"}
|
static/task/emo/IndexTTS2/manifest.jsonl
CHANGED
|
@@ -1,18 +1,18 @@
|
|
| 1 |
-
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "", "output_audio": "sample/utt_0001_fear.wav"}
|
| 2 |
-
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "", "output_audio": "sample/utt_0002_nervous.wav"}
|
| 3 |
-
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "", "output_audio": "sample/utt_0003_tired.wav"}
|
| 4 |
-
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "", "output_audio": "sample/utt_0004_peaceful.wav"}
|
| 5 |
-
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "", "output_audio": "sample/utt_0005_enthusiastic.wav"}
|
| 6 |
-
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "", "output_audio": "sample/utt_0006_proud.wav"}
|
| 7 |
-
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "", "output_audio": "sample/utt_0007_happy.wav"}
|
| 8 |
-
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "", "output_audio": "sample/utt_0008_confused.wav"}
|
| 9 |
-
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "", "output_audio": "sample/utt_0009_surprise.wav"}
|
| 10 |
-
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "", "output_audio": "sample/utt_0010_worried.wav"}
|
| 11 |
-
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "", "output_audio": "sample/utt_0011_sadness.wav"}
|
| 12 |
-
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "", "output_audio": "sample/utt_0012_frustration.wav"}
|
| 13 |
-
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "", "output_audio": "sample/utt_0013_shameful.wav"}
|
| 14 |
-
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "", "output_audio": "sample/utt_0014_disappointed.wav"}
|
| 15 |
-
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "", "output_audio": "sample/utt_0015_anger.wav"}
|
| 16 |
-
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "", "output_audio": "sample/utt_0016_disgust.wav"}
|
| 17 |
-
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "", "output_audio": "sample/utt_0017_contempt.wav"}
|
| 18 |
-
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "", "output_audio": "sample/utt_0018_pity.wav"}
|
|
|
|
| 1 |
+
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "", "output_audio": "sample/utt_0001_fear.wav", "context": "害怕"}
|
| 2 |
+
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "", "output_audio": "sample/utt_0002_nervous.wav", "context": "紧张"}
|
| 3 |
+
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "", "output_audio": "sample/utt_0003_tired.wav", "context": "疲惫"}
|
| 4 |
+
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "", "output_audio": "sample/utt_0004_peaceful.wav", "context": "平静"}
|
| 5 |
+
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "", "output_audio": "sample/utt_0005_enthusiastic.wav", "context": "热情"}
|
| 6 |
+
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "", "output_audio": "sample/utt_0006_proud.wav", "context": "自信"}
|
| 7 |
+
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "", "output_audio": "sample/utt_0007_happy.wav", "context": "开心"}
|
| 8 |
+
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "", "output_audio": "sample/utt_0008_confused.wav", "context": "困惑"}
|
| 9 |
+
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "", "output_audio": "sample/utt_0009_surprise.wav", "context": "惊讶"}
|
| 10 |
+
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "", "output_audio": "sample/utt_0010_worried.wav", "context": "担忧"}
|
| 11 |
+
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "", "output_audio": "sample/utt_0011_sadness.wav", "context": "悲伤"}
|
| 12 |
+
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "", "output_audio": "sample/utt_0012_frustration.wav", "context": "沮丧"}
|
| 13 |
+
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "", "output_audio": "sample/utt_0013_shameful.wav", "context": "害羞"}
|
| 14 |
+
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "", "output_audio": "sample/utt_0014_disappointed.wav", "context": "失望"}
|
| 15 |
+
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "", "output_audio": "sample/utt_0015_anger.wav", "context": "愤怒"}
|
| 16 |
+
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "", "output_audio": "sample/utt_0016_disgust.wav", "context": "不快"}
|
| 17 |
+
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "", "output_audio": "sample/utt_0017_contempt.wav", "context": "鄙视"}
|
| 18 |
+
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "", "output_audio": "sample/utt_0018_pity.wav", "context": "同情"}
|
static/task/emo/MiMo-V2.5/manifest.jsonl
CHANGED
|
@@ -1,18 +1,18 @@
|
|
| 1 |
-
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "白桦", "output_audio": "samples/utt_0001_fear.wav"}
|
| 2 |
-
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "冰糖", "output_audio": "samples/utt_0002_nervous.wav"}
|
| 3 |
-
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "白桦", "output_audio": "samples/utt_0003_tired.wav"}
|
| 4 |
-
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "冰糖", "output_audio": "samples/utt_0004_peaceful.wav"}
|
| 5 |
-
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "苏打", "output_audio": "samples/utt_0005_enthusiastic.wav"}
|
| 6 |
-
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "白桦", "output_audio": "samples/utt_0006_proud.wav"}
|
| 7 |
-
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "茉莉", "output_audio": "samples/utt_0007_happy.wav"}
|
| 8 |
-
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "白桦", "output_audio": "samples/utt_0008_confused.wav"}
|
| 9 |
-
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "冰糖", "output_audio": "samples/utt_0009_surprise.wav"}
|
| 10 |
-
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "苏打", "output_audio": "samples/utt_0010_worried.wav"}
|
| 11 |
-
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "茉莉", "output_audio": "samples/utt_0011_sadness.wav"}
|
| 12 |
-
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "冰糖", "output_audio": "samples/utt_0012_frustration.wav"}
|
| 13 |
-
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "冰糖", "output_audio": "samples/utt_0013_shameful.wav"}
|
| 14 |
-
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "苏打", "output_audio": "samples/utt_0014_disappointed.wav"}
|
| 15 |
-
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "白桦", "output_audio": "samples/utt_0015_anger.wav"}
|
| 16 |
-
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "冰糖", "output_audio": "samples/utt_0016_disgust.wav"}
|
| 17 |
-
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "白桦", "output_audio": "samples/utt_0017_contempt.wav"}
|
| 18 |
-
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "苏打", "output_audio": "samples/utt_0018_pity.wav"}
|
|
|
|
| 1 |
+
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "白桦", "output_audio": "samples/utt_0001_fear.wav", "context": "害怕"}
|
| 2 |
+
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "冰糖", "output_audio": "samples/utt_0002_nervous.wav", "context": "紧张"}
|
| 3 |
+
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "白桦", "output_audio": "samples/utt_0003_tired.wav", "context": "疲惫"}
|
| 4 |
+
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "冰糖", "output_audio": "samples/utt_0004_peaceful.wav", "context": "平静"}
|
| 5 |
+
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "苏打", "output_audio": "samples/utt_0005_enthusiastic.wav", "context": "热情"}
|
| 6 |
+
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "白桦", "output_audio": "samples/utt_0006_proud.wav", "context": "自信"}
|
| 7 |
+
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "茉莉", "output_audio": "samples/utt_0007_happy.wav", "context": "开心"}
|
| 8 |
+
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "白桦", "output_audio": "samples/utt_0008_confused.wav", "context": "困惑"}
|
| 9 |
+
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "冰糖", "output_audio": "samples/utt_0009_surprise.wav", "context": "惊讶"}
|
| 10 |
+
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "苏打", "output_audio": "samples/utt_0010_worried.wav", "context": "担忧"}
|
| 11 |
+
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "茉莉", "output_audio": "samples/utt_0011_sadness.wav", "context": "悲伤"}
|
| 12 |
+
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "冰糖", "output_audio": "samples/utt_0012_frustration.wav", "context": "沮丧"}
|
| 13 |
+
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "冰糖", "output_audio": "samples/utt_0013_shameful.wav", "context": "害羞"}
|
| 14 |
+
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "苏打", "output_audio": "samples/utt_0014_disappointed.wav", "context": "失望"}
|
| 15 |
+
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "白桦", "output_audio": "samples/utt_0015_anger.wav", "context": "愤怒"}
|
| 16 |
+
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "冰糖", "output_audio": "samples/utt_0016_disgust.wav", "context": "不快"}
|
| 17 |
+
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "白桦", "output_audio": "samples/utt_0017_contempt.wav", "context": "鄙视"}
|
| 18 |
+
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "苏打", "output_audio": "samples/utt_0018_pity.wav", "context": "同情"}
|
static/task/emo/Ours/manifest.jsonl
CHANGED
|
@@ -1,18 +1,18 @@
|
|
| 1 |
-
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "", "output_audio": "samples/utt_0001_fear.wav"}
|
| 2 |
-
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "", "output_audio": "samples/utt_0002_nervous.wav"}
|
| 3 |
-
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "", "output_audio": "samples/utt_0003_tired.wav"}
|
| 4 |
-
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "", "output_audio": "samples/utt_0004_peaceful.wav"}
|
| 5 |
-
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "", "output_audio": "samples/utt_0005_enthusiastic.wav"}
|
| 6 |
-
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "", "output_audio": "samples/utt_0006_proud.wav"}
|
| 7 |
-
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "", "output_audio": "samples/utt_0007_happy.wav"}
|
| 8 |
-
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "", "output_audio": "samples/utt_0008_confused.wav"}
|
| 9 |
-
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "", "output_audio": "samples/utt_0009_surprise.wav"}
|
| 10 |
-
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "", "output_audio": "samples/utt_0010_worried.wav"}
|
| 11 |
-
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "", "output_audio": "samples/utt_0011_sadness.wav"}
|
| 12 |
-
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "", "output_audio": "samples/utt_0012_frustration.wav"}
|
| 13 |
-
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "", "output_audio": "samples/utt_0013_shameful.wav"}
|
| 14 |
-
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "", "output_audio": "samples/utt_0014_disappointed.wav"}
|
| 15 |
-
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "", "output_audio": "samples/utt_0015_anger.wav"}
|
| 16 |
-
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "", "output_audio": "samples/utt_0016_disgust.wav"}
|
| 17 |
-
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "", "output_audio": "samples/utt_0017_contempt.wav"}
|
| 18 |
-
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "", "output_audio": "samples/utt_0018_pity.wav"}
|
|
|
|
| 1 |
+
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "", "output_audio": "samples/utt_0001_fear.wav", "context": "害怕"}
|
| 2 |
+
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "", "output_audio": "samples/utt_0002_nervous.wav", "context": "紧张"}
|
| 3 |
+
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "", "output_audio": "samples/utt_0003_tired.wav", "context": "疲惫"}
|
| 4 |
+
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "", "output_audio": "samples/utt_0004_peaceful.wav", "context": "平静"}
|
| 5 |
+
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "", "output_audio": "samples/utt_0005_enthusiastic.wav", "context": "热情"}
|
| 6 |
+
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "", "output_audio": "samples/utt_0006_proud.wav", "context": "自信"}
|
| 7 |
+
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "", "output_audio": "samples/utt_0007_happy.wav", "context": "开心"}
|
| 8 |
+
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "", "output_audio": "samples/utt_0008_confused.wav", "context": "困惑"}
|
| 9 |
+
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "", "output_audio": "samples/utt_0009_surprise.wav", "context": "惊讶"}
|
| 10 |
+
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "", "output_audio": "samples/utt_0010_worried.wav", "context": "担忧"}
|
| 11 |
+
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "", "output_audio": "samples/utt_0011_sadness.wav", "context": "悲伤"}
|
| 12 |
+
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "", "output_audio": "samples/utt_0012_frustration.wav", "context": "沮丧"}
|
| 13 |
+
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "", "output_audio": "samples/utt_0013_shameful.wav", "context": "害羞"}
|
| 14 |
+
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "", "output_audio": "samples/utt_0014_disappointed.wav", "context": "失望"}
|
| 15 |
+
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "", "output_audio": "samples/utt_0015_anger.wav", "context": "愤怒"}
|
| 16 |
+
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "", "output_audio": "samples/utt_0016_disgust.wav", "context": "不快"}
|
| 17 |
+
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "", "output_audio": "samples/utt_0017_contempt.wav", "context": "鄙视"}
|
| 18 |
+
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "", "output_audio": "samples/utt_0018_pity.wav", "context": "同情"}
|
static/task/emo/Qwen3/manifest.jsonl
CHANGED
|
@@ -1,18 +1,18 @@
|
|
| 1 |
-
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "Serena", "output_audio": "samples/utt_0001_fear.wav"}
|
| 2 |
-
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "Maia", "output_audio": "samples/utt_0002_nervous.wav"}
|
| 3 |
-
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "Momo", "output_audio": "samples/utt_0003_tired.wav"}
|
| 4 |
-
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "Chelsie", "output_audio": "samples/utt_0004_peaceful.wav"}
|
| 5 |
-
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "Momo", "output_audio": "samples/utt_0005_enthusiastic.wav"}
|
| 6 |
-
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "Momo", "output_audio": "samples/utt_0006_proud.wav"}
|
| 7 |
-
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "Moon", "output_audio": "samples/utt_0007_happy.wav"}
|
| 8 |
-
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "Kai", "output_audio": "samples/utt_0008_confused.wav"}
|
| 9 |
-
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "Cherry", "output_audio": "samples/utt_0009_surprise.wav"}
|
| 10 |
-
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "Maia", "output_audio": "samples/utt_0010_worried.wav"}
|
| 11 |
-
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "Moon", "output_audio": "samples/utt_0011_sadness.wav"}
|
| 12 |
-
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "Kai", "output_audio": "samples/utt_0012_frustration.wav"}
|
| 13 |
-
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "Maia", "output_audio": "samples/utt_0013_shameful.wav"}
|
| 14 |
-
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "Serena", "output_audio": "samples/utt_0014_disappointed.wav"}
|
| 15 |
-
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "Nofish", "output_audio": "samples/utt_0015_anger.wav"}
|
| 16 |
-
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "Momo", "output_audio": "samples/utt_0016_disgust.wav"}
|
| 17 |
-
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "Nofish", "output_audio": "samples/utt_0017_contempt.wav"}
|
| 18 |
-
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "Ethan", "output_audio": "samples/utt_0018_pity.wav"}
|
|
|
|
| 1 |
+
{"utt": "utt_0001_fear", "target_text": "别、别过来……我们可以好好说,求你了,我真的没做什么,别靠近我,好吗?", "speaker": "Serena", "output_audio": "samples/utt_0001_fear.wav", "context": "害怕"}
|
| 2 |
+
{"utt": "utt_0002_nervous", "target_text": "我……我不是想拖延,我只是——能不能再给我一点时间?我怕说错话……真的,我现在脑子有点乱,手也在抖。", "speaker": "Maia", "output_audio": "samples/utt_0002_nervous.wav", "context": "紧张"}
|
| 3 |
+
{"utt": "utt_0003_tired", "target_text": "先别催了,给我两分钟喘口气……唉,昨晚基本没睡,脑子像糊住了。让我坐一下,喝口水,等我缓过来再说行吗?", "speaker": "Momo", "output_audio": "samples/utt_0003_tired.wav", "context": "疲惫"}
|
| 4 |
+
{"utt": "utt_0004_peaceful", "target_text": "嗯,别急,我们就按自己的步子来。先坐一会儿,喝口温水——现在这样就挺好。", "speaker": "Chelsie", "output_audio": "samples/utt_0004_peaceful.wav", "context": "平静"}
|
| 5 |
+
{"utt": "utt_0005_enthusiastic", "target_text": "太给力了!就按这个来!我现在就去把人叫上、把材料备好,你把时间敲定——十分钟后咱们直接开干!", "speaker": "Momo", "output_audio": "samples/utt_0005_enthusiastic.wav", "context": "热情"}
|
| 6 |
+
{"utt": "utt_0006_proud", "target_text": "这块交给我吧,我已经把方案推了三遍,坑都踩过了。你只管等结果,今晚给你一个漂亮的答复——放心,看我的。", "speaker": "Momo", "output_audio": "samples/utt_0006_proud.wav", "context": "自信"}
|
| 7 |
+
{"utt": "utt_0007_happy", "target_text": "太好了!我就说肯定没问题的!走走走,今晚我请客,必须好好庆祝一下!", "speaker": "Moon", "output_audio": "samples/utt_0007_happy.wav", "context": "开心"}
|
| 8 |
+
{"utt": "utt_0008_confused", "target_text": "等一下,我有点没听明白……你说的‘那个’是现在要做,还是等会儿?为啥跟我理解的不太一样啊?", "speaker": "Kai", "output_audio": "samples/utt_0008_confused.wav", "context": "困惑"}
|
| 9 |
+
{"utt": "utt_0009_surprise", "target_text": "等、等等,这是真的?你别逗我——我刚才没看错吧?!", "speaker": "Cherry", "output_audio": "samples/utt_0009_surprise.wav", "context": "惊讶"}
|
| 10 |
+
{"utt": "utt_0010_worried", "target_text": "对不起我又给你打了……可是电话一直不通,你没事吧?能不能回我一下,好吗?就发个字也行,我真的有点慌。", "speaker": "Maia", "output_audio": "samples/utt_0010_worried.wav", "context": "担忧"}
|
| 11 |
+
{"utt": "utt_0011_sadness", "target_text": "我以为会好起来的……结果还是没撑住。对不起,我现在真的不想说话,给我一点时间,好吗?", "speaker": "Moon", "output_audio": "samples/utt_0011_sadness.wav", "context": "悲伤"}
|
| 12 |
+
{"utt": "utt_0012_frustration", "target_text": "我真的是尽力了,可还是搞不定……唉,怎么就差一点点呢?算了,你们先说吧,我现在脑子一团糟。", "speaker": "Kai", "output_audio": "samples/utt_0012_frustration.wav", "context": "沮丧"}
|
| 13 |
+
{"utt": "utt_0013_shameful", "target_text": "我……我不是那个意思啦,别一直看我嘛。嗯……要不我们改天再说?", "speaker": "Maia", "output_audio": "samples/utt_0013_shameful.wav", "context": "害羞"}
|
| 14 |
+
{"utt": "utt_0014_disappointed", "target_text": "好吧,我懂了。我以为这次会不一样,结果……还是这样。算了,你别解释了,我没事。", "speaker": "Serena", "output_audio": "samples/utt_0014_disappointed.wav", "context": "失望"}
|
| 15 |
+
{"utt": "utt_0015_anger", "target_text": "你这是在耍我吗?!说好的呢?别跟我打太极,我现在就要一个痛快的说法——要么立刻兑现,要么别在这儿装无辜!", "speaker": "Nofish", "output_audio": "samples/utt_0015_anger.wav", "context": "愤怒"}
|
| 16 |
+
{"utt": "utt_0016_disgust", "target_text": "呃……别靠近我行吗?这味儿真的受不了,把它拿走,好吗?我现在特别不舒服。", "speaker": "Momo", "output_audio": "samples/utt_0016_disgust.wav", "context": "不快"}
|
| 17 |
+
{"utt": "utt_0017_contempt", "target_text": "呵——就这?别把小把戏端到我面前,挺丢人的。省省吧,我没空陪你演。", "speaker": "Nofish", "output_audio": "samples/utt_0017_contempt.wav", "context": "鄙视"}
|
| 18 |
+
{"utt": "utt_0018_pity", "target_text": "唉……别急,慢慢来,好吗?我在这儿。先擦擦眼睛,要不要喝口水,或者我们出去透透气?", "speaker": "Ethan", "output_audio": "samples/utt_0018_pity.wav", "context": "同情"}
|
static/task/punct/MiMo-V2.5/manifest.jsonl
CHANGED
|
@@ -1,13 +1,13 @@
|
|
| 1 |
-
{"utt": "case1", "target_text": "我…我知道了…别催我。", "speaker": "苏打", "output_audio": "samples/case1.wav"}
|
| 2 |
-
{"utt": "case2", "target_text": "好啦——我去就是了。", "speaker": "茉莉", "output_audio": "samples/case2.wav"}
|
| 3 |
-
{"utt": "case3", "target_text": "我没醉!谁说我醉了?再来……再来一杯!", "speaker": "白桦", "output_audio": "samples/case3.wav"}
|
| 4 |
-
{"utt": "case4", "target_text": "等…等等我…哈…我…我真的跑不动了。", "speaker": "冰糖", "output_audio": "samples/case4.wav"}
|
| 5 |
-
{"utt": "case5", "target_text": "这是什…啊!别、别靠近!", "speaker": "白桦", "output_audio": "samples/case5.wav"}
|
| 6 |
-
{"utt": "case6", "target_text": "呼——冷静…冷静…别急。", "speaker": "白桦", "output_audio": "samples/case6.wav"}
|
| 7 |
-
{"utt": "case7", "target_text": "咳…咳咳…我没事,继续。", "speaker": "苏打", "output_audio": "samples/case7.wav"}
|
| 8 |
-
{"utt": "case8", "target_text": "你先…先别说话,让我想想。", "speaker": "苏打", "output_audio": "samples/case8.wav"}
|
| 9 |
-
{"utt": "case9", "target_text": "唉……算了,我认了。", "speaker": "白桦", "output_audio": "samples/case9.wav"}
|
| 10 |
-
{"utt": "case10", "target_text": "行行行——你说得都对。", "speaker": "苏打", "output_audio": "samples/case10.wav"}
|
| 11 |
-
{"utt": "case11", "target_text": "等等……我改主意了。", "speaker": "茉莉", "output_audio": "samples/case11.wav"}
|
| 12 |
-
{"utt": "case12", "target_text": "哈…哈…别、别让我再跑了。", "speaker": "白桦", "output_audio": "samples/case12.wav"}
|
| 13 |
-
{"utt": "case13", "target_text": "嘶…疼…疼疼疼!", "speaker": "白桦", "output_audio": "samples/case13.wav"}
|
|
|
|
| 1 |
+
{"utt": "case1", "target_text": "我…我知道了…别催我。", "speaker": "苏打", "output_audio": "samples/case1.wav", "context": "带点紧张,结巴着开口"}
|
| 2 |
+
{"utt": "case2", "target_text": "好啦——我去就是了。", "speaker": "茉莉", "output_audio": "samples/case2.wav", "context": "无奈得很,拖着长音嘟囔"}
|
| 3 |
+
{"utt": "case3", "target_text": "我没醉!谁说我醉了?再来……再来一杯!", "speaker": "白桦", "output_audio": "samples/case3.wav", "context": "情绪上头,舌头打结似的含糊嚷着"}
|
| 4 |
+
{"utt": "case4", "target_text": "等…等等我…哈…我…我真的跑不动了。", "speaker": "冰糖", "output_audio": "samples/case4.wav", "context": "喘得断断续续,声音发虚地喊着"}
|
| 5 |
+
{"utt": "case5", "target_text": "这是什…啊!别、别靠近!", "speaker": "白桦", "output_audio": "samples/case5.wav", "context": "被吓得一激灵,嗓子一下拔高地叫着"}
|
| 6 |
+
{"utt": "case6", "target_text": "呼——冷静…冷静…别急。", "speaker": "白桦", "output_audio": "samples/case6.wav", "context": "先压住气息,放慢语速低声念叨"}
|
| 7 |
+
{"utt": "case7", "target_text": "咳…咳咳…我没事,继续。", "speaker": "苏打", "output_audio": "samples/case7.wav", "context": "咳得停不下来,还硬撑着开口"}
|
| 8 |
+
{"utt": "case8", "target_text": "你先…先别说话,让我想想。", "speaker": "苏打", "output_audio": "samples/case8.wav", "context": "犹豫着放轻声音,小心地请求"}
|
| 9 |
+
{"utt": "case9", "target_text": "唉……算了,我认了。", "speaker": "白桦", "output_audio": "samples/case9.wav", "context": "泄了气似的,低声认下"}
|
| 10 |
+
{"utt": "case10", "target_text": "行行行——你说得都对。", "speaker": "苏打", "output_audio": "samples/case10.wav", "context": "敷衍得很,拖长声调嘀咕"}
|
| 11 |
+
{"utt": "case11", "target_text": "等等……我改主意了。", "speaker": "茉莉", "output_audio": "samples/case11.wav", "context": "语气冷下来,斩钉截铁地改口"}
|
| 12 |
+
{"utt": "case12", "target_text": "哈…哈…别、别让我再跑了。", "speaker": "白桦", "output_audio": "samples/case12.wav", "context": "喘得上气不接下气,发虚地求饶"}
|
| 13 |
+
{"utt": "case13", "target_text": "嘶…疼…疼疼疼!", "speaker": "白桦", "output_audio": "samples/case13.wav", "context": "疼得倒吸一口气,带着哭腔地喊着"}
|
static/task/punct/Ours/manifest.jsonl
CHANGED
|
@@ -1,13 +1,13 @@
|
|
| 1 |
-
{"utt": "case1", "target_text": "我…我知道了…别催我。", "speaker": "", "output_audio": "samples/case1.wav"}
|
| 2 |
-
{"utt": "case2", "target_text": "好啦——我去就是了。", "speaker": "", "output_audio": "samples/case2.wav"}
|
| 3 |
-
{"utt": "case3", "target_text": "我没醉!谁说我醉了?再来……再来一杯!", "speaker": "", "output_audio": "samples/case3.wav"}
|
| 4 |
-
{"utt": "case4", "target_text": "等…等等我…哈…我…我真的跑不动了。", "speaker": "", "output_audio": "samples/case4.wav"}
|
| 5 |
-
{"utt": "case5", "target_text": "这是什…啊!别、别靠近!", "speaker": "", "output_audio": "samples/case5.wav"}
|
| 6 |
-
{"utt": "case6", "target_text": "呼——冷静…冷静…别急。", "speaker": "", "output_audio": "samples/case6.wav"}
|
| 7 |
-
{"utt": "case7", "target_text": "咳…咳咳…我没事,继续。", "speaker": "", "output_audio": "samples/case7.wav"}
|
| 8 |
-
{"utt": "case8", "target_text": "你先…先别说话,让我想想。", "speaker": "", "output_audio": "samples/case8.wav"}
|
| 9 |
-
{"utt": "case9", "target_text": "唉……算了,我认了。", "speaker": "", "output_audio": "samples/case9.wav"}
|
| 10 |
-
{"utt": "case10", "target_text": "行行行——你说得都对。", "speaker": "", "output_audio": "samples/case10.wav"}
|
| 11 |
-
{"utt": "case11", "target_text": "等等……我改主意了。", "speaker": "", "output_audio": "samples/case11.wav"}
|
| 12 |
-
{"utt": "case12", "target_text": "哈…哈…别、别让我再跑了。", "speaker": "", "output_audio": "samples/case12.wav"}
|
| 13 |
-
{"utt": "case13", "target_text": "嘶…疼…疼疼疼!", "speaker": "", "output_audio": "samples/case13.wav"}
|
|
|
|
| 1 |
+
{"utt": "case1", "target_text": "我…我知道了…别催我。", "speaker": "", "output_audio": "samples/case1.wav", "context": "带点紧张,结巴着开口"}
|
| 2 |
+
{"utt": "case2", "target_text": "好啦——我去就是了。", "speaker": "", "output_audio": "samples/case2.wav", "context": "无奈得很,拖着长音嘟囔"}
|
| 3 |
+
{"utt": "case3", "target_text": "我没醉!谁说我醉了?再来……再来一杯!", "speaker": "", "output_audio": "samples/case3.wav", "context": "情绪上头,舌头打结似的含糊嚷着"}
|
| 4 |
+
{"utt": "case4", "target_text": "等…等等我…哈…我…我真的跑不动了。", "speaker": "", "output_audio": "samples/case4.wav", "context": "喘得断断续续,声音发虚地喊着"}
|
| 5 |
+
{"utt": "case5", "target_text": "这是什…啊!别、别靠近!", "speaker": "", "output_audio": "samples/case5.wav", "context": "被吓得一激灵,嗓子一下拔高地叫着"}
|
| 6 |
+
{"utt": "case6", "target_text": "呼——冷静…冷静…别急。", "speaker": "", "output_audio": "samples/case6.wav", "context": "先压住气息,放慢语速低声念叨"}
|
| 7 |
+
{"utt": "case7", "target_text": "咳…咳咳…我没事,继续。", "speaker": "", "output_audio": "samples/case7.wav", "context": "咳得停不下来,还硬撑着开口"}
|
| 8 |
+
{"utt": "case8", "target_text": "你先…先别说话,让我想想。", "speaker": "", "output_audio": "samples/case8.wav", "context": "犹豫着放轻声音,小心地请求"}
|
| 9 |
+
{"utt": "case9", "target_text": "唉……算了,我认了。", "speaker": "", "output_audio": "samples/case9.wav", "context": "泄了气似的,低声认下"}
|
| 10 |
+
{"utt": "case10", "target_text": "行行行——你说得都对。", "speaker": "", "output_audio": "samples/case10.wav", "context": "敷衍得很,拖长声调嘀咕"}
|
| 11 |
+
{"utt": "case11", "target_text": "等等……我改主意了。", "speaker": "", "output_audio": "samples/case11.wav", "context": "语气冷下来,斩钉截铁地改口"}
|
| 12 |
+
{"utt": "case12", "target_text": "哈…哈…别、别让我再跑了。", "speaker": "", "output_audio": "samples/case12.wav", "context": "喘得上气不接下气,发虚地求饶"}
|
| 13 |
+
{"utt": "case13", "target_text": "嘶…疼…疼疼疼!", "speaker": "", "output_audio": "samples/case13.wav", "context": "疼得倒吸一口气,带着哭腔地喊着"}
|
static/task/punct/SoulX-Podcast/manifest.jsonl
CHANGED
|
@@ -1,13 +1,13 @@
|
|
| 1 |
-
{"utt": "case1", "target_text": "我…我知道了…别催我。", "speaker": "", "output_audio": "samples/case1.wav"}
|
| 2 |
-
{"utt": "case2", "target_text": "好啦——我去就是了。", "speaker": "", "output_audio": "samples/case2.wav"}
|
| 3 |
-
{"utt": "case3", "target_text": "我没醉!谁说我醉了?再来……再来一杯!", "speaker": "", "output_audio": "samples/case3.wav"}
|
| 4 |
-
{"utt": "case4", "target_text": "等…等等我…哈…我…我真的跑不动了。", "speaker": "", "output_audio": "samples/case4.wav"}
|
| 5 |
-
{"utt": "case5", "target_text": "这是什…啊!别、别靠近!", "speaker": "", "output_audio": "samples/case5.wav"}
|
| 6 |
-
{"utt": "case6", "target_text": "呼——冷静…冷静…别急。", "speaker": "", "output_audio": "samples/case6.wav"}
|
| 7 |
-
{"utt": "case7", "target_text": "咳…咳咳…我没事,继续。", "speaker": "", "output_audio": "samples/case7.wav"}
|
| 8 |
-
{"utt": "case8", "target_text": "你先…先别说话,让我想想。", "speaker": "", "output_audio": "samples/case8.wav"}
|
| 9 |
-
{"utt": "case9", "target_text": "唉……算了,我认了。", "speaker": "", "output_audio": "samples/case9.wav"}
|
| 10 |
-
{"utt": "case10", "target_text": "行行行——你说得都对。", "speaker": "", "output_audio": "samples/case10.wav"}
|
| 11 |
-
{"utt": "case11", "target_text": "等等……我改主意了。", "speaker": "", "output_audio": "samples/case11.wav"}
|
| 12 |
-
{"utt": "case12", "target_text": "哈…哈…别、别让我再跑了。", "speaker": "", "output_audio": "samples/case12.wav"}
|
| 13 |
-
{"utt": "case13", "target_text": "嘶…疼…疼疼疼!", "speaker": "", "output_audio": "samples/case13.wav"}
|
|
|
|
| 1 |
+
{"utt": "case1", "target_text": "我…我知道了…别催我。", "speaker": "", "output_audio": "samples/case1.wav", "context": "带点紧张,结巴着开口"}
|
| 2 |
+
{"utt": "case2", "target_text": "好啦——我去就是了。", "speaker": "", "output_audio": "samples/case2.wav", "context": "无奈得很,拖着长音嘟囔"}
|
| 3 |
+
{"utt": "case3", "target_text": "我没醉!谁说我醉了?再来……再来一杯!", "speaker": "", "output_audio": "samples/case3.wav", "context": "情绪上头,舌头打结似的含糊嚷着"}
|
| 4 |
+
{"utt": "case4", "target_text": "等…等等我…哈…我…我真的跑不动了。", "speaker": "", "output_audio": "samples/case4.wav", "context": "喘得断断续续,声音发虚地喊着"}
|
| 5 |
+
{"utt": "case5", "target_text": "这是什…啊!别、别靠近!", "speaker": "", "output_audio": "samples/case5.wav", "context": "被吓得一激灵,嗓子一下拔高地叫着"}
|
| 6 |
+
{"utt": "case6", "target_text": "呼——冷静…冷静…别急。", "speaker": "", "output_audio": "samples/case6.wav", "context": "先压住气息,放慢语速低声念叨"}
|
| 7 |
+
{"utt": "case7", "target_text": "咳…咳咳…我没事,继续。", "speaker": "", "output_audio": "samples/case7.wav", "context": "咳得停不下来,还硬撑着开口"}
|
| 8 |
+
{"utt": "case8", "target_text": "你先…先别说话,让我想想。", "speaker": "", "output_audio": "samples/case8.wav", "context": "犹豫着放轻声音,小心地请求"}
|
| 9 |
+
{"utt": "case9", "target_text": "唉……算了,我认了。", "speaker": "", "output_audio": "samples/case9.wav", "context": "泄了气似的,低声认下"}
|
| 10 |
+
{"utt": "case10", "target_text": "行行行——你说得都对。", "speaker": "", "output_audio": "samples/case10.wav", "context": "敷衍得很,拖长声调嘀咕"}
|
| 11 |
+
{"utt": "case11", "target_text": "等等……我改主意了。", "speaker": "", "output_audio": "samples/case11.wav", "context": "语气冷下来,斩钉截铁地改口"}
|
| 12 |
+
{"utt": "case12", "target_text": "哈…哈…别、别让我再跑了。", "speaker": "", "output_audio": "samples/case12.wav", "context": "喘得上气不接下气,发虚地求饶"}
|
| 13 |
+
{"utt": "case13", "target_text": "嘶…疼…疼疼疼!", "speaker": "", "output_audio": "samples/case13.wav", "context": "疼得倒吸一口气,带着哭腔地喊着"}
|