Commit
·
f2d53f6
1
Parent(s):
3e85610
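Aligned with TTS: speaker reference labels are now 1-indexed (`[S{speaker_idx+1}]` instead of `[S{speaker_idx}]`), and `truncation` is set to `False` for the user role.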
Browse files
- processing_moss_tts.py +2 -1
processing_moss_tts.py
CHANGED
|
@@ -159,7 +159,7 @@ class UserMessage(Message):
|
|
| 159 |
reference = []
|
| 160 |
for speaker_idx, speaker_reference in enumerate(self.reference):
|
| 161 |
if speaker_reference is not None:
|
| 162 |
-
reference.append(f"[S{speaker_idx}]:\n{AUDIO_PLACEHOLDER}")
|
| 163 |
reference = "\n".join(reference)
|
| 164 |
audio_codes_list = [
|
| 165 |
speaker_reference
|
|
@@ -631,6 +631,7 @@ class MossTTSDelayProcessor(ProcessorMixin):
|
|
| 631 |
"""
|
| 632 |
if role == "user":
|
| 633 |
audio_gen_slot_token = audio_delay_slot_token = self.audio_user_slot_token
|
|
|
|
| 634 |
else:
|
| 635 |
audio_gen_slot_token = self.audio_assistant_gen_slot_token
|
| 636 |
audio_delay_slot_token = self.audio_assistant_delay_slot_token
|
|
|
|
| 159 |
reference = []
|
| 160 |
for speaker_idx, speaker_reference in enumerate(self.reference):
|
| 161 |
if speaker_reference is not None:
|
| 162 |
+
reference.append(f"[S{speaker_idx+1}]:\n{AUDIO_PLACEHOLDER}")
|
| 163 |
reference = "\n".join(reference)
|
| 164 |
audio_codes_list = [
|
| 165 |
speaker_reference
|
|
|
|
| 631 |
"""
|
| 632 |
if role == "user":
|
| 633 |
audio_gen_slot_token = audio_delay_slot_token = self.audio_user_slot_token
|
| 634 |
+
truncation = False
|
| 635 |
else:
|
| 636 |
audio_gen_slot_token = self.audio_assistant_gen_slot_token
|
| 637 |
audio_delay_slot_token = self.audio_assistant_delay_slot_token
|