Commit
·
3e85610
1
Parent(s):
833d379
Fix Normalization
Browse files
- processing_moss_tts.py +2 -2
processing_moss_tts.py
CHANGED
|
@@ -687,7 +687,7 @@ class MossTTSDelayProcessor(ProcessorMixin):
|
|
| 687 |
audio_start_idx = int(audio_start_idx_t.item())
|
| 688 |
audio_end_idx = int(audio_end_idx_t.item())
|
| 689 |
delay_audio_codes = self.apply_delay_pattern(
|
| 690 |
-
|
| 691 |
)
|
| 692 |
pad_codes = torch.full(
|
| 693 |
(audio_start_idx - prefix_idx + 1, n_vq),
|
|
@@ -762,7 +762,7 @@ class MossTTSDelayProcessor(ProcessorMixin):
|
|
| 762 |
if breaks.numel() == 0:
|
| 763 |
segments_idx = [idx]
|
| 764 |
else:
|
| 765 |
-
segments_idx = torch.split(idx, breaks
|
| 766 |
|
| 767 |
audio_codes_list = [audio_codes[s] for s in segments_idx]
|
| 768 |
|
|
|
|
| 687 |
audio_start_idx = int(audio_start_idx_t.item())
|
| 688 |
audio_end_idx = int(audio_end_idx_t.item())
|
| 689 |
delay_audio_codes = self.apply_delay_pattern(
|
| 690 |
+
audio_codes, self.model_config.audio_pad_code
|
| 691 |
)
|
| 692 |
pad_codes = torch.full(
|
| 693 |
(audio_start_idx - prefix_idx + 1, n_vq),
|
|
|
|
| 762 |
if breaks.numel() == 0:
|
| 763 |
segments_idx = [idx]
|
| 764 |
else:
|
| 765 |
+
segments_idx = torch.split(idx, breaks)
|
| 766 |
|
| 767 |
audio_codes_list = [audio_codes[s] for s in segments_idx]
|
| 768 |
|