Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
|
@@ -37,16 +37,19 @@ LANGS = ["vi", "en", "zh-cn", "ja", "ko"]
|
|
| 37 |
# ===== TTS FUNCTION =====
|
| 38 |
def tts_fn(text, language, ref_audio):
|
| 39 |
gpt_latent, spk_embed = MODEL.get_conditioning_latents(
|
| 40 |
-
audio_path=ref_audio,
|
|
|
|
|
|
|
|
|
|
| 41 |
)
|
| 42 |
out = MODEL.inference(
|
| 43 |
text=text,
|
| 44 |
language=language,
|
| 45 |
-
gpt_cond_latent=gpt_latent,
|
| 46 |
speaker_embedding=spk_embed,
|
| 47 |
temperature=0.65,
|
| 48 |
repetition_penalty=2.5,
|
| 49 |
-
enable_text_splitting=
|
| 50 |
)
|
| 51 |
wav = torch.tensor(out["wav"]).unsqueeze(0)
|
| 52 |
torchaudio.save("output.wav", wav, 24000)
|
|
|
|
| 37 |
# ===== TTS FUNCTION =====
|
| 38 |
def tts_fn(text, language, ref_audio):
|
| 39 |
gpt_latent, spk_embed = MODEL.get_conditioning_latents(
|
| 40 |
+
audio_path=ref_audio,
|
| 41 |
+
gpt_cond_len=18,
|
| 42 |
+
gpt_cond_chunk_len=4,
|
| 43 |
+
max_ref_length=50
|
| 44 |
)
|
| 45 |
out = MODEL.inference(
|
| 46 |
text=text,
|
| 47 |
language=language,
|
| 48 |
+
gpt_cond_latent=gpt_latent,
|
| 49 |
speaker_embedding=spk_embed,
|
| 50 |
temperature=0.65,
|
| 51 |
repetition_penalty=2.5,
|
| 52 |
+
enable_text_splitting=True
|
| 53 |
)
|
| 54 |
wav = torch.tensor(out["wav"]).unsqueeze(0)
|
| 55 |
torchaudio.save("output.wav", wav, 24000)
|