nxhong committed on
Commit
b9aa16e
·
verified ·
1 Parent(s): f1134ba

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -3
app.py CHANGED
@@ -37,16 +37,19 @@ LANGS = ["vi", "en", "zh-cn", "ja", "ko"]
37
  # ===== TTS FUNCTION =====
38
  def tts_fn(text, language, ref_audio):
39
  gpt_latent, spk_embed = MODEL.get_conditioning_latents(
40
- audio_path=ref_audio, gpt_cond_len=18, gpt_cond_chunk_len=4, max_ref_length=50
 
 
 
41
  )
42
  out = MODEL.inference(
43
  text=text,
44
  language=language,
45
- gpt_cond_latent=gpt_latent,
46
  speaker_embedding=spk_embed,
47
  temperature=0.65,
48
  repetition_penalty=2.5,
49
- enable_text_splitting=False
50
  )
51
  wav = torch.tensor(out["wav"]).unsqueeze(0)
52
  torchaudio.save("output.wav", wav, 24000)
 
37
  # ===== TTS FUNCTION =====
38
  def tts_fn(text, language, ref_audio):
39
  gpt_latent, spk_embed = MODEL.get_conditioning_latents(
40
+ audio_path=ref_audio,
41
+ gpt_cond_len=18,
42
+ gpt_cond_chunk_len=4,
43
+ max_ref_length=50
44
  )
45
  out = MODEL.inference(
46
  text=text,
47
  language=language,
48
+ gpt_cond_latent=gpt_latent,
49
  speaker_embedding=spk_embed,
50
  temperature=0.65,
51
  repetition_penalty=2.5,
52
+ enable_text_splitting=True
53
  )
54
  wav = torch.tensor(out["wav"]).unsqueeze(0)
55
  torchaudio.save("output.wav", wav, 24000)