Inial committed on
Commit
d378de6
·
verified ·
1 Parent(s): a3c62ff

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -14
app.py CHANGED
@@ -1,23 +1,21 @@
1
  import gradio as gr
2
  import torch
3
- from transformers import AutoProcessor, AutoModelForTextToSpeech
4
- import scipy.io.wavfile
5
- import tempfile
6
-
7
- model_id = "facebook/mms-tts-lis"
8
 
9
  def tts_lisu(text):
 
10
  try:
11
- processor = AutoProcessor.from_pretrained(model_id)
12
- model = AutoModelForTextToSpeech.from_pretrained(model_id)
13
-
14
- inputs = processor(text=text, return_tensors="pt")
15
  with torch.no_grad():
16
- speech = model(**inputs).waveform
17
-
18
- with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
19
- scipy.io.wavfile.write(f.name, rate=16000, data=speech.squeeze().cpu().numpy())
20
- return "✅ Giọng Lisu (ꓡꓲ-ꓢꓴ)", f.name
 
21
  except Exception as e:
22
  return f"❌ Lỗi: {str(e)}", None
23
 
 
1
  import gradio as gr
2
  import torch
3
+ import torchaudio
4
+ from transformers import VitsModel, VitsTokenizer
 
 
 
5
 
6
  def tts_lisu(text):
7
+ model_id = "facebook/mms-tts-lis"
8
  try:
9
+ tokenizer = VitsTokenizer.from_pretrained(model_id)
10
+ model = VitsModel.from_pretrained(model_id)
11
+ inputs = tokenizer(text, return_tensors="pt")
 
12
  with torch.no_grad():
13
+ output = model(**inputs)
14
+ waveform = output.waveform.squeeze().cpu()
15
+ sample_rate = model.config.sampling_rate
16
+ path = "lisu.wav"
17
+ torchaudio.save(path, waveform.unsqueeze(0), sample_rate)
18
+ return "✅ Giọng Lisu (ꓡꓲ-ꓢꓴ)", path
19
  except Exception as e:
20
  return f"❌ Lỗi: {str(e)}", None
21