ollui committed on
Commit
f6de20b
·
verified ·
1 Parent(s): 3e8bbee

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +23 -0
app.py ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
import torch
from transformers import AutoTokenizer, VitsModel
import gradio as gr
import scipy.io.wavfile

# Hugging Face Hub checkpoint: the MMS text-to-speech model for Chuvash.
MODEL_ID = "facebook/mms-tts-chv"

# MMS-TTS checkpoints are VITS models, so they are loaded with VitsModel and a
# plain tokenizer rather than a speech seq2seq class and a processor.
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
model = VitsModel.from_pretrained(MODEL_ID)


def tts(text):
    """Synthesize speech for *text* and return the path of the WAV file.

    Args:
        text: The text to speak, as entered in the Gradio textbox.

    Returns:
        The path of the 16-bit PCM WAV file that was written ("output.wav").

    Raises:
        gr.Error: If *text* is empty or contains only whitespace.
    """
    if not text or not text.strip():
        raise gr.Error("Please enter some text to synthesize.")

    inputs = tokenizer(text, return_tensors="pt")
    with torch.no_grad():
        # VITS emits the waveform directly from a forward pass; there is no
        # generate()/decode step. The output is (batch, samples), so take the
        # single item of the batch.
        waveform = model(**inputs).waveform[0]

    # Clamp before scaling so samples outside [-1, 1] saturate instead of
    # wrapping around when cast to int16.
    pcm = (waveform.float().clamp(-1.0, 1.0) * 32767).cpu().numpy().astype("int16")

    # Write the header with the checkpoint's own sampling rate; a hard-coded
    # rate plays the audio at the wrong speed/pitch when it does not match.
    scipy.io.wavfile.write("output.wav", model.config.sampling_rate, pcm)
    return "output.wav"


# Build the Gradio web interface and start serving it.
iface = gr.Interface(fn=tts, inputs="text", outputs="audio", title="TTS Chuvash Facebook MMS")
iface.launch()