ollui commited on
Commit
a5ae415
·
verified ·
1 Parent(s): f2bf50b

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +21 -0
app.py ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from transformers import AutoProcessor, VitsModel
2
+ import torch
3
+ import gradio as gr
4
+ import scipy.io.wavfile
5
+
6
+ model_id = "facebook/mms-tts-bod"
7
+
8
+ processor = AutoProcessor.from_pretrained(model_id)
9
+ model = VitsModel.from_pretrained(model_id)
10
+ model.eval()
11
+
12
+ def tts_fn(text):
13
+ inputs = processor(text=text, return_tensors="pt")
14
+ with torch.no_grad():
15
+ output = model(**inputs)
16
+ audio = output.waveform.squeeze().numpy()
17
+ sample_rate = model.config.sampling_rate
18
+ return (sample_rate, audio)
19
+
20
+ demo = gr.Interface(fn=tts_fn, inputs=gr.Textbox(label="Nhập văn bản tiếng Tây Tạng"), outputs="audio")
21
+ demo.launch()