# Hugging Face Space (status: Running) - file size: 826 Bytes
import tempfile
import gradio as gr
import soundfile as sf
from transformers import (
AutoTokenizer,
VitsModel
)
import torch
# Checkpoint identifier passed to both `from_pretrained` calls below.
MODEL_NAME = "facebook/mms-tts-nan"
# Tokenizer and VITS model are created once at import time, so every call to
# `tts` reuses the same instances instead of reloading them per request.
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
model = VitsModel.from_pretrained(MODEL_NAME)
def tts(text):
    """Synthesize speech for *text* and return the path to a WAV file.

    The text is tokenized with the module-level ``tokenizer``, run through
    the module-level ``model`` without gradient tracking, and the resulting
    waveform is written to a freshly created temporary ``.wav`` file using
    the model's configured sampling rate.

    Args:
        text: The text to convert to speech.

    Returns:
        Filesystem path of the generated WAV file. The file is created with
        ``delete=False``, so it is not removed automatically by this
        function.
    """
    inputs = tokenizer(text, return_tensors="pt")

    # Inference only: skip autograd bookkeeping.
    with torch.no_grad():
        output = model(**inputs)

    waveform = output.waveform.squeeze().cpu().numpy()

    # Reserve a unique path and close the handle immediately. Leaving it open
    # leaks a file descriptor per call and prevents the file from being
    # reopened by name on Windows.
    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
        wav_path = tmp.name

    sf.write(wav_path, waveform, model.config.sampling_rate)
    return wav_path
# Single-function Gradio UI: one text box in, one audio player out.
# `type="filepath"` matches `tts`, which returns the path of a WAV file.
demo = gr.Interface(
    fn=tts,
    inputs=gr.Textbox(label="輸入文字"),
    outputs=gr.Audio(type="filepath"),
    title="Taiwanese TTS",
)

# Start the web server when the module is executed.
demo.launch()