Create app.py
Browse files
app.py
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from chatterbox_git.src.chatterbox import mtl_tts
|
| 2 |
+
import torchaudio as ta
|
| 3 |
+
from safetensors.torch import load_file as load_safetensors
|
| 4 |
+
|
| 5 |
+
device = "cpu"  # alternatively "mps" or "cuda"

# Build the multilingual TTS model from its pretrained checkpoint on `device`.
multilingual_model = mtl_tts.ChatterboxMultilingualTTS.from_pretrained(device=device)

# ----
# Before running: download t3_fa.safetensors from Hugging Face (presumably the
# Thomcles/Chatterbox-TTS-Persian-Farsi repository -- confirm) and place it in
# the current directory.
# ----

# load_file() opens a local path; it does not download from the Hub. The path
# therefore has to name the file in the current directory, as instructed
# above, rather than a "<user>/<repo>/<file>" repository-style path.
t3_state = load_safetensors("t3_fa.safetensors", device="cpu")
multilingual_model.t3.load_state_dict(t3_state)
# Weights were loaded on CPU; move the module to the target device and switch
# it to evaluation mode before generating.
multilingual_model.t3.to(device).eval()

persian_text = "سلام! به آزمایش تبدیل متن به گفتار خوش آمدید."
# NOTE(review): language_id=None is kept exactly as written; confirm that the
# fine-tuned checkpoint is meant to run without a language tag.
wav_persian = multilingual_model.generate(persian_text, language_id=None)
ta.save("test-fa.wav", wav_persian, multilingual_model.sr)
|