File size: 773 Bytes
f1938e2
93b1734
 
 
 
a61efa6
2425131
93b1734
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
from src.chatterbox.mtl_tts import ChatterboxMultilingualTTS
import torchaudio as ta
from safetensors.torch import load_file as load_safetensors

# Torch device string handed to the model loader and to the T3 module below.
# Alternatives mentioned by the original author: "mps" or "cuda".
device = "cpu"

# Build the pretrained multilingual pipeline; its T3 weights are overwritten
# further down with the checkpoint loaded from disk.
multilingual_model = ChatterboxMultilingualTTS.from_pretrained(device=device)

# ----
# Prerequisite: the checkpoint file must already exist locally. It is read
# from the relative path
#   Thomcles/Chatterbox-TTS-Persian-Farsi/t3_fa.safetensors
# (resolved against the current working directory), so download it from
# Hugging Face and store it there before running this script.
# NOTE(review): the directory layout presumably mirrors the Hugging Face
# repository id -- confirm against the model card.
# ----
t3_state = load_safetensors(
    "Thomcles/Chatterbox-TTS-Persian-Farsi/t3_fa.safetensors",
    device="cpu",  # tensors are always read onto the CPU first
)

# Swap the loaded weights into the T3 sub-module, then move it to the chosen
# device and switch it to evaluation mode.
t3_module = multilingual_model.t3
t3_module.load_state_dict(t3_state)
t3_module.to(device).eval()

# Synthesize one Persian sentence.
# NOTE(review): language_id is explicitly None here -- presumably the
# replacement T3 weights do not rely on a language tag; confirm.
persian_text = "سلام! به آزمایش تبدیل متن به گفتار خوش آمدید."
wav_persian = multilingual_model.generate(persian_text, language_id=None)

# Write the generated waveform to disk at the sample rate the model reports.
sample_rate = multilingual_model.sr
ta.save("test-fa.wav", wav_persian, sample_rate)