# XTTSv2-multi / requirements.txt
# Rasmus Lellep
# initial commit
# e9a0669
# Core dependencies.
# Lines that start with `###` are requirements that have been commented out;
# pip ignores them, so those packages are not installed from this file.
# numpy is pinned to one exact version; the remaining active entries are lower bounds.
numpy==1.26.0
cython>=3.0.0
scipy>=1.13.0
torch>=2.1
torchaudio>=2.1.0
soundfile>=0.12.0
librosa>=0.11.0
###scikit-learn>=1.3.0
numba>0.58.0 # strict `>`: 0.58.0 itself is excluded (presumably because of the numpy 1.26 pin; TODO confirm)
inflect>=5.6.0
tqdm>=4.64.1
anyascii>=0.3.0
pyyaml>=6.0
fsspec[http]>=2023.6.0
aiohttp>=3.8.1 # presumably the HTTP client used by fsspec[http]; TODO confirm
packaging>=23.1
typing_extensions>=4.10
###mutagen==1.47.0
# Dependencies for the examples
flask>=3.0.0 #
# Dependencies for inference
pysbd>=0.3.4
# Dependencies for the notebooks
# bokeh is pinned to one exact version; pandas is capped below 3.0.
bokeh==3.0.3
umap-learn>=0.5.1
pandas>=1.4,<3.0
# Dependencies for training
matplotlib>=3.8.4
# Coqui stack
# The `###` line below is a commented-out requirement: `trainer` is not installed
# from this file; `coqui-tts-trainer` is the active entry.
# Both ranged entries are limited to a single minor series (0.3.x and 0.2.x).
###trainer>=0.0.36
coqui-tts-trainer>=0.3.0,<0.4.0
# Config management
coqpit-config>=0.2.0,<0.3.0
monotonic-alignment-search>=0.1.0
# gruut plus its language extras (German, Spanish, French); pinned to one exact version
gruut[de,es,fr]==2.4.0
# Dependencies for Chinese grapheme-to-phoneme conversion
jieba>=0.42.1
pypinyin>=0.40.0
# Dependencies for Korean
# `###nltk` is a commented-out requirement and is not installed from this file.
# NOTE(review): `pip` itself is listed as a dependency in this group; presumably
# one of the Korean packages needs it at runtime. Confirm before removing.
hangul_romanize>=0.1.0
jamo>=0.4.1
###nltk
g2pkk>=0.1.1
pip>=22.2
# Dependencies for Bangla
bangla>=0.0.2
bnnumerizer>=0.0.2
bnunicodenormalizer>=0.1.0
# Dependencies for Japanese
# unidic-lite is requested twice: once as an exact pin and once through the
# `fugashi[unidic-lite]` extra.
mecab-python3>=1.0.2
unidic-lite==1.0.8
cutlet>=0.2.0
fugashi[unidic-lite]>=1.3.0
# Dependencies for Estonian
# Direct reference: installed from the Git repository at ref v1.0.1, not from a package index.
tts_preprocess_et @ git+https://github.com/TartuNLP/tts_preprocess_et.git@v1.0.1
# Dependencies for Tortoise
einops>=0.6.0
transformers>=4.52.1
# Dependencies for Bark
encodec>=0.1.1
# Dependencies for XTTS
# `###unidecode` is a commented-out requirement and is not installed from this file.
# NOTE(review): tokenizers is pinned to one exact version while transformers only
# has a lower bound; presumably the pin limits which transformers releases pip can
# select. Verify the pair resolves.
# NOTE(review): langid, gradio and torchcodec carry no version constraint.
###unidecode>=1.3.2
num2words>=0.5.14
spacy[ja]>=3,<3.8
tokenizers==0.21.4
langid
gradio
torchcodec