# Build configuration: setuptools' PEP 517 backend. setuptools-scm must be
# available at build time; the package version itself is declared statically
# in [project] below.
[build-system]
requires = ["setuptools>=61.0", "setuptools-scm>=8.0"]
build-backend = "setuptools.build_meta"

# Core package metadata (PEP 621).
[project]
name = "f5-tts"
version = "1.1.9"
description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
readme = "README.md"
license = { text = "MIT License" }
classifiers = [
    "License :: OSI Approved :: MIT License",
    "Operating System :: OS Independent",
    "Programming Language :: Python :: 3",
]
requires-python = ">=3.9,<3.12"
# Runtime requirements as PEP 508 strings, sorted alphabetically.
dependencies = [
    "accelerate>=0.33.0",
    # Only installed when the machine is not arm64 and the OS is not Darwin.
    "bitsandbytes>0.37.0; platform_machine!='arm64' and platform_system!='Darwin'",
    "cached_path",
    "click",
    "datasets",
    "ema-pytorch==0.7.9",
    "gradio>=5.0.0",
    "hydra-core>=1.3.0",
    "jieba",
    "jiwer",
    "librosa",
    "matplotlib",
    # The numpy cap applies only on Python 3.10 and older; newer interpreters
    # get an unconstrained numpy.
    "numpy<=1.26.4; python_version<='3.10'",
    "pydantic<=2.10.6",
    "pydub",
    "pypinyin",
    "pytorch-wpe==0.0.1",
    "safetensors",
    "soundfile",
    "tomli",
    # torch, torchaudio and torchvision are pinned to exact versions.
    "torch==2.6.0",
    "torch-complex==0.4.4",
    "torchaudio==2.6.0",
    # NOTE(review): torchcodec releases are built against a specific torch
    # release. Confirm that 0.9.1 works with the torch==2.6.0 pin above and
    # that it publishes wheels for Python 3.9, which requires-python allows.
    "torchcodec==0.9.1",
    "torchdiffeq==0.2.5",
    # NOTE(review): elastic launching ships inside torch itself
    # (torch.distributed.elastic); confirm this standalone package is still
    # imported before keeping the pin.
    "torchelastic==0.2.2",
    "torchvision==0.21.0",
    "tqdm>=4.65.0",
    "transformers",
    "transformers_stream_generator",
    "unidecode",
    "vocos",
    "wandb",
    "x_transformers>=1.31.14",
    "zhon",
]

# Extras, installed with `pip install "f5-tts[eval]"`.
[project.optional-dependencies]
# jiwer and zhon also appear in the core dependency list above.
eval = [
    "faster_whisper==1.2.1",
    "funasr",
    "jiwer",
    "modelscope",
    "s3prl",
    "zhconv",
    "zhon",
]

[project.urls]
Homepage = "https://github.com/SWivid/F5-TTS"

# Console commands, each mapped to a `module:function` entry point.
[project.scripts]
f5-tts_infer-cli = "f5_tts.infer.infer_cli:main"
f5-tts_infer-gradio = "f5_tts.infer.infer_gradio:main"
f5-tts_finetune-cli = "f5_tts.train.finetune_cli:main"
f5-tts_finetune-gradio = "f5_tts.train.finetune_gradio:main"