# Packaging metadata for the f5-tts distribution (PEP 517 build backend + PEP 621 project table).

[build-system]
requires = ["setuptools >= 61.0", "setuptools-scm>=8.0"]
build-backend = "setuptools.build_meta"

[project]
name = "f5-tts"
version = "1.1.9"
description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
readme = "README.md"
license = { text = "MIT License" }
classifiers = [
    "License :: OSI Approved :: MIT License",
    "Operating System :: OS Independent",
    "Programming Language :: Python :: 3",
]
# The floor is 3.10 rather than 3.9: gradio>=5.0.0 (a hard dependency below)
# has no release installable on Python 3.9, so advertising 3.9 only moved the
# failure from a clear "unsupported Python" message to a resolver error.
requires-python = ">=3.10,<3.12"
dependencies = [
    "accelerate>=0.33.0",
    # Not installed on arm64 machines or on macOS (Darwin).
    "bitsandbytes>0.37.0; platform_machine!='arm64' and platform_system!='Darwin'",
    "cached_path",
    "click",
    "datasets",
    "ema-pytorch==0.7.9",
    "gradio>=5.0.0",
    "hydra-core>=1.3.0",
    "jiwer",
    "jieba",
    "zhon",
    "pytorch-wpe==0.0.1",
    "torch-complex==0.4.4",
    "torchcodec==0.9.1",
    "librosa",
    "matplotlib",
    # The cap applies only on Python <= 3.10; on 3.11 numpy is left unconstrained here.
    "numpy<=1.26.4; python_version<='3.10'",
    "pydantic<=2.10.6",
    "pydub",
    "pypinyin",
    "safetensors",
    "soundfile",
    "tomli",
    # torch, torchaudio and torchvision are pinned together as one release set.
    "torch==2.6.0",
    "torchaudio==2.6.0",
    "torchdiffeq==0.2.5",
    "torchelastic==0.2.2",
    "torchvision==0.21.0",
    "tqdm>=4.65.0",
    "transformers",
    "transformers_stream_generator",
    "unidecode",
    "vocos",
    "wandb",
    "x_transformers>=1.31.14",
]

[project.optional-dependencies]
# Extra packages pulled in by `pip install f5-tts[eval]`.
eval = [
    "faster_whisper==1.2.1",
    "funasr",
    "jiwer",
    "modelscope",
    "s3prl",
    "zhconv",
    "zhon",
]

[project.urls]
Homepage = "https://github.com/SWivid/F5-TTS"

[project.scripts]
# Console commands mapped to `module:function` entry points.
f5-tts_infer-cli = "f5_tts.infer.infer_cli:main"
f5-tts_infer-gradio = "f5_tts.infer.infer_gradio:main"
f5-tts_finetune-cli = "f5_tts.train.finetune_cli:main"
f5-tts_finetune-gradio = "f5_tts.train.finetune_gradio:main"