Instructions to use Renderlib-dev/sooktam2 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use Renderlib-dev/sooktam2 with Transformers:
```python
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("text-to-speech", model="Renderlib-dev/sooktam2", trust_remote_code=True)

# Load model directly
from transformers import AutoModel

model = AutoModel.from_pretrained("Renderlib-dev/sooktam2", trust_remote_code=True, dtype="auto")
```
- F5-TTS
How to use Renderlib-dev/sooktam2 with F5-TTS:
```
# No code snippets available yet for this library.
# To use this model, check the repository files and the library's documentation.
# Want to help? PRs adding snippets are welcome at:
# https://github.com/huggingface/huggingface.js
```
- Notebooks
- Google Colab
- Kaggle
# Packaging metadata for the "f5-tts" distribution, built with setuptools.

[build-system]
requires = ["setuptools >= 61.0", "setuptools-scm>=8.0"]
build-backend = "setuptools.build_meta"

[project]
name = "f5-tts"
version = "1.1.9"
description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
readme = "README.md"
license = { text = "MIT License" }
classifiers = [
    "License :: OSI Approved :: MIT License",
    "Operating System :: OS Independent",
    "Programming Language :: Python :: 3",
]
requires-python = ">=3.9,<3.12"
dependencies = [
    "accelerate>=0.33.0",
    # The marker skips bitsandbytes on arm64 machines and on macOS.
    "bitsandbytes>0.37.0; platform_machine!='arm64' and platform_system!='Darwin'",
    "cached_path",
    "click",
    "datasets",
    "ema-pytorch==0.7.9",
    "gradio>=5.0.0",
    "hydra-core>=1.3.0",
    "jiwer",
    "jieba",
    "zhon",
    "pytorch-wpe==0.0.1",
    "torch-complex==0.4.4",
    # NOTE(review): torchcodec releases are built against a specific torch
    # release; confirm that 0.9.1 works with the torch==2.6.0 pin below and
    # with the Python 3.9 floor declared in requires-python.
    "torchcodec==0.9.1",
    "librosa",
    "matplotlib",
    # The numpy cap applies only on Python <= 3.10; Python 3.11 is unconstrained.
    "numpy<=1.26.4; python_version<='3.10'",
    "pydantic<=2.10.6",
    "pydub",
    "pypinyin",
    "safetensors",
    "soundfile",
    "tomli",
    # torch, torchaudio and torchvision are pinned to exact versions.
    "torch==2.6.0",
    "torchaudio==2.6.0",
    "torchdiffeq==0.2.5",
    "torchelastic==0.2.2",
    "torchvision==0.21.0",
    "tqdm>=4.65.0",
    "transformers",
    "transformers_stream_generator",
    "unidecode",
    "vocos",
    "wandb",
    "x_transformers>=1.31.14",
]

[project.optional-dependencies]
# Installed via the "eval" extra. "jiwer" and "zhon" are also listed in the
# core dependencies above, so they are redundant here but harmless.
eval = [
    "faster_whisper==1.2.1",
    "funasr",
    "jiwer",
    "modelscope",
    "s3prl",
    "zhconv",
    "zhon",
]

[project.urls]
Homepage = "https://github.com/SWivid/F5-TTS"

[project.scripts]
# Console commands, each mapped to a "module:function" entry point.
f5-tts_infer-cli = "f5_tts.infer.infer_cli:main"
f5-tts_infer-gradio = "f5_tts.infer.infer_gradio:main"
f5-tts_finetune-cli = "f5_tts.train.finetune_cli:main"
f5-tts_finetune-gradio = "f5_tts.train.finetune_gradio:main"