Spaces:
Running
Running
TTS added: LLaSA 8B; re-enabled OpenVoice to get to ~1000 votes; Fish Speech (FS) broken
Browse files- app/models.py +23 -9
app/models.py
CHANGED
|
@@ -25,14 +25,14 @@ AVAILABLE_MODELS = {
|
|
| 25 |
# gradio version that works with most spaces: 4.29
|
| 26 |
# 'coqui/xtts': 'coqui/xtts', # 4.29 4.32; extra_headers error appears for 5.13
|
| 27 |
# 'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
|
| 28 |
-
|
| 29 |
-
|
| 30 |
# 'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
|
| 31 |
'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
|
| 32 |
'Pendrokar/xVASynth-TTS/NoDeepMoji': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
|
| 33 |
# 'coqui/CoquiTTS': 'coqui/CoquiTTS',
|
| 34 |
-
|
| 35 |
-
|
| 36 |
|
| 37 |
# E2 & F5 TTS
|
| 38 |
# F5 model
|
|
@@ -46,7 +46,7 @@ AVAILABLE_MODELS = {
|
|
| 46 |
# Parler Mini model
|
| 47 |
# 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
|
| 48 |
# 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
|
| 49 |
-
'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
|
| 50 |
|
| 51 |
# # Microsoft Edge TTS
|
| 52 |
# 'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # API disabled
|
|
@@ -55,7 +55,7 @@ AVAILABLE_MODELS = {
|
|
| 55 |
# 'Flux9665/MassivelyMultilingualTTS': 'Flux9665/MassivelyMultilingualTTS', # 5.1
|
| 56 |
|
| 57 |
# StyleTTS v2
|
| 58 |
-
'Pendrokar/style-tts-2': 'Pendrokar/style-tts-2', # more votes in OG arena; emotionless
|
| 59 |
|
| 60 |
# StyleTTS Kokoro v0.19
|
| 61 |
# 'hexgrad/kokoro': 'hexgrad/Kokoro-TTS',
|
|
@@ -79,6 +79,8 @@ AVAILABLE_MODELS = {
|
|
| 79 |
|
| 80 |
# llasa 3b TTS
|
| 81 |
'srinivasbilla/llasa-3b-tts': 'srinivasbilla/llasa-3b-tts',
|
|
|
|
|
|
|
| 82 |
|
| 83 |
# Mars5
|
| 84 |
# 'CAMB-AI/mars5_space': 'CAMB-AI/mars5_space', # slow inference; Unstable
|
|
@@ -288,7 +290,7 @@ HF_SPACES = {
|
|
| 288 |
|
| 289 |
# StyleTTS Kokoro v0.19
|
| 290 |
'hexgrad/kokoro': {
|
| 291 |
-
'name': '
|
| 292 |
'function': '/generate',
|
| 293 |
'text_param_index': 'text',
|
| 294 |
'return_audio_index': 0,
|
|
@@ -375,8 +377,17 @@ HF_SPACES = {
|
|
| 375 |
'text_param_index': 'target_text',
|
| 376 |
'return_audio_index': 0,
|
| 377 |
'is_zero_gpu_space': True,
|
| 378 |
-
'series': 'llasa
|
| 379 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 380 |
},
|
| 381 |
|
| 382 |
# Mars5
|
|
@@ -611,6 +622,9 @@ OVERRIDE_INPUTS = {
|
|
| 611 |
'srinivasbilla/llasa-3b-tts': {
|
| 612 |
'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
|
| 613 |
},
|
|
|
|
|
|
|
|
|
|
| 614 |
|
| 615 |
# MARS 5
|
| 616 |
'CAMB-AI/mars5_space': {
|
|
|
|
| 25 |
# gradio version that works with most spaces: 4.29
|
| 26 |
# 'coqui/xtts': 'coqui/xtts', # 4.29 4.32; extra_headers error appears for 5.13
|
| 27 |
# 'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
|
| 28 |
+
'myshell-ai/OpenVoice': 'myshell-ai/OpenVoice', # same devs as MeloTTS, which scores higher # 4.29
|
| 29 |
+
'myshell-ai/OpenVoiceV2': 'myshell-ai/OpenVoiceV2', # same devs as MeloTTS, which scores higher # 4.29
|
| 30 |
# 'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
|
| 31 |
'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
|
| 32 |
'Pendrokar/xVASynth-TTS/NoDeepMoji': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
|
| 33 |
# 'coqui/CoquiTTS': 'coqui/CoquiTTS',
|
| 34 |
+
'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
|
| 35 |
+
# 'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # Queue ERROR
|
| 36 |
|
| 37 |
# E2 & F5 TTS
|
| 38 |
# F5 model
|
|
|
|
| 46 |
# Parler Mini model
|
| 47 |
# 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
|
| 48 |
# 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
|
| 49 |
+
# 'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
|
| 50 |
|
| 51 |
# # Microsoft Edge TTS
|
| 52 |
# 'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # API disabled
|
|
|
|
| 55 |
# 'Flux9665/MassivelyMultilingualTTS': 'Flux9665/MassivelyMultilingualTTS', # 5.1
|
| 56 |
|
| 57 |
# StyleTTS v2
|
| 58 |
+
# 'Pendrokar/style-tts-2': 'Pendrokar/style-tts-2', # more votes in OG arena; emotionless
|
| 59 |
|
| 60 |
# StyleTTS Kokoro v0.19
|
| 61 |
# 'hexgrad/kokoro': 'hexgrad/Kokoro-TTS',
|
|
|
|
| 79 |
|
| 80 |
# llasa 3b TTS
|
| 81 |
'srinivasbilla/llasa-3b-tts': 'srinivasbilla/llasa-3b-tts',
|
| 82 |
+
# llasa 8b TTS
|
| 83 |
+
'srinivasbilla/llasa-8b-tts': 'srinivasbilla/llasa-8b-tts',
|
| 84 |
|
| 85 |
# Mars5
|
| 86 |
# 'CAMB-AI/mars5_space': 'CAMB-AI/mars5_space', # slow inference; Unstable
|
|
|
|
| 290 |
|
| 291 |
# StyleTTS Kokoro v0.19
|
| 292 |
'hexgrad/kokoro': {
|
| 293 |
+
'name': 'Kokoro v0.19',
|
| 294 |
'function': '/generate',
|
| 295 |
'text_param_index': 'text',
|
| 296 |
'return_audio_index': 0,
|
|
|
|
| 377 |
'text_param_index': 'target_text',
|
| 378 |
'return_audio_index': 0,
|
| 379 |
'is_zero_gpu_space': True,
|
| 380 |
+
'series': 'llasa',
|
| 381 |
+
},
|
| 382 |
+
|
| 383 |
+
# LLaSA 8B
|
| 384 |
+
'srinivasbilla/llasa-8b-tts': {
|
| 385 |
+
'name': 'LLaSA 8B',
|
| 386 |
+
'function': '/infer',
|
| 387 |
+
'text_param_index': 'target_text',
|
| 388 |
+
'return_audio_index': 0,
|
| 389 |
+
'is_zero_gpu_space': True,
|
| 390 |
+
'series': 'llasa',
|
| 391 |
},
|
| 392 |
|
| 393 |
# Mars5
|
|
|
|
| 622 |
'srinivasbilla/llasa-3b-tts': {
|
| 623 |
'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
|
| 624 |
},
|
| 625 |
+
'srinivasbilla/llasa-8b-tts': {
|
| 626 |
+
'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
|
| 627 |
+
},
|
| 628 |
|
| 629 |
# MARS 5
|
| 630 |
'CAMB-AI/mars5_space': {
|