Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -33,13 +33,25 @@ def load_tts_model(model_key):
|
|
| 33 |
MODEL_CACHE[model_key] = tts
|
| 34 |
return tts
|
| 35 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 36 |
def extract_speakers(model_key):
|
| 37 |
info = VOICE_MODELS[model_key]
|
| 38 |
if info["multi_speaker"]:
|
| 39 |
-
|
| 40 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 41 |
return []
|
| 42 |
|
|
|
|
| 43 |
def docx_to_wav(doc_file, selected_voice, selected_speaker=None):
|
| 44 |
info = VOICE_MODELS[selected_voice]
|
| 45 |
tts = load_tts_model(selected_voice)
|
|
|
|
| 33 |
MODEL_CACHE[model_key] = tts
|
| 34 |
return tts
|
| 35 |
|
| 36 |
+
# def extract_speakers(model_key):
|
| 37 |
+
# info = VOICE_MODELS[model_key]
|
| 38 |
+
# if info["multi_speaker"]:
|
| 39 |
+
# tts = load_tts_model(model_key)
|
| 40 |
+
# return list(tts.speakers)
|
| 41 |
+
# return []
|
| 42 |
+
|
| 43 |
def extract_speakers(model_key):
    """Return the selectable speaker names for the voice model ``model_key``.

    Args:
        model_key: Key into ``VOICE_MODELS`` identifying the voice model.

    Returns:
        A list of speaker names. Empty when the model is not flagged as
        ``multi_speaker`` or when the loaded model exposes no speakers.

    Raises:
        KeyError: If ``model_key`` is not in ``VOICE_MODELS`` or its entry
            lacks the ``"multi_speaker"`` / ``"model_name"`` fields.
    """
    info = VOICE_MODELS[model_key]
    if not info["multi_speaker"]:
        return []

    if info["model_name"] == "tts_models/en/vctk/vits":
        # Common VCTK speakers: a fixed subset returned without loading
        # the model.
        return ["p225", "p226", "p227", "p228", "p229", "p230", "p231", "p232", "p233", "p234"]

    tts = load_tts_model(model_key)
    # ``speakers`` may be missing or None on the loaded model; always hand
    # callers a list so every return path has the same type.
    return list(getattr(tts, "speakers", None) or [])
|
| 53 |
|
| 54 |
+
|
| 55 |
def docx_to_wav(doc_file, selected_voice, selected_speaker=None):
|
| 56 |
info = VOICE_MODELS[selected_voice]
|
| 57 |
tts = load_tts_model(selected_voice)
|