Spaces:
Sleeping
Sleeping
Michael Hu
committed on
Commit
·
e3843d2
1
Parent(s):
22bd0b9
update to set a voice
Browse files
- utils/tts.py +3 -8
utils/tts.py
CHANGED
|
@@ -107,13 +107,6 @@ class TTSEngine:
|
|
| 107 |
self.client = Client("Remsky/Kokoro-TTS-Zero")
|
| 108 |
self.engine_type = "kokoro_space"
|
| 109 |
logger.info("TTS engine successfully initialized with Kokoro FastAPI server")
|
| 110 |
-
result = client.predict(
|
| 111 |
-
text="The studio was filled with the rich odour of roses, and when the light",
|
| 112 |
-
voice_names=None,
|
| 113 |
-
speed=1,
|
| 114 |
-
api_name="/generate_speech_from_ui"
|
| 115 |
-
)
|
| 116 |
-
logger.info(result)
|
| 117 |
except Exception as kokoro_err:
|
| 118 |
logger.error(f"Failed to initialize Kokoro pipeline: {str(kokoro_err)}")
|
| 119 |
logger.error(f"Error type: {type(kokoro_err).__name__}")
|
|
@@ -170,12 +163,14 @@ class TTSEngine:
|
|
| 170 |
elif self.engine_type == "kokoro_space":
|
| 171 |
# Use Kokoro FastAPI server for TTS generation
|
| 172 |
logger.info("Generating speech using Kokoro FastAPI server")
|
|
|
|
| 173 |
result = self.client.predict(
|
| 174 |
text=text,
|
| 175 |
-
voice_names=
|
| 176 |
speed=speed,
|
| 177 |
api_name="/generate_speech_from_ui"
|
| 178 |
)
|
|
|
|
| 179 |
elif self.engine_type == "dia":
|
| 180 |
# Use Dia for TTS generation
|
| 181 |
try:
|
|
|
|
| 107 |
self.client = Client("Remsky/Kokoro-TTS-Zero")
|
| 108 |
self.engine_type = "kokoro_space"
|
| 109 |
logger.info("TTS engine successfully initialized with Kokoro FastAPI server")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 110 |
except Exception as kokoro_err:
|
| 111 |
logger.error(f"Failed to initialize Kokoro pipeline: {str(kokoro_err)}")
|
| 112 |
logger.error(f"Error type: {type(kokoro_err).__name__}")
|
|
|
|
| 163 |
elif self.engine_type == "kokoro_space":
|
| 164 |
# Use Kokoro FastAPI server for TTS generation
|
| 165 |
logger.info("Generating speech using Kokoro FastAPI server")
|
| 166 |
+
logger.info(f"text to generate speech on is: {text}")
|
| 167 |
result = self.client.predict(
|
| 168 |
text=text,
|
| 169 |
+
voice_names=voice,
|
| 170 |
speed=speed,
|
| 171 |
api_name="/generate_speech_from_ui"
|
| 172 |
)
|
| 173 |
+
logger.info(f"Received audio from Kokoro FastAPI server: {result}")
|
| 174 |
elif self.engine_type == "dia":
|
| 175 |
# Use Dia for TTS generation
|
| 176 |
try:
|