Commit dab4429 · 1 Parent(s): 19ae156
(wip)debug
Browse files
tts.py CHANGED
|
@@ -7,6 +7,8 @@ import fal_client
|
|
| 7 |
import requests
|
| 8 |
import time
|
| 9 |
import io
|
|
|
|
|
|
|
| 10 |
from pyht import Client as PyhtClient
|
| 11 |
from pyht.client import TTSOptions
|
| 12 |
import base64
|
|
@@ -204,8 +206,10 @@ def predict_index_tts(text, reference_audio_path=None):
|
|
| 204 |
result = client.predict(
|
| 205 |
prompt=prompt,
|
| 206 |
text=text,
|
|
|
|
| 207 |
api_name="/gen_single"
|
| 208 |
)
|
|
|
|
| 209 |
return result
|
| 210 |
|
| 211 |
|
|
@@ -220,8 +224,10 @@ def predict_spark_tts(text, reference_audio_path=None):
|
|
| 220 |
prompt_text=text,
|
| 221 |
prompt_wav_upload=prompt_wav,
|
| 222 |
prompt_wav_record=prompt_wav,
|
|
|
|
| 223 |
api_name="/voice_clone"
|
| 224 |
)
|
|
|
|
| 225 |
return result
|
| 226 |
|
| 227 |
|
|
@@ -230,7 +236,7 @@ def predict_cosyvoice_tts(text, reference_audio_path=None):
|
|
| 230 |
client = Client("https://iic-cosyvoice2-0-5b.ms.show/")
|
| 231 |
if not reference_audio_path:
|
| 232 |
raise ValueError("cosyvoice-2.0 需要 reference_audio_path")
|
| 233 |
-
prompt_wav =
|
| 234 |
result = client.predict(
|
| 235 |
tts_text=text,
|
| 236 |
mode_checkbox_group="3s极速复刻",
|
|
@@ -242,6 +248,8 @@ def predict_cosyvoice_tts(text, reference_audio_path=None):
|
|
| 242 |
stream="false",
|
| 243 |
api_name="/generate_audio"
|
| 244 |
)
|
|
|
|
|
|
|
| 245 |
return result
|
| 246 |
|
| 247 |
|
|
|
|
| 7 |
import requests
|
| 8 |
import time
|
| 9 |
import io
|
| 10 |
+
|
| 11 |
+
from gradio_client import handle_file
|
| 12 |
from pyht import Client as PyhtClient
|
| 13 |
from pyht.client import TTSOptions
|
| 14 |
import base64
|
|
|
|
| 206 |
result = client.predict(
|
| 207 |
prompt=prompt,
|
| 208 |
text=text,
|
| 209 |
+
stream="false",
|
| 210 |
api_name="/gen_single"
|
| 211 |
)
|
| 212 |
+
print("index-tts result:", result)
|
| 213 |
return result
|
| 214 |
|
| 215 |
|
|
|
|
| 224 |
prompt_text=text,
|
| 225 |
prompt_wav_upload=prompt_wav,
|
| 226 |
prompt_wav_record=prompt_wav,
|
| 227 |
+
stream="false",
|
| 228 |
api_name="/voice_clone"
|
| 229 |
)
|
| 230 |
+
print("spark-tts result:", result)
|
| 231 |
return result
|
| 232 |
|
| 233 |
|
|
|
|
| 236 |
client = Client("https://iic-cosyvoice2-0-5b.ms.show/")
|
| 237 |
if not reference_audio_path:
|
| 238 |
raise ValueError("cosyvoice-2.0 需要 reference_audio_path")
|
| 239 |
+
prompt_wav = handle_file(reference_audio_path)
|
| 240 |
result = client.predict(
|
| 241 |
tts_text=text,
|
| 242 |
mode_checkbox_group="3s极速复刻",
|
|
|
|
| 248 |
stream="false",
|
| 249 |
api_name="/generate_audio"
|
| 250 |
)
|
| 251 |
+
print("cosyvoice-2.0 result:", result)
|
| 252 |
+
|
| 253 |
return result
|
| 254 |
|
| 255 |
|