Spaces:

Ryanus
/

CoquiTTS

Sleeping

App Files Community

Ryanus committed on Jun 28, 2025

Commit

1cc29b6

verified ·

1 Parent(s): 3640a27

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -24

app.py CHANGED Viewed

@@ -5,7 +5,6 @@ import os
 import tempfile
 # --- 打印 Gradio 版本以供診斷 ---
-# 再次強調：請務必檢查日誌中這行打印出的 Gradio 版本，這對診斷問題根源至關重要。
 print(f"Gradio version at runtime: {gr.__version__}")
 # ---
@@ -92,11 +91,15 @@ SUPPORTED_LANGUAGES = [
     "te",      # Telugu
 ]
-def generate_speech(text, language, speaker_audio_path):
     """
-    根據輸入文字、語言和語音參考檔案生成語音。
-    XTTS-v2 支援語音克隆，需要提供 speaker_wav。
     """
     if model_load_error:
         return None, f"應用程式啟動錯誤：{model_load_error}"
@@ -108,16 +111,19 @@ def generate_speech(text, language, speaker_audio_path):
         return None, "請輸入一些文字！"
     if not language:
         return None, "請選擇一個語言！"
-    if not speaker_audio_path:
-        return None, "請上傳一個語音參考檔案 (WAV 格式) 來克隆語音！"
     output_file = None
     try:
         with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
             output_file = fp.name
-        print(f"正在為語言 '{language}' 生成語音，使用語音參考檔案: {speaker_audio_path}...")
-        tts.tts_to_file(text=text, language=language, speaker_wav=speaker_audio_path, file_path=output_file)
         print(f"語音已生成到：{output_file}")
         return output_file, "語音生成成功！"
@@ -133,27 +139,20 @@ iface = gr.Interface(
     inputs=[
         gr.Textbox(lines=5, label="輸入文字", placeholder="請在這裡輸入你想要轉換成語音的文字..."),
         gr.Dropdown(choices=SUPPORTED_LANGUAGES, label="選擇語言", value="en"),
-        gr.Audio(
-            type="filepath",
-            label="上傳語音參考檔案 (WAV)",
-            sources=["microphone", "upload"],
-            # 移除 waveform_options 參數
-            # waveform_options=gr.Audio.WaveformOptions(
-            #     skip_length=True,
-            #     show_controls=False,
-            #     show_labels=False,
-            #     create_waveform=True,
-            # ),
-            # 移除 info 參數
-            # info="請上傳一個清晰的語音檔案 (建議 3-10 秒，WAV 格式) 來克隆語音。",
-        ),
     ],
     outputs=[
         gr.Audio(label="生成的語音", type="filepath"),
         gr.Textbox(label="狀態")
     ],
-    title="Coqui TTS XTTS-v2 語音生成 (CPU)",
-    description="在 Hugging Face Space 上使用 Coqui TTS XTTS-v2 模型將文字轉換為語音。此演示使用 CPU 運行，請注意 XTTS-v2 在 CPU 上運行會非常慢。首次運行時會下載模型。",
     flagging_mode="never",
 )

 import tempfile
 # --- 打印 Gradio 版本以供診斷 ---
 print(f"Gradio version at runtime: {gr.__version__}")
 # ---
     "te",      # Telugu
 ]
+# 定義預設說話者音訊檔案的路徑
+# 請確保你已將 'speaker.wav' 檔案上傳到 Hugging Face Space 的根目錄
+DEFAULT_SPEAKER_WAV = "speaker.wav"
+def generate_speech(text, language): # 移除 speaker_audio_path 參數
     """
+    根據輸入文字和語言生成語音。
+    此版本使用 XTTS-v2 模型，並使用預設的 speaker.wav 檔案作為語音參考。
     """
     if model_load_error:
         return None, f"應用程式啟動錯誤：{model_load_error}"
         return None, "請輸入一些文字！"
     if not language:
         return None, "請選擇一個語言！"
+    # 檢查預設說話者音訊檔案是否存在
+    if not os.path.exists(DEFAULT_SPEAKER_WAV):
+        return None, f"錯誤：預設語音參考檔案 ({DEFAULT_SPEAKER_WAV}) 未找到。請確保該檔案已上傳到您的 Hugging Face Space 的根目錄。"
     output_file = None
     try:
         with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
             output_file = fp.name
+        print(f"正在為語言 '{language}' 生成語音，使用預設語音參考檔案: {DEFAULT_SPEAKER_WAV}...")
+        # 將 DEFAULT_SPEAKER_WAV 作為 speaker_wav 參數傳遞
+        tts.tts_to_file(text=text, language=language, speaker_wav=DEFAULT_SPEAKER_WAV, file_path=output_file)
         print(f"語音已生成到：{output_file}")
         return output_file, "語音生成成功！"
     inputs=[
         gr.Textbox(lines=5, label="輸入文字", placeholder="請在這裡輸入你想要轉換成語音的文字..."),
         gr.Dropdown(choices=SUPPORTED_LANGUAGES, label="選擇語言", value="en"),
+        # 移除語音參考檔案上傳組件
+        # gr.Audio(
+        #     type="filepath",
+        #     label="上傳語音參考檔案 (WAV)",
+        #     sources=["microphone", "upload"],
+        #     info="請上傳一個清晰的語音檔案 (建議 3-10 秒，WAV 格式) 來克隆語音。",
+        # ),
     ],
     outputs=[
         gr.Audio(label="生成的語音", type="filepath"),
         gr.Textbox(label="狀態")
     ],
+    title="Coqui TTS XTTS-v2 語音生成 (CPU - 使用預設語音)",
+    description="在 Hugging Face Space 上使用 Coqui TTS XTTS-v2 模型將文字轉換為語音。此演示使用 CPU 運行，請注意 XTTS-v2 在 CPU 上運行會非常慢。語音將使用預設的 speaker.wav 檔案進行克隆。",
     flagging_mode="never",
 )