work_one

Sleeping

App Files Files Community

txh17 committed on Jun 16, 2025

Commit

370a67d

verified ·

1 Parent(s): 69781f1

Update app.py

Browse files

Files changed (1) hide show

app.py +33 -89

app.py CHANGED Viewed

@@ -1,7 +1,6 @@
 import gradio as gr
 import subprocess
 import os
-import pandas as pd # 仍保留，以备报告内容需要用到数据帧时使用
 # --- TTS 模型函数 (CPU 友好) ---
@@ -17,29 +16,25 @@ def synthesize_espeak(text: str, lang: str = "en-us") -> str | None:
         os.remove(output_file)
     try:
-        # 运行 espeak-ng 的命令。--stdout 输出到标准输出，我们捕获它。
-        # 添加了 timeout 以防止无限期挂起
         command = ["espeak-ng", f"-v{lang}", "--stdout", text]
         process = subprocess.run(command, capture_output=True, check=True, timeout=10)
-        # 检查 espeak-ng 是否实际产生了音频输出
         if not process.stdout:
             gr.Warning("eSpeak-ng 没有为给定文本生成任何音频输出。请尝试不同的文本。")
             print(f"eSpeak-ng 为文本 '{text}' 未产生输出。")
-            return None # 返回 None 以清空音频组件
-        # 将捕获到的标准输出（音频数据）写入 WAV 文件
         with open(output_file, "wb") as f:
             f.write(process.stdout)
         print(f"eSpeak-ng 合成成功: {output_file}")
-        return output_file # 返回生成的音频文件路径
     except FileNotFoundError:
         error_msg = "错误：未找到 espeak-ng。请确保它已安装在您 Space 的 Dockerfile 中，并且 Space 已重建。"
         print(error_msg)
-        gr.Error(error_msg) # 在 Gradio 中显示一个持久性错误消息
         return None
     except subprocess.CalledProcessError as e:
         error_msg = f"eSpeak-ng 合成过程中出现错误。命令以代码 {e.returncode} 退出。错误输出：{e.stderr.decode()}"
@@ -64,93 +59,42 @@ def synthesize_api_tts(text: str) -> str | None:
     对于此演示，它返回一个占位符音频文件。
     """
     print(f"正在模拟 API TTS：'{text}'")
-    # --- 重要：请用您真实的 API 调用替换此处 ---
-    # --------------------------------------------------------
-    # 占位符：返回一个通用音频用于演示
-    # 在实际场景中，您会从 API 获取一个真实的音频文件。
     return "https://www.soundhelix.com/examples/mp3/SoundHelix-Song-2.mp3" # 占位符 WAV/MP3
-# --- Gradio 界面 ---
-with gr.Blocks(css="""
-    /* 自定义 CSS from 原始模板或添加您自己的 */
-    .markdown-text {
-        font-family: 'IBM Plex Sans', sans-serif;
-        color: #333;
-        line-height: 1.6;
-    }
-    h1, h2, h3, h4, h5, h6 {
-        color: #0056b3; /* 漂亮的蓝色 */
-    }
-    table {
-        width: 100%;
-        border-collapse: collapse;
-        margin-top: 15px;
-    }
-    th, td {
-        border: 1px solid #ddd;
-        padding: 8px;
-        text-align: left;
-    }
-    th {
-        background-color: #f2f2f2;
-    }
-""") as demo:
-    gr.HTML("<h1 style='text-align: center; color: #0056b3;'>🎙️ 文本转音频模型对比实验</h1>")
-    gr.Markdown(
-        "欢迎来到我们的文本转音频模型对比实验空间。在这里，您可以对比不同模型在文本转音频任务上的表现。",
-        elem_classes="markdown-text"
-    )
-    with gr.Tabs(elem_classes="tab-buttons") as tabs:
-        # --- Arena Tab ---
-        with gr.TabItem("⚔️ Arena", id=0):
-            gr.Markdown(
-                "在'Arena'中，您可以输入文本，并观察不同文本转音频模型的输出。通过统一输入，直观比较模型效果。",
-                elem_classes="markdown-text"
-            )
-            text_input = gr.Textbox(
-                label="输入您想要合成的文本",
-                lines=3,
-                placeholder="例如：您好，这是一个文本转音频的测试。"
-            )
-            with gr.Row():
-                espeak_button = gr.Button("🎤 合成 (eSpeak-ng)")
-                api_tts_button = gr.Button("🎧 合成 (API TTS 示例)")
-            with gr.Row():
-                espeak_output = gr.Audio(label="eSpeak-ng 输出", type="filepath")
-                api_tts_output = gr.Audio(label="API TTS 示例输出", type="filepath")
-            espeak_button.click(
-                synthesize_espeak,
-                inputs=[text_input],
-                outputs=[espeak_output]
-            )
-            api_tts_button.click(
-                synthesize_api_tts,
-                inputs=[text_input],
-                outputs=[api_tts_output]
-            )
-        # --- Report Tab (暂时注释掉) ---
-        # with gr.TabItem("📝 Report", id=1):
-        #     gr.Markdown(
-        #         """
-        #         # 文本转音频模型对比实验报告
-        #         # ... 大量报告内容 ...
-        #         """,
-        #         elem_classes="markdown-text"
-        #     )
-        #
-        # 注意：为了让应用能够正常启动，我们暂时移除了 "Report" 选项卡。
-        # 如果应用能成功运行，说明问题出在报告内容上。
-        # 之后您可以尝试逐步添加报告内容，或简化其格式，以找出具体原因。
-        # 例如，可以先只放几段简单的文字，不包含表格或 mermaid 图。
 # --- 启动 Gradio Demo ---
-# 使用 queue() 是 Spaces 的良好实践
 demo.queue().launch()

 import gradio as gr
 import subprocess
 import os
 # --- TTS 模型函数 (CPU 友好) ---
         os.remove(output_file)
     try:
         command = ["espeak-ng", f"-v{lang}", "--stdout", text]
         process = subprocess.run(command, capture_output=True, check=True, timeout=10)
         if not process.stdout:
             gr.Warning("eSpeak-ng 没有为给定文本生成任何音频输出。请尝试不同的文本。")
             print(f"eSpeak-ng 为文本 '{text}' 未产生输出。")
+            return None
         with open(output_file, "wb") as f:
             f.write(process.stdout)
         print(f"eSpeak-ng 合成成功: {output_file}")
+        return output_file
     except FileNotFoundError:
         error_msg = "错误：未找到 espeak-ng。请确保它已安装在您 Space 的 Dockerfile 中，并且 Space 已重建。"
         print(error_msg)
+        gr.Error(error_msg)
         return None
     except subprocess.CalledProcessError as e:
         error_msg = f"eSpeak-ng 合成过程中出现错误。命令以代码 {e.returncode} 退出。错误输出：{e.stderr.decode()}"
     对于此演示，它返回一个占位符音频文件。
     """
     print(f"正在模拟 API TTS：'{text}'")
     return "https://www.soundhelix.com/examples/mp3/SoundHelix-Song-2.mp3" # 占位符 WAV/MP3
+---
+### **Gradio 界面 (最简化版本)**
+```python
+with gr.Blocks() as demo: # 移除 css 参数
+    gr.Markdown("# 🎙️ 文本转音频模型对比实验") # 使用 Markdown 标题替代 gr.HTML
+    gr.Markdown("这是一个最简化的版本，用于排查启动问题。")
+    text_input = gr.Textbox(
+        label="输入您想要合成的文本",
+        lines=3,
+        placeholder="例如：您好，这是��个文本转音频的测试。"
+    )
+    with gr.Row():
+        espeak_button = gr.Button("🎤 合成 (eSpeak-ng)")
+        api_tts_button = gr.Button("🎧 合成 (API TTS 示例)")
+    with gr.Row():
+        espeak_output = gr.Audio(label="eSpeak-ng 输出", type="filepath")
+        api_tts_output = gr.Audio(label="API TTS 示例输出", type="filepath")
+    espeak_button.click(
+        synthesize_espeak,
+        inputs=[text_input],
+        outputs=[espeak_output]
+    )
+    api_tts_button.click(
+        synthesize_api_tts,
+        inputs=[text_input],
+        outputs=[api_tts_output]
+    )
 # --- 启动 Gradio Demo ---
 demo.queue().launch()