YingMusic-SingerGPU

Running on Zero

App Files Community

xjsc0 committed on Mar 23

Commit

335a61e

1 Parent(s): c0f6c5b

22

Browse files

Files changed (1) hide show

app.py +45 -62

app.py CHANGED Viewed

@@ -311,16 +311,17 @@ CUSTOM_CSS = """
 /* ---------- Disclaimer ---------- */
 #disclaimer {
-    border-left: 4px solid var(--primary);
-    background: var(--accent-glow);
-    border-radius: 8px;
-    padding: 12px 16px;
-    margin: 8px 0 16px;
-    font-size: 0.88rem;
-    color: var(--text-muted);
-    line-height: 1.6;
 }
-#disclaimer strong { color: var(--primary-light); }
 /* ---------- Section labels / 分区标题 ---------- */
 .section-title {
@@ -373,8 +374,8 @@ CUSTOM_CSS = """
 HEADER_HTML = """
 <div id="app-header" align="center">
   <h1>
-    🏆 LyricEditBench: The first benchmark for melody-preserving lyric modification evaluation<br>
-    🚀 <a href="https://github.com/ASLP-lab/YingMusic-Singer" target="_blank">YingMusic-Singer</a>
   </h1>
   <div class="lang-links">
@@ -429,11 +430,12 @@ HEADER_HTML = """
 DISCLAIMER_HTML = """
 <div id="disclaimer">
-  <strong>⚠️ Disclaimer / 免责声明：</strong>
   YingMusic-Singer enables the creation of singing voices with modified lyrics, supporting applications
   in artistic creation and entertainment. Potential risks include unauthorized voice cloning and copyright
   infringement. To ensure responsible deployment, users should obtain consent for voice usage, disclose
-  AI involvement, and verify musical originality.
 </div>
 """
@@ -451,7 +453,6 @@ def build_ui():
         # ---- Header / 头部 ----
         gr.HTML(HEADER_HTML)
-        gr.HTML(DISCLAIMER_HTML)
         gr.HTML("<hr style='border-color:#30363d; margin: 8px 0 18px;'>")
@@ -511,62 +512,43 @@ def build_ui():
             )
         # ================================================================
-        # ROW 3 – 高级参数 / Advanced Parameters (collapsible)
         # ================================================================
         with gr.Accordion("⚙️ 高级参数 / Advanced Parameters", open=False):
             with gr.Row():
                 nfe_step = gr.Slider(
-                    minimum=4,
-                    maximum=128,
-                    value=32,
-                    step=1,
                     label="采样步数 / NFE Steps",
                     info="更多步数 = 更高质量，但更慢 / More steps = higher quality, but slower",
                 )
                 cfg_strength = gr.Slider(
-                    minimum=0.0,
-                    maximum=10.0,
-                    value=3.0,
-                    step=0.1,
                     label="CFG 强度 / CFG Strength",
-                    info="Classifier‑Free Guidance 强度 / Classifier‑Free Guidance strength",
                 )
                 t_shift = gr.Slider(
-                    minimum=0.0,
-                    maximum=1.0,
-                    value=0.5,
-                    step=0.01,
                     label="采样时间偏移 / t‑shift",
                 )
             with gr.Row():
                 sil_len_to_end = gr.Slider(
-                    minimum=0.0,
-                    maximum=3.0,
-                    value=0.5,
-                    step=0.1,
                     label="末尾静音时长 (秒) / Silence Padding (s)",
-                    info="参考音频末尾追加的静音 / Silence appended after reference audio",
                 )
                 seed = gr.Number(
-                    value=-1,
-                    precision=0,
                     label="随机种子 / Random Seed",
                     info="-1 表示随机 / -1 means random",
                 )
-        # ================================================================
-        # ROW 4 – 合成按钮与输出 / Run & Output
-        # ================================================================
-        run_btn = gr.Button("🎤  开始合成 / Synthesize", elem_id="run-btn", size="lg")
-        output_audio = gr.Audio(
-            label="合成结果 / Generated Audio",
-            type="filepath",
-            elem_id="output-audio",
-        )
         # ================================================================
-        # ROW 5 – 示例 / Examples (two tabs)
         # ================================================================
         gr.HTML("<hr style='border-color:#30363d; margin: 20px 0 12px;'>")
         gr.Markdown("#### 🎵 预设示例 / Example Presets", elem_classes="section-title")
@@ -574,13 +556,6 @@ def build_ui():
             "<small style='color:#8b949e;'>点击任意行自动填入输入区域 / Click any row to auto-fill the inputs above</small>"
         )
-        # All inputs in order expected by synthesize()
-        _all_inputs = [
-            ref_audio, melody_audio, ref_text, target_text,
-            separate_vocals_flag, mix_accompaniment_flag,
-            sil_len_to_end, t_shift, nfe_step, cfg_strength, seed,
-        ]
         with gr.Tabs():
             with gr.Tab("🎼 Melody Control"):
                 gr.Examples(
@@ -598,10 +573,20 @@ def build_ui():
                 )
         # ================================================================
-        # Event wiring / 事件绑定
         # ================================================================
-        # 联动：未开启分离时，禁用伴奏混合
         separate_vocals_flag.change(
             fn=lambda sep: gr.update(interactive=sep, value=False if not sep else False),
             inputs=[separate_vocals_flag],
@@ -614,14 +599,12 @@ def build_ui():
             outputs=output_audio,
         )
-        # ---- 页脚 / Footer ----
         gr.Markdown(
-            """
-            <center style="color:#8b949e; font-size:0.85rem; margin-top: 16px;">
-            Use <code>|</code> to separate lyric phrases &nbsp;·&nbsp;
-            用 <code>|</code> 分隔歌词乐句
-            </center>
-            """,
         )
     return demo

 /* ---------- Disclaimer ---------- */
 #disclaimer {
+    border-top: 1px solid var(--border);
+    margin: 24px 0 4px;
+    padding: 14px 4px 4px;
+    font-size: 0.80rem;
+    color: #6e7681;
+    line-height: 1.65;
+}
+#disclaimer strong {
+    color: #8b949e;
+    font-weight: 600;
 }
 /* ---------- Section labels / 分区标题 ---------- */
 .section-title {
 HEADER_HTML = """
 <div id="app-header" align="center">
   <h1>
+    🎤 <a href="https://github.com/ASLP-lab/YingMusic-Singer" target="_blank">YingMusic-Singer</a>:
+    Controllable Singing Voice Synthesis with Flexible Lyric Manipulation and Annotation-free Melody Guidance
   </h1>
   <div class="lang-links">
 DISCLAIMER_HTML = """
 <div id="disclaimer">
+  <strong>Disclaimer / 免责声明</strong><br>
   YingMusic-Singer enables the creation of singing voices with modified lyrics, supporting applications
   in artistic creation and entertainment. Potential risks include unauthorized voice cloning and copyright
   infringement. To ensure responsible deployment, users should obtain consent for voice usage, disclose
+  AI involvement, and verify musical originality.<br>
+  <span style="opacity:0.75;">YingMusic-Singer 可用于修改歌词后的歌声合成，支持艺术创作与娱乐应用。潜在风险包括未经授权的声音克隆与版权侵权。为确保负责任地使用，用户应在使用他人声音前获得授权、公开 AI 参与情况，并确认音乐内容的原创性。</span>
 </div>
 """
         # ---- Header / 头部 ----
         gr.HTML(HEADER_HTML)
         gr.HTML("<hr style='border-color:#30363d; margin: 8px 0 18px;'>")
             )
         # ================================================================
+        # ROW 3 – 高级参数（隐藏默认值）/ Advanced Parameters (hidden defaults)
         # ================================================================
         with gr.Accordion("⚙️ 高级参数 / Advanced Parameters", open=False):
             with gr.Row():
                 nfe_step = gr.Slider(
+                    minimum=4, maximum=128, value=32, step=1,
                     label="采样步数 / NFE Steps",
                     info="更多步数 = 更高质量，但更慢 / More steps = higher quality, but slower",
                 )
                 cfg_strength = gr.Slider(
+                    minimum=0.0, maximum=10.0, value=3.0, step=0.1,
                     label="CFG 强度 / CFG Strength",
                 )
                 t_shift = gr.Slider(
+                    minimum=0.0, maximum=1.0, value=0.5, step=0.01,
                     label="采样时间偏移 / t‑shift",
                 )
             with gr.Row():
                 sil_len_to_end = gr.Slider(
+                    minimum=0.0, maximum=3.0, value=0.5, step=0.1,
                     label="末尾静音时长 (秒) / Silence Padding (s)",
                 )
                 seed = gr.Number(
+                    value=-1, precision=0,
                     label="随机种子 / Random Seed",
                     info="-1 表示随机 / -1 means random",
                 )
+        # All inputs in order expected by synthesize()
+        _all_inputs = [
+            ref_audio, melody_audio, ref_text, target_text,
+            separate_vocals_flag, mix_accompaniment_flag,
+            sil_len_to_end, t_shift, nfe_step, cfg_strength, seed,
+        ]
         # ================================================================
+        # ROW 4 – 预设示例 / Example Presets
         # ================================================================
         gr.HTML("<hr style='border-color:#30363d; margin: 20px 0 12px;'>")
         gr.Markdown("#### 🎵 预设示例 / Example Presets", elem_classes="section-title")
             "<small style='color:#8b949e;'>点击任意行自动填入输入区域 / Click any row to auto-fill the inputs above</small>"
         )
         with gr.Tabs():
             with gr.Tab("🎼 Melody Control"):
                 gr.Examples(
                 )
         # ================================================================
+        # ROW 5 – 合成按钮与输出 / Run & Output
         # ================================================================
+        gr.HTML("<hr style='border-color:#30363d; margin: 12px 0;'>")
+        run_btn = gr.Button("🎤  开始合成 / Synthesize", elem_id="run-btn", size="lg")
+        output_audio = gr.Audio(
+            label="合成结果 / Generated Audio",
+            type="filepath",
+            elem_id="output-audio",
+        )
+        # ================================================================
+        # Event wiring / 事件绑定
+        # ================================================================
         separate_vocals_flag.change(
             fn=lambda sep: gr.update(interactive=sep, value=False if not sep else False),
             inputs=[separate_vocals_flag],
             outputs=output_audio,
         )
+        # ---- 页脚：免责声明 + 使用提示 / Footer: disclaimer + tip ----
+        gr.HTML(DISCLAIMER_HTML)
         gr.Markdown(
+            "<center style='color:#6e7681; font-size:0.78rem; margin-top: 4px;'>"
+            "Use <code>|</code> to separate lyric phrases &nbsp;·&nbsp; 用 <code>|</code> 分隔歌词乐句"
+            "</center>",
         )
     return demo