Spaces:

Respair
/

Voice_Design

Running

App Files Community

Respair committed 4 days ago

Commit

4cb44e3

verified ·

1 Parent(s): 1505e24

Update app.py

Browse files

Files changed (1) hide show

app.py +45 -38

app.py CHANGED Viewed

@@ -88,18 +88,46 @@ VOICE_EXAMPLES = {
     "落ち着いた男性 / 呆れ気味": "落ち着いた低めの声の男性が、相手の言動に少し呆れつつも感情を表に出さず、静かで平坦なトーンで淡々と話してるような声で読んでほしい。", # https://huggingface.co/spaces/Respair/Voice_Design/blob/main/samples/guy_cool.wav
     "Calm man / mildly exasperated (EN)": "Read this in the voice of a calm, low-pitched man who sounds mildly exasperated but keeps his emotions in check, speaking in a flat, even tone without much expression.", # Nothing
     "冷たい女性 / 憎しみ (1)": "低くて冷たい声の女性が、怒りを内に秘めながら憎しみのこもった口調で、淡々と早めに話してるような声で読んでほしい。", # https://huggingface.co/spaces/Respair/Voice_Design/blob/main/samples/woman_cold_frustrated_2.wav
-    "冷たい女性 / 憎しみ (2)": "低くて冷たい声の女性が、怒りを内に秘めながら憎しみのこもった口調で、淡々と早めに話してるような声で読んでほしい。", # same text different result / https://huggingface.co/spaces/Respair/Voice_Design/blob/main/samples/woman_cold_frustrated.wav
 }
 VOICE_PRESET_LIST = list(VOICE_EXAMPLES.items())
-PREGENERATED_SAMPLES = [
-    ["甘えた女の子 / ゆっくり", "samples/onnanoko_amai.wav"],
-    ["激怒する女性 / 感情爆発", "samples/angry.wav"],
-    ["落ち着いた男性 / 呆れ気味", "samples/guy_cool.wav"],
-    ["冷たい女性 / 憎しみ (1)", "samples/woman_cold_frustrated_2.wav"],
-    ["冷たい女性 / 憎しみ (2)", "samples/woman_cold_frustrated.wav"],
-]
 def run_generation_pipeline_client(
@@ -164,7 +192,6 @@ with gr.Blocks(theme="Respair/Shiki@10.1.0", css=css) as demo:
     </div>
     """
     )
     with gr.Tabs():
         with gr.TabItem("Speech Generation"):
@@ -254,11 +281,11 @@ with gr.Blocks(theme="Respair/Shiki@10.1.0", css=css) as demo:
                 concurrency_limit=4,
             )
-        with gr.TabItem("Example"):
             gr.HTML("""
             <div style="background-color: rgba(255, 255, 255, 0.025); padding: 20px; border-radius: 12px; backdrop-filter: blur(10px); box-shadow: 0 4px 6px rgba(0,0,0,0.5); margin-top: 8px;">
                 <p style="color: #1a1a1a; font-weight: 500; line-height: 1.6; font-size: 14px; text-align: center; margin: 0;">
-                クリックすると声の説明がロードされます。 / Click a preset to load it into the Instruction field.
                 </p>
             </div>
             """)
@@ -270,39 +297,19 @@ with gr.Blocks(theme="Respair/Shiki@10.1.0", css=css) as demo:
                         <h3 style="color: #000000; margin: 0; font-size: 16px;">Examples</h3>
                     </div>
                     """)
-                    voice_preset_holder = gr.Textbox(visible=False)
                     gr.Examples(
-                        examples=[[label] for label in VOICE_EXAMPLES.keys()],
-                        inputs=[voice_preset_holder],
-                        outputs=[voice_desc_input],
-                        fn=lambda label: VOICE_EXAMPLES.get(label, ""),
-                        label="Click to load a voice preset",
                         cache_examples=False,
                         run_on_click=True,
                         examples_per_page=10,
                     )
-            gr.HTML("""
-            <div style="background-color: rgba(255, 255, 255, 0.025); padding: 20px; border-radius: 12px; backdrop-filter: blur(10px); box-shadow: 0 4px 6px rgba(0,0,0,0.5); margin-top: 16px;">
-                <p style="color: #1a1a1a; font-weight: 500; line-height: 1.6; font-size: 14px; text-align: center; margin: 0;">
-                クリックするとプリジェネ音声がロードされます。 / Click a preset to load a pre-generated audio sample.
-                </p>
-            </div>
-            """)
-            sample_holder = gr.Textbox(visible=False)
-            pregenerated_audio = gr.Audio(label="Pre-generated Samples", interactive=False)
-            gr.Examples(
-                examples=[[name] for name, _ in PREGENERATED_SAMPLES],
-                inputs=[sample_holder],
-                outputs=[pregenerated_audio],
-                fn=lambda name: next((path for n, path in PREGENERATED_SAMPLES if n == name), None),
-                label="Click to load a pre-generated sample",
-                cache_examples=False,
-                run_on_click=True,
-                examples_per_page=10,
-            )
         with gr.TabItem("Info"):
             gr.HTML('<h1 style="text-align: center;">🌸 Takane - Voice Design 🎨 </h1>')

     "落ち着いた男性 / 呆れ気味": "落ち着いた低めの声の男性が、相手の言動に少し呆れつつも感情を表に出さず、静かで平坦なトーンで淡々と話してるような声で読んでほしい。", # https://huggingface.co/spaces/Respair/Voice_Design/blob/main/samples/guy_cool.wav
     "Calm man / mildly exasperated (EN)": "Read this in the voice of a calm, low-pitched man who sounds mildly exasperated but keeps his emotions in check, speaking in a flat, even tone without much expression.", # Nothing
     "冷たい女性 / 憎しみ (1)": "低くて冷たい声の女性が、怒りを内に秘めながら憎しみのこもった口調で、淡々と早めに話してるような声で読んでほしい。", # https://huggingface.co/spaces/Respair/Voice_Design/blob/main/samples/woman_cold_frustrated_2.wav
+    "冷たい女性 / 憎しみ (2)": "低くて冷たい声の女性が、怒りを内に秘めながら憎しみのこもった口調で、淡々と早めに話してるような声で読んでほしい。", # same text different result --> https://huggingface.co/spaces/Respair/Voice_Design/blob/main/samples/woman_cold_frustrated.wav
 }
 VOICE_PRESET_LIST = list(VOICE_EXAMPLES.items())
+# label -> local file path (ship these in your Space repo under samples/)
+# Keys are the same preset labels used as keys of VOICE_EXAMPLES:
+# load_pregenerated_to_main() looks a clicked label up in both mappings, so a
+# label must be spelled identically in each for text and audio to load together.
+# The "Calm man / mildly exasperated (EN)" preset has no entry here.
+PREGENERATED_AUDIO = {
+    "甘えた女の子 / ゆっくり": "samples/onnanoko_amai.wav",
+    "激怒する女性 / 感情爆発": "samples/angry.wav",
+    "落ち着いた男性 / 呆れ気味": "samples/guy_cool.wav",
+    "冷たい女性 / 憎しみ (1)": "samples/woman_cold_frustrated_2.wav",
+    # (1) and (2) share the same instruction text in VOICE_EXAMPLES but point
+    # at two different recordings.
+    "冷たい女性 / 憎しみ (2)": "samples/woman_cold_frustrated.wav",
+}
+def load_pregenerated_to_main(label):
+    """Load a preset's instruction text and pre-generated audio into the main tab.
+
+    Click handler for the Examples tab. The clicked label is looked up in
+    ``VOICE_EXAMPLES`` (instruction text) and ``PREGENERATED_AUDIO`` (path of
+    the WAV file shipped with the app).
+
+    Args:
+        label: Preset label selected in the examples table.
+
+    Returns:
+        A 3-tuple, in the order of the handler's outputs
+        (``voice_desc_input``, ``audio_output``, ``status_output``):
+
+        * a ``gr.update`` setting the instruction text (empty string when the
+          label has no entry in ``VOICE_EXAMPLES``);
+        * ``(sample_rate, samples)`` for the audio player, or ``None`` when
+          the label has no audio path or the file does not exist;
+        * a human-readable status string.
+    """
+    desc = VOICE_EXAMPLES.get(label, "")
+    path = PREGENERATED_AUDIO.get(label)
+
+    # Guard clause: unknown label or sample file missing on disk. The
+    # instruction text is still loaded; only the audio player is cleared.
+    if not path or not os.path.exists(path):
+        return (
+            gr.update(value=desc),
+            None,
+            f"Status: No pre-generated audio found for: {label}"
+        )
+
+    # NOTE(review): assumes `wavfile` is scipy.io.wavfile - confirm against the
+    # file's imports. Its read() already returns (n_samples,) for mono and
+    # (n_samples, n_channels) for multi-channel data, so the array is passed
+    # through untouched. The previous "transpose if shape[0] in (1, 2)"
+    # heuristic could only fire on a one- or two-sample multi-channel file,
+    # where it flipped a correctly oriented array to (n_channels, n_samples).
+    sr, data = wavfile.read(path)
+    return (
+        gr.update(value=desc),          # voice_desc_input
+        (sr, data),                     # audio_output (MAIN TAB)
+        f"Status: Loaded pre-generated sample: {label}"
+    )
 def run_generation_pipeline_client(
     </div>
     """
     )
     with gr.Tabs():
         with gr.TabItem("Speech Generation"):
                 concurrency_limit=4,
             )
+        with gr.TabItem("Examples"):
             gr.HTML("""
             <div style="background-color: rgba(255, 255, 255, 0.025); padding: 20px; border-radius: 12px; backdrop-filter: blur(10px); box-shadow: 0 4px 6px rgba(0,0,0,0.5); margin-top: 8px;">
                 <p style="color: #1a1a1a; font-weight: 500; line-height: 1.6; font-size: 14px; text-align: center; margin: 0;">
+                クリックするとメインタブの音声プレイヤーにプリジェネ音声がロードされます。 / Click a preset to load the pre-generated audio into the main tab player.
                 </p>
             </div>
             """)
                         <h3 style="color: #000000; margin: 0; font-size: 16px;">Examples</h3>
                     </div>
                     """)
+                    example_label_holder = gr.Textbox(visible=False)
                     gr.Examples(
+                        examples=[[label] for label in PREGENERATED_AUDIO.keys()],
+                        inputs=[example_label_holder],
+                        outputs=[voice_desc_input, audio_output, status_output],  # <-- MAIN TAB outputs
+                        fn=load_pregenerated_to_main,
+                        label="Click to load a pre-generated sample",
                         cache_examples=False,
                         run_on_click=True,
                         examples_per_page=10,
                     )
         with gr.TabItem("Info"):
             gr.HTML('<h1 style="text-align: center;">🌸 Takane - Voice Design 🎨 </h1>')