Spaces:

nxhong
/

vixtts-api

Build error

App Files Community

nxhong committed on Oct 28, 2025

Commit

591dff6

verified ·

1 Parent(s): e232bc5

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -56

app.py CHANGED Viewed

@@ -239,81 +239,60 @@ def predict(
 with gr.Blocks(analytics_enabled=False) as demo:
-    with gr.Row():
-        with gr.Column():
-            gr.Markdown(
-                """
-                # Text to Speech Vietnamese ✨
-                - Special thank to thinhlpg
-                """
-            )
-        with gr.Column():
-            # placeholder to align the image
-            pass
     with gr.Row():
-        with gr.Column():
             input_text_gr = gr.Textbox(
-                label="Text Prompt (Văn bản cần đọc)",
-                info="Mỗi câu nên từ 10 từ trở lên.",
-                value="Xin chào, tôi là một mô hình chuyển đổi văn bản thành giọng nói tiếng Việt.",
             )
             language_gr = gr.Dropdown(
-                label="Language (Ngôn ngữ)",
-                choices=[
-                    "vi",
-                    "en",
-                    "es",
-                    "fr",
-                    "de",
-                    "it",
-                    "pt",
-                    "pl",
-                    "tr",
-                    "ru",
-                    "nl",
-                    "cs",
-                    "ar",
-                    "zh-cn",
-                    "ja",
-                    "ko",
-                    "hu",
-                    "hi",
-                ],
-                max_choices=1,
                 value="vi",
             )
             normalize_text = gr.Checkbox(
                 label="Chuẩn hóa văn bản tiếng Việt",
-                info="Normalize Vietnamese text",
-                value=True,
             )
             ref_gr = gr.Audio(
-                label="Reference Audio (Giọng mẫu)",
                 type="filepath",
-                value="model/samples/nu-luu-loat.wav",
-            )
-            tts_button = gr.Button(
-                "Đọc 🗣️🔥",
-                elem_id="send-btn",
-                visible=True,
-                variant="primary",
             )
-        with gr.Column():
-            audio_gr = gr.Audio(label="Synthesised Audio", autoplay=True)
-            out_text_gr = gr.Text(label="Metrics")
     tts_button.click(
         predict,
-        [
-            input_text_gr,
-            language_gr,
-            ref_gr,
-            normalize_text,
         ],
         outputs=[audio_gr, out_text_gr],
-        api_name="predict",
     )
 demo.queue()

 with gr.Blocks(analytics_enabled=False) as demo:
+    gr.Markdown("# 🇻🇳 Text to Speech Vietnamese (capleaf/viXTTS)")
+    gr.Markdown("Nhập văn bản tiếng Việt và chọn giọng mẫu để tạo âm thanh 🎙️")
     with gr.Row():
+        with gr.Column(scale=1):
             input_text_gr = gr.Textbox(
+                label="Nhập văn bản",
+                placeholder="Nhập câu tiếng Việt để chuyển thành giọng nói...",
+                lines=3,
+                interactive=True,
+                value="Xin chào, tôi là mô hình chuyển đổi văn bản thành giọng nói tiếng Việt."
             )
             language_gr = gr.Dropdown(
+                label="Ngôn ngữ",
+                choices=["vi", "en", "zh-cn", "ja", "ko"],
                 value="vi",
+                interactive=True
             )
             normalize_text = gr.Checkbox(
                 label="Chuẩn hóa văn bản tiếng Việt",
+                value=True
             )
             ref_gr = gr.Audio(
+                label="Giọng mẫu (Reference Audio)",
                 type="filepath",
+                value="model/samples/nu-luu-loat.wav"
             )
+            tts_button = gr.Button("▶️ Đọc văn bản", variant="primary")
+        with gr.Column(scale=1):
+            audio_gr = gr.Audio(label="Kết quả giọng nói", autoplay=True)
+            out_text_gr = gr.Textbox(label="Thông tin chi tiết", interactive=False)
+    # Nút sinh âm thanh
     tts_button.click(
         predict,
+        inputs=[input_text_gr, language_gr, ref_gr, normalize_text],
+        outputs=[audio_gr, out_text_gr]
+    )
+    # Khi chạy Space sẽ tự test 1 câu luôn
+    demo.load(
+        predict,
+        inputs=[
+            gr.Textbox(value="Xin chào, tôi là mô hình viXTTS đang chạy thử."),
+            gr.Dropdown(value="vi"),
+            gr.Audio(value="model/samples/nu-luu-loat.wav", type="filepath"),
+            gr.Checkbox(value=True),
         ],
         outputs=[audio_gr, out_text_gr],
     )
 demo.queue()