VieNeuTTS

Runtime error

App Files Files Community

StorageDater committed on Nov 17, 2025

Commit

7e0ccae

verified ·

1 Parent(s): 287a341

Update app.py

Browse files

Files changed (1) hide show

app.py +58 -19

app.py CHANGED Viewed

@@ -1,16 +1,15 @@
 import spaces  # PHẢI import TRƯỚC mọi thứ!
 import os
 os.environ['SPACES_ZERO_GPU'] = '1'  # Set environment variable
 import gradio as gr
 import numpy as np
 import soundfile as sf
 import tempfile
 import torch
 # Import vieneutts SAU khi đã setup spaces
 from vieneutts import VieNeuTTS
 # Khởi tạo model trên CPU trước
 print("📦 Đang tải model...")
 tts = VieNeuTTS(
@@ -20,7 +19,6 @@ tts = VieNeuTTS(
     codec_device="cpu"
 )
 print("✅ Model đã tải xong!")
 # Danh sách giọng mẫu
 VOICE_SAMPLES = {
     "Nam miền Nam": {
@@ -32,6 +30,8 @@ VOICE_SAMPLES = {
         "text": "./sample/id_0002.txt"
     }
 }
 @spaces.GPU(duration=120)  # Giữ GPU trong 120 giây
 def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
@@ -41,11 +41,11 @@ def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
     try:
         # Kiểm tra text input
         if not text or text.strip() == "":
-            return None, "❌ Vui lòng nhập văn bản cần tổng hợp"
         # Giới hạn độ dài text
         if len(text) > 500:
-            return None, "❌ Văn bản quá dài! Vui lòng nhập tối đa 500 ký tự"
         # Xác định reference audio và text
         if custom_audio is not None and custom_text:
@@ -57,7 +57,7 @@ def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
             with open(ref_text_path, "r", encoding="utf-8") as f:
                 ref_text = f.read()
         else:
-            return None, "❌ Vui lòng chọn giọng hoặc tải lên audio tùy chỉnh"
         # Di chuyển model lên GPU
         device = "cuda" if torch.cuda.is_available() else "cpu"
@@ -86,8 +86,17 @@ def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
             sf.write(tmp_file.name, wav, 24000)
             output_path = tmp_file.name
         print("✅ Hoàn thành!")
-        return output_path, f"✅ Tổng hợp thành công trên {device.upper()}!"
     except Exception as e:
         print(f"❌ Lỗi: {str(e)}")
@@ -103,7 +112,24 @@ def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
         except:
             pass
-        return None, f"❌ Lỗi: {str(e)}"
 # Các ví dụ mẫu
 examples = [
@@ -111,7 +137,6 @@ examples = [
     ["Từ nhiều nguồn tài liệu lịch sử, có thể thấy nuôi con theo phong cách Do Thái không chỉ tốt cho đứa trẻ mà còn tốt cho cả các bậc cha mẹ.", "Nữ miền Nam"],
     ["Các bác sĩ đang nghiên cứu một loại vaccine mới chống lại virus cúm mùa. Thí nghiệm lâm sàng cho thấy phản ứng miễn dịch mạnh mẽ và ít tác dụng phụ, mở ra hy vọng phòng chống dịch bệnh hiệu quả hơn trong tương lai.", "Nam miền Nam"],
 ]
 # Custom CSS
 custom_css = """
 .gradio-container {
@@ -132,17 +157,14 @@ custom_css = """
     margin: 10px 0;
 }
 """
 # Tạo giao diện Gradio
 with gr.Blocks(title="VieNeu-TTS", css=custom_css, theme=gr.themes.Soft()) as demo:
     gr.Markdown("""
     # 🎙️ VieNeu-TTS: Vietnamese Text-to-Speech
     Hệ thống tổng hợp tiếng nói tiếng Việt được **finetune từ NeuTTS-Air** - một mô hình TTS tiên tiến sử dụng Large Language Model và Neural Codec.
-    Tác giả: [Phạm Nguyễn Ngọc Bảo](https://github.com/pnnbao97)
-    Model: [VieNeu-TTS](https://huggingface.co/pnnbao-ump/VieNeu-TTS)
-    Code: [GitHub](https://github.com/pnnbao97/VieNeu-TTS)
     Demo: [Hugging Face](https://huggingface.co/spaces/pnnbao-ump/VieNeu-TTS)
     """)
@@ -188,12 +210,22 @@ with gr.Blocks(title="VieNeu-TTS", css=custom_css, theme=gr.themes.Soft()) as de
             audio_output = gr.Audio(label="🔊 Kết quả")
             status_output = gr.Textbox(label="📊 Trạng thái", interactive=False)
     # Examples
     gr.Markdown("### 💡 Ví dụ nhanh")
     gr.Examples(
         examples=examples,
         inputs=[text_input, voice_select],
-        outputs=[audio_output, status_output],
         fn=synthesize_speech,
         cache_examples=False
     )
@@ -210,11 +242,18 @@ with gr.Blocks(title="VieNeu-TTS", css=custom_css, theme=gr.themes.Soft()) as de
         outputs=[char_count]
     )
-    # Event handler
     submit_btn.click(
         fn=synthesize_speech,
         inputs=[text_input, voice_select, custom_audio, custom_text],
-        outputs=[audio_output, status_output]
     )
     gr.Markdown("""

 import spaces  # PHẢI import TRƯỚC mọi thứ!
 import os
 os.environ['SPACES_ZERO_GPU'] = '1'  # Set environment variable
 import gradio as gr
 import numpy as np
 import soundfile as sf
 import tempfile
 import torch
+import time
+import pandas as pd
 # Import vieneutts SAU khi đã setup spaces
 from vieneutts import VieNeuTTS
 # Khởi tạo model trên CPU trước
 print("📦 Đang tải model...")
 tts = VieNeuTTS(
     codec_device="cpu"
 )
 print("✅ Model đã tải xong!")
 # Danh sách giọng mẫu
 VOICE_SAMPLES = {
     "Nam miền Nam": {
         "text": "./sample/id_0002.txt"
     }
 }
+# Lưu lịch sử (global list)
+history = []
 @spaces.GPU(duration=120)  # Giữ GPU trong 120 giây
 def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
     try:
         # Kiểm tra text input
         if not text or text.strip() == "":
+            return None, "❌ Vui lòng nhập văn bản cần tổng hợp", None
         # Giới hạn độ dài text
         if len(text) > 500:
+            return None, "❌ Văn bản quá dài! Vui lòng nhập tối đa 500 ký tự", None
         # Xác định reference audio và text
         if custom_audio is not None and custom_text:
             with open(ref_text_path, "r", encoding="utf-8") as f:
                 ref_text = f.read()
         else:
+            return None, "❌ Vui lòng chọn giọng hoặc tải lên audio tùy chỉnh", None
         # Di chuyển model lên GPU
         device = "cuda" if torch.cuda.is_available() else "cpu"
             sf.write(tmp_file.name, wav, 24000)
             output_path = tmp_file.name
+        # Lưu vào lịch sử
+        timestamp = time.strftime("%Y-%m-%d %H:%M:%S")
+        history.append({
+            "Thời gian": timestamp,
+            "Văn bản": text,
+            "Giọng": voice_choice if voice_choice else "Tùy chỉnh",
+            "Audio": output_path
+        })
         print("✅ Hoàn thành!")
+        return output_path, f"✅ Tổng hợp thành công trên {device.upper()}!", update_history()
     except Exception as e:
         print(f"❌ Lỗi: {str(e)}")
         except:
             pass
+        return None, f"❌ Lỗi: {str(e)}", None
+# Hàm cập nhật lịch sử cho Dataframe
def update_history():
    """Build the table shown in the synthesis-history Dataframe.

    Reads the module-level ``history`` list and keeps only the columns meant
    for display; the "Audio" entry (a file path) is deliberately left out of
    the table.

    Returns:
        pandas.DataFrame: one row per history entry with the columns
        "Thời gian", "Văn bản" and "Giọng". The same three columns are
        returned when ``history`` is empty, so the table layout is identical
        in the empty and the populated state.
    """
    display_columns = ["Thời gian", "Văn bản", "Giọng"]
    # Passing ``columns`` picks just these keys from every record and also
    # yields a correctly labelled empty frame when there are no records yet.
    return pd.DataFrame(history, columns=display_columns)
+# Hàm tải về lịch sử dưới dạng CSV
def download_history():
    """Export the synthesis history to a temporary CSV file.

    Reads the module-level ``history`` list and writes every field of every
    entry to a new ``.csv`` file, without an index column, encoded as
    ``utf-8-sig``.

    Returns:
        str | None: path of the written CSV file, or ``None`` when the
        history is empty. The file is created with ``delete=False`` and is
        not removed by this function.
    """
    if not history:
        return None
    # Only reserve a unique path here. The handle is closed before pandas
    # opens the file by name, because reopening a still-open
    # NamedTemporaryFile is not possible on every platform.
    with tempfile.NamedTemporaryFile(delete=False, suffix=".csv") as tmp_file:
        csv_path = tmp_file.name
    pd.DataFrame(history).to_csv(csv_path, index=False, encoding="utf-8-sig")
    return csv_path
 # Các ví dụ mẫu
 examples = [
     ["Từ nhiều nguồn tài liệu lịch sử, có thể thấy nuôi con theo phong cách Do Thái không chỉ tốt cho đứa trẻ mà còn tốt cho cả các bậc cha mẹ.", "Nữ miền Nam"],
     ["Các bác sĩ đang nghiên cứu một loại vaccine mới chống lại virus cúm mùa. Thí nghiệm lâm sàng cho thấy phản ứng miễn dịch mạnh mẽ và ít tác dụng phụ, mở ra hy vọng phòng chống dịch bệnh hiệu quả hơn trong tương lai.", "Nam miền Nam"],
 ]
 # Custom CSS
 custom_css = """
 .gradio-container {
     margin: 10px 0;
 }
 """
 # Tạo giao diện Gradio
 with gr.Blocks(title="VieNeu-TTS", css=custom_css, theme=gr.themes.Soft()) as demo:
     gr.Markdown("""
     # 🎙️ VieNeu-TTS: Vietnamese Text-to-Speech
     Hệ thống tổng hợp tiếng nói tiếng Việt được **finetune từ NeuTTS-Air** - một mô hình TTS tiên tiến sử dụng Large Language Model và Neural Codec.
+    Tác giả: [Phạm Nguyễn Ngọc Bảo](https://github.com/pnnbao97)
+    Model: [VieNeu-TTS](https://huggingface.co/pnnbao-ump/VieNeu-TTS)
+    Code: [GitHub](https://github.com/pnnbao97/VieNeu-TTS)
     Demo: [Hugging Face](https://huggingface.co/spaces/pnnbao-ump/VieNeu-TTS)
     """)
             audio_output = gr.Audio(label="🔊 Kết quả")
             status_output = gr.Textbox(label="📊 Trạng thái", interactive=False)
+    # Lịch sử
+    gr.Markdown("### 📜 Lịch sử tổng hợp")
+    history_df = gr.Dataframe(
+        value=update_history(),
+        headers=["Thời gian", "Văn bản", "Giọng"],
+        interactive=False
+    )
+    download_btn = gr.Button("📥 Tải về lịch sử (CSV)")
+    download_file = gr.File(label="Tệp tải về", interactive=False)
     # Examples
     gr.Markdown("### 💡 Ví dụ nhanh")
     gr.Examples(
         examples=examples,
         inputs=[text_input, voice_select],
+        outputs=[audio_output, status_output, history_df],
         fn=synthesize_speech,
         cache_examples=False
     )
         outputs=[char_count]
     )
+    # Event handler for synthesize
     submit_btn.click(
         fn=synthesize_speech,
         inputs=[text_input, voice_select, custom_audio, custom_text],
+        outputs=[audio_output, status_output, history_df]
+    )
+    # Event handler for download
+    download_btn.click(
+        fn=download_history,
+        inputs=[],
+        outputs=[download_file]
     )
     gr.Markdown("""