VieNeuTTS

Runtime error

App Files Community

pnnbao-ump committed on Oct 29

Commit

0133704

1 Parent(s): 4a204a9

Add @spaces.GPU decorator for GPU Zero

Browse files

Files changed (1) hide show

app.py +16 -32

app.py CHANGED Viewed

@@ -1,11 +1,15 @@
 import gradio as gr
 import numpy as np
 import soundfile as sf
-from vieneutts import VieNeuTTS
 import tempfile
-import os
 import torch
-import spaces  # Import cho GPU Zero
 # Khởi tạo model trên CPU trước
 print("📦 Đang tải model...")
@@ -29,7 +33,7 @@ VOICE_SAMPLES = {
     }
 }
-@spaces.GPU(duration=120)  # Giữ GPU trong 120 giây cho mỗi request
 def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
     """
     Tổng hợp giọng nói từ văn bản - Chạy trên GPU
@@ -39,7 +43,7 @@ def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
         if not text or text.strip() == "":
             return None, "❌ Vui lòng nhập văn bản cần tổng hợp"
-        # Giới hạn độ dài text để tránh timeout
         if len(text) > 500:
             return None, "❌ Văn bản quá dài! Vui lòng nhập tối đa 500 ký tự"
@@ -55,7 +59,7 @@ def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
         else:
             return None, "❌ Vui lòng chọn giọng hoặc tải lên audio tùy chỉnh"
-        # Di chuyển model lên GPU (spaces.GPU tự động làm điều này)
         device = "cuda" if torch.cuda.is_available() else "cpu"
         if device == "cuda":
             print("🚀 Đang chuyển model lên GPU...")
@@ -70,7 +74,7 @@ def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
         print(f"🎵 Đang tổng hợp giọng nói trên {device.upper()}...")
         wav = tts.infer(text, ref_codes, ref_text)
-        # Di chuyển model về CPU để giải phóng GPU
         if device == "cuda":
             print("💾 Đang giải phóng GPU...")
             tts.backbone = tts.backbone.to("cpu")
@@ -90,7 +94,7 @@ def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
         import traceback
         traceback.print_exc()
-        # Đảm bảo giải phóng GPU khi có lỗi
         try:
             if torch.cuda.is_available():
                 tts.backbone = tts.backbone.to("cpu")
@@ -101,7 +105,7 @@ def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
         return None, f"❌ Lỗi: {str(e)}"
-# Các ví dụ mẫu - Ngắn gọn
 examples = [
     ["Xin chào, tôi là trợ lý giọng nói tiếng Việt.", "Nam miền Nam"],
     ["Chúc bạn một ngày tốt lành!", "Nữ miền Nam"],
@@ -137,15 +141,6 @@ with gr.Blocks(title="VieNeu-TTS", css=custom_css, theme=gr.themes.Soft()) as de
     Hệ thống tổng hợp tiếng nói tiếng Việt sử dụng Large Language Model và Neural Codec.
     """)
-    # Thông báo GPU Zero
-    gr.Markdown("""
-    <div id="info">
-    ⚡ <strong>GPU Zero Mode:</strong> Space này sử dụng GPU miễn phí với tốc độ nhanh (3-5 giây/câu).
-    <br>
-    ⏳ Lần đầu sử dụng có thể phải chờ 5-30 phút trong hàng đợi GPU. Sau đó sẽ rất nhanh!
-    </div>
-    """)
     with gr.Row():
         with gr.Column():
             # Input text
@@ -194,7 +189,7 @@ with gr.Blocks(title="VieNeu-TTS", css=custom_css, theme=gr.themes.Soft()) as de
         inputs=[text_input, voice_select],
         outputs=[audio_output, status_output],
         fn=synthesize_speech,
-        cache_examples=False  # Không cache để build nhanh hơn
     )
     # Update character count
@@ -219,18 +214,7 @@ with gr.Blocks(title="VieNeu-TTS", css=custom_css, theme=gr.themes.Soft()) as de
     gr.Markdown("""
     ---
     ### 📌 Thông tin
-    **Ưu điểm GPU Zero:**
-    - ⚡ Tốc độ: 3-5 giây/câu (nhanh hơn CPU 10-20 lần)
-    - 💰 Hoàn toàn miễn phí
-    - 🎯 Chất lượng âm thanh cao
-    **Lưu ý:**
-    - ⏳ Lần đầu sử dụng phải chờ GPU khả dụng (5-30 phút)
-    - 🔄 Sau đó các request tiếp theo sẽ rất nhanh
-    - ⏱️ GPU timeout sau 120 giây nếu không dùng
-    - 📏 Khuyến nghị: Văn bản dưới 500 ký tự
     **Liên kết:**
     - [GitHub Repository](https://github.com/pnnbao97/VieNeu-TTS)
     - [Model Card](https://huggingface.co/pnnbao-ump/VieNeu-TTS)
@@ -240,7 +224,7 @@ with gr.Blocks(title="VieNeu-TTS", css=custom_css, theme=gr.themes.Soft()) as de
 # Launch
 if __name__ == "__main__":
-    demo.queue(max_size=20)  # Queue size lớn hơn cho GPU Zero
     demo.launch(
         server_name="0.0.0.0",
         server_port=7860,

+import spaces  # PHẢI import TRƯỚC mọi thứ!
+import os
+os.environ['SPACES_ZERO_GPU'] = '1'  # Set environment variable
 import gradio as gr
 import numpy as np
 import soundfile as sf
 import tempfile
 import torch
+# Import vieneutts SAU khi đã setup spaces
+from vieneutts import VieNeuTTS
 # Khởi tạo model trên CPU trước
 print("📦 Đang tải model...")
     }
 }
+@spaces.GPU(duration=120)  # Giữ GPU trong 120 giây
 def synthesize_speech(text, voice_choice, custom_audio=None, custom_text=None):
     """
     Tổng hợp giọng nói từ văn bản - Chạy trên GPU
         if not text or text.strip() == "":
             return None, "❌ Vui lòng nhập văn bản cần tổng hợp"
+        # Giới hạn độ dài text
         if len(text) > 500:
             return None, "❌ Văn bản quá dài! Vui lòng nhập tối đa 500 ký tự"
         else:
             return None, "❌ Vui lòng chọn giọng hoặc tải lên audio tùy chỉnh"
+        # Di chuyển model lên GPU
         device = "cuda" if torch.cuda.is_available() else "cpu"
         if device == "cuda":
             print("🚀 Đang chuyển model lên GPU...")
         print(f"🎵 Đang tổng hợp giọng nói trên {device.upper()}...")
         wav = tts.infer(text, ref_codes, ref_text)
+        # Di chuyển model về CPU
         if device == "cuda":
             print("💾 Đang giải phóng GPU...")
             tts.backbone = tts.backbone.to("cpu")
         import traceback
         traceback.print_exc()
+        # Giải phóng GPU khi có lỗi
         try:
             if torch.cuda.is_available():
                 tts.backbone = tts.backbone.to("cpu")
         return None, f"❌ Lỗi: {str(e)}"
+# Các ví dụ mẫu
 examples = [
     ["Xin chào, tôi là trợ lý giọng nói tiếng Việt.", "Nam miền Nam"],
     ["Chúc bạn một ngày tốt lành!", "Nữ miền Nam"],
     Hệ thống tổng hợp tiếng nói tiếng Việt sử dụng Large Language Model và Neural Codec.
     """)
     with gr.Row():
         with gr.Column():
             # Input text
         inputs=[text_input, voice_select],
         outputs=[audio_output, status_output],
         fn=synthesize_speech,
+        cache_examples=False
     )
     # Update character count
     gr.Markdown("""
     ---
     ### 📌 Thông tin
     **Liên kết:**
     - [GitHub Repository](https://github.com/pnnbao97/VieNeu-TTS)
     - [Model Card](https://huggingface.co/pnnbao-ump/VieNeu-TTS)
 # Launch
 if __name__ == "__main__":
+    demo.queue(max_size=20)
     demo.launch(
         server_name="0.0.0.0",
         server_port=7860,