kt003

Running

App Files Files Community

ktvoice committed on Apr 15

Commit

cd2ed09

verified ·

1 Parent(s): 17e4dc0

Upload app.py

Browse files

Files changed (1) hide show

app.py +37 -8

app.py CHANGED Viewed

@@ -29,7 +29,7 @@ except Exception as e:
 # Danh sách giọng
 VOICE_SAMPLES = {
     "Tuyên (nam miền Bắc)": {"audio": "./sample/Tuyên (nam miền Bắc).wav", "text": "./sample/Tuyên (nam miền Bắc).txt"},
-    "Thiện Tâm": {"audio": "./sample/thientam.mp3", "text": "./sample/thientam.txt"},
     "Ngọc Huyền": {"audio": "./sample/NgocHuyen.mp3", "text": "./sample/NgocHuyen.txt"},
     "Minh Quân": {"audio": "./sample/MinhQuan.mp3", "text": "./sample/MinhQuan.txt"},
     "Vĩnh (nam miền Nam)": {"audio": "./sample/Vĩnh (nam miền Nam).wav", "text": "./sample/Vĩnh (nam miền Nam).txt"},
@@ -58,12 +58,21 @@ def tts_process(text, voice_choice, custom_audio, custom_text, mode_tab, pause_l
             ref_path, ref_txt_val = custom_audio, custom_text
         else:
             sample = VOICE_SAMPLES.get(voice_choice)
             ref_path = sample["audio"]
             try:
                 with open(sample["text"], "r", encoding="utf-8") as f:
                     ref_txt_val = f.read()
-            except:
-                return None, "Lỗi đọc file text mẫu."
         # Xử lý ngắt nghỉ
         processed_text = text
@@ -74,9 +83,25 @@ def tts_process(text, voice_choice, custom_audio, custom_text, mode_tab, pause_l
         start_time = time.time()
-        # Chạy AI
-        ref_codes = tts.encode_reference(ref_path)
-        wav = tts.infer(processed_text[:500], ref_codes, ref_txt_val)
         # Tốc độ
         if speed_value != 1.0:
@@ -84,10 +109,14 @@ def tts_process(text, voice_choice, custom_audio, custom_text, mode_tab, pause_l
         with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp:
             sf.write(tmp.name, wav, 24000)
-            return tmp.name, f"Hoàn tất: {time.time() - start_time:.2f}s"
     except Exception as e:
-        return None, f"Lỗi: {str(e)}"
 # --- 2. GIAO DIỆN CƠ BẢN (Native Gradio) ---
 with gr.Blocks(title="AI Voice") as demo:

 # Danh sách giọng
 VOICE_SAMPLES = {
     "Tuyên (nam miền Bắc)": {"audio": "./sample/Tuyên (nam miền Bắc).wav", "text": "./sample/Tuyên (nam miền Bắc).txt"},
+    "Thiện Tâm": {"audio": "./sample/ThienTam.mp3", "text": "./sample/ThienTam.txt"},
     "Ngọc Huyền": {"audio": "./sample/NgocHuyen.mp3", "text": "./sample/NgocHuyen.txt"},
     "Minh Quân": {"audio": "./sample/MinhQuan.mp3", "text": "./sample/MinhQuan.txt"},
     "Vĩnh (nam miền Nam)": {"audio": "./sample/Vĩnh (nam miền Nam).wav", "text": "./sample/Vĩnh (nam miền Nam).txt"},
             ref_path, ref_txt_val = custom_audio, custom_text
         else:
             sample = VOICE_SAMPLES.get(voice_choice)
+            if not sample:
+                return None, f"Lỗi: Không tìm thấy giọng '{voice_choice}'"
             ref_path = sample["audio"]
             try:
                 with open(sample["text"], "r", encoding="utf-8") as f:
                     ref_txt_val = f.read()
+            except Exception as e_txt:
+                return None, f"Lỗi đọc file text mẫu: {e_txt}"
+        # [DEBUG] Kiểm tra file audio tồn tại
+        if not os.path.exists(ref_path):
+            return None, f"Lỗi: File audio không tồn tại: {ref_path}"
+        file_size = os.path.getsize(ref_path)
+        print(f"[DEBUG] Voice: {voice_choice} | File: {ref_path} | Size: {file_size} bytes | Text mẫu: {ref_txt_val[:50]}...")
         # Xử lý ngắt nghỉ
         processed_text = text
         start_time = time.time()
+        # [DEBUG] Bước 1: Encode reference
+        print(f"[DEBUG] Bắt đầu encode_reference: {ref_path}")
+        try:
+            ref_codes = tts.encode_reference(ref_path)
+            print(f"[DEBUG] encode_reference thành công! Type: {type(ref_codes)}")
+        except Exception as e_enc:
+            import traceback
+            traceback.print_exc()
+            return None, f"Lỗi encode_reference: {type(e_enc).__name__}: {str(e_enc)}"
+        # [DEBUG] Bước 2: Infer
+        print(f"[DEBUG] Bắt đầu infer. Text length: {len(processed_text)}")
+        try:
+            wav = tts.infer(processed_text[:500], ref_codes, ref_txt_val)
+            print(f"[DEBUG] infer thành công! Wav shape: {wav.shape if hasattr(wav, 'shape') else len(wav)}")
+        except Exception as e_inf:
+            import traceback
+            traceback.print_exc()
+            return None, f"Lỗi infer: {type(e_inf).__name__}: {str(e_inf)}"
         # Tốc độ
         if speed_value != 1.0:
         with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp:
             sf.write(tmp.name, wav, 24000)
+            elapsed = time.time() - start_time
+            print(f"[DEBUG] Hoàn tất TTS: {elapsed:.2f}s | Output: {tmp.name}")
+            return tmp.name, f"Hoàn tất: {elapsed:.2f}s"
     except Exception as e:
+        import traceback
+        traceback.print_exc()
+        return None, f"Lỗi: {type(e).__name__}: {str(e)}"
 # --- 2. GIAO DIỆN CƠ BẢN (Native Gradio) ---
 with gr.Blocks(title="AI Voice") as demo: