Spaces:

smartwang
/

magicvoice

Running on Zero

smartwang committed on Feb 23

Commit

e0707a4

1 Parent(s): 85916ca

T

Files changed (1) hide show

app.py CHANGED Viewed

@@ -289,8 +289,8 @@ def extract_voice_clone_prompt(ref_audio,ref_text,use_xvector_only):
     uxo = use_xvector_only
     # 如果没有提供参考文本且未开启仅 x-vector 模式，尝试使用 Whisper 自动识别
-    if not uxo and (not r_text or (isinstance(r_text, str) and not r_text.strip())):
-        whisper_size = "large-v3"
         logger.info(f"未提供参考文本，开始使用 Whisper 自动识别。模型: {whisper_size}")
         try:
             whisper_model = load_whisper_model(whisper_size)
@@ -306,6 +306,7 @@ def extract_voice_clone_prompt(ref_audio,ref_text,use_xvector_only):
             result = whisper_model.transcribe(whisper_audio)
             r_text = result["text"].strip()
             logger.info(f"Whisper 识别成功：{r_text}")
         except Exception as e:
             logger.error(f"Whisper 识别失败: {str(e)}", exc_info=True)
             return None, f"错误：语音识别失败且未提供参考文本。{str(e)}"

     uxo = use_xvector_only
     # 如果没有提供参考文本且未开启仅 x-vector 模式，尝试使用 Whisper 自动识别
+    if not r_text or (isinstance(r_text, str) and not r_text.strip()):
+        whisper_size = "base"
         logger.info(f"未提供参考文本，开始使用 Whisper 自动识别。模型: {whisper_size}")
         try:
             whisper_model = load_whisper_model(whisper_size)
             result = whisper_model.transcribe(whisper_audio)
             r_text = result["text"].strip()
             logger.info(f"Whisper 识别成功：{r_text}")
+            uxo = False
         except Exception as e:
             logger.error(f"Whisper 识别失败: {str(e)}", exc_info=True)
             return None, f"错误：语音识别失败且未提供参考文本。{str(e)}"