Spaces:

smartwang
/

magicvoice

Running on Zero

smartwang committed on Feb 14

Commit

471c527

1 Parent(s): 265bb42

T

Files changed (1) hide show

app.py CHANGED Viewed

@@ -296,23 +296,25 @@ def extract_voice_clone_prompt(ref_audio,ref_text,use_xvector_only):
     #     return None, "错误：未启用 '仅使用 x-vector' 时需要参考文本。"
     model_size = "base"
     logger.info(f"开始 Whisper 语音识别任务。模型: {model_size}, 音频路径: {ref_audio}")
     try:
-        model = load_whisper_model(model_size)
         # 使用 transcribe 方法进行转录
         # whisper 会自动处理音频加载和重采样
-        result = model.transcribe(ref_audio)
         text = result["text"]
         logger.info(f"Whisper 识别完成。文本长度: {len(text)}")
-        ref_text = text.strip()
         logger.error(f"Whisper 识别成功：{ref_text}")
-        use_xvector_only = False
     except Exception as e:
         logger.error(f"Whisper 识别失败: {str(e)}", exc_info=True)
     voice_clone_prompt = tts.create_voice_clone_prompt(
         ref_audio=audio_tuple,
-        ref_text=ref_text.strip() if ref_text else None,
-        x_vector_only_mode=use_xvector_only
     )
     logger.info("参考音频特征提取完成。")

     #     return None, "错误：未启用 '仅使用 x-vector' 时需要参考文本。"
     model_size = "base"
     logger.info(f"开始 Whisper 语音识别任务。模型: {model_size}, 音频路径: {ref_audio}")
+    r_text = ref_text
+    uxo = use_xvector_only
     try:
+        whisper_model = load_whisper_model(model_size)
         # 使用 transcribe 方法进行转录
         # whisper 会自动处理音频加载和重采样
+        result = whisper_model.transcribe(ref_audio)
         text = result["text"]
         logger.info(f"Whisper 识别完成。文本长度: {len(text)}")
+        r_text = text.strip()
         logger.error(f"Whisper 识别成功：{ref_text}")
+        uxo = False
     except Exception as e:
         logger.error(f"Whisper 识别失败: {str(e)}", exc_info=True)
     voice_clone_prompt = tts.create_voice_clone_prompt(
         ref_audio=audio_tuple,
+        ref_text=r_text.strip() if r_text else None,
+        x_vector_only_mode=uxo
     )
     logger.info("参考音频特征提取完成。")