GENIE / installer.py
Tom1986's picture
Add PyAudio alternative installation and improve genie-tts setup process
88ea7f6
"""
Genie TTS 依赖安装模块
负责处理Genie TTS包及其依赖的安装和管理
"""
import subprocess
import sys
import logging
logger = logging.getLogger(__name__)
# Source text of the stand-in ``pyaudio`` module that
# ``install_pyaudio_alternative`` writes when the real package cannot be
# installed.  It is self-contained: it sets up its own logger and exposes the
# sample-format constants at module level as well as on the ``PyAudio`` class.
MOCK_PYAUDIO_SOURCE = '''"""
Mock PyAudio module for environments without audio support
"""
import logging

logger = logging.getLogger(__name__)

# Sample-format constants, also reachable as ``pyaudio.paInt16`` etc.
paFloat32 = 1
paInt16 = 8


class PyAudioError(Exception):
    pass


class Stream:
    def __init__(self, *args, **kwargs):
        raise PyAudioError("音频流在此环境中不可用")

    def read(self, *args, **kwargs):
        raise PyAudioError("音频读取在此环境中不可用")

    def write(self, *args, **kwargs):
        raise PyAudioError("音频写入在此环境中不可用")

    def start_stream(self):
        pass

    def stop_stream(self):
        pass

    def close(self):
        pass


class PyAudio:
    paInt16 = 8
    paFloat32 = 1

    def __init__(self):
        logger.warning("使用Mock PyAudio - 音频功能不可用")

    def open(self, *args, **kwargs):
        return Stream()

    def get_device_count(self):
        return 0

    def get_device_info_by_index(self, index):
        return {"name": "Mock Device", "maxInputChannels": 0, "maxOutputChannels": 0}

    def terminate(self):
        pass


# 导出主要类和常量
__all__ = ['PyAudio', 'Stream', 'PyAudioError', 'paInt16', 'paFloat32']
'''


def install_pyaudio_alternative():
    """Install PyAudio via pip, or fall back to writing a mock ``pyaudio`` module.

    First runs ``pip install pyaudio`` with the current interpreter (120 s
    timeout).  If that fails for any reason, writes ``MOCK_PYAUDIO_SOURCE`` to
    ``pyaudio.py`` in the first directory returned by
    ``site.getsitepackages()`` so that ``import pyaudio`` can still succeed.

    Returns:
        bool: True if PyAudio was installed or the mock file was written,
        False if both attempts failed.
    """
    try:
        # Try a regular PyAudio installation first.
        subprocess.check_call(
            [sys.executable, "-m", "pip", "install", "pyaudio"],
            timeout=120,
        )
    except Exception as e:  # best effort: any failure triggers the fallback
        logger.warning("PyAudio 安装失败: %s", e)
    else:
        logger.info("✓ PyAudio 安装成功")
        return True

    # PyAudio could not be installed: create the mock module instead.
    try:
        import importlib
        import os
        import site

        # Locate site-packages and the path of the mock module.
        site_packages = site.getsitepackages()[0]
        pyaudio_mock_path = os.path.join(site_packages, "pyaudio.py")

        with open(pyaudio_mock_path, 'w', encoding='utf-8') as f:
            f.write(MOCK_PYAUDIO_SOURCE)

        # The file was created after interpreter start-up; drop the finders'
        # cached directory listings so the new module is noticed on import.
        importlib.invalidate_caches()

        logger.info("✓ 创建 PyAudio mock 模块成功")
        return True
    except Exception as mock_error:
        logger.error("创建 PyAudio mock 模块失败: %s", mock_error)
        return False
def _pip_install(*pip_args, timeout):
    """Run ``pip install <pip_args>`` with the current interpreter.

    Propagates whatever ``subprocess.check_call`` raises (non-zero exit
    status, timeout, failure to start the process).
    """
    subprocess.check_call(
        [sys.executable, "-m", "pip", "install", *pip_args],
        timeout=timeout,
    )


def install_genie_tts():
    """Make sure the ``genie_tts`` package is importable, installing it if needed.

    If ``import genie_tts`` already works nothing is installed.  Otherwise the
    critical dependencies are installed one by one (any failure aborts), the
    PyAudio dependency is handled via ``install_pyaudio_alternative``, two
    optional packages are attempted (failures only logged), and finally
    ``genie-tts`` itself is installed and imported as a check.

    Returns:
        tuple: ``(success, message)``.
        ``(True, None)`` when the package was already importable;
        ``(True, <warning text>)`` after a fresh successful install;
        ``(False, <error text>)`` when any required step failed.
    """
    try:
        import genie_tts  # noqa: F401 - imported only to test availability
    except ImportError:
        logger.info("正在尝试安装genie-tts...")
    else:
        logger.info("genie-tts已安装")
        return True, None

    try:
        # Make sure the critical dependencies are installed first.
        critical_deps = [
            "onnxruntime>=1.16.0",      # most critical: TTS cannot work without it
            "numpy>=1.21.0",            # base dependency
            "soundfile>=0.12.0",        # audio processing
            "huggingface-hub>=0.17.0",  # model download
            "scipy>=1.9.0",             # scientific computing
            "pyyaml>=6.0",              # config file parsing
            "rich>=12.0.0",             # terminal output formatting
        ]
        logger.info("正在安装关键依赖...")
        for dep in critical_deps:
            try:
                _pip_install(dep, "--upgrade", timeout=180)
            except Exception as e:
                # A missing critical dependency aborts the whole installation.
                logger.error("✗ 关键依赖安装失败: %s - %s", dep, e)
                return False, f"关键依赖 {dep} 安装失败: {str(e)}"
            logger.info("✓ 成功安装: %s", dep)

        # Handle the PyAudio dependency; a failure here is not fatal.
        logger.info("正在处理PyAudio依赖...")
        if not install_pyaudio_alternative():
            logger.warning("PyAudio处理失败,但将继续安装...")

        # Optional extras: Japanese text processing and audio resampling.
        for optional_dep in ("pyopenjtalk", "soxr"):
            try:
                _pip_install(optional_dep, timeout=120)
            except Exception as e:
                logger.warning("⚠ %s 安装失败: %s", optional_dep, e)
            else:
                logger.info("✓ 成功安装 %s", optional_dep)

        # Finally install the genie-tts package itself.
        logger.info("正在安装 genie-tts 主包...")
        _pip_install("genie-tts", "--upgrade", timeout=300)

        # The package was installed by a child process while this interpreter
        # was running; clear the import finders' caches before verifying.
        import importlib
        importlib.invalidate_caches()

        # Verify the installation.
        import genie_tts  # noqa: F401,F811
        logger.info("✅ genie-tts安装成功")
        return True, "安装成功,但某些音频功能可能不可用(PyAudio限制)"
    except subprocess.TimeoutExpired:
        # Only the main genie-tts install can reach this handler; timeouts of
        # the dependency installs are caught by their own handlers above.
        error_msg = "安装超时:Hugging Face Spaces 环境可能不支持某些依赖"
        logger.error(error_msg)
        return False, error_msg
    except Exception as e:
        error_msg = str(e)
        if "pyaudio" in error_msg.lower():
            # Still a PyAudio-related failure: give more detailed advice.
            error_msg = (
                "PyAudio依赖问题:即使创建了mock模块,genie-tts仍无法正常导入。"
                "建议解决方案:\n"
                "1. 在本地环境运行(安装了音频驱动)\n"
                "2. 使用替代的TTS库(如 pyttsx3 或 espeak)\n"
                "3. 联系Hugging Face支持团队关于音频依赖问题"
            )
            logger.error(error_msg)
        else:
            logger.error("安装genie-tts失败: %s", error_msg)
        return False, error_msg
def setup_genie_import():
    """Install (if needed) and import Genie TTS.

    Returns:
        tuple: ``(module, message)``.  On success ``module`` is the imported
        ``genie_tts`` module and ``message`` is whatever note
        ``install_genie_tts`` returned (possibly ``None``).  On failure
        ``module`` is ``None`` and ``message`` describes the error.
    """
    installed, note = install_genie_tts()
    if not installed:
        # Installation failed: pass the installer's error text through.
        return None, note

    try:
        import genie_tts as genie
    except ImportError as exc:
        failure = f"导入失败: {str(exc)}"
        # A PyAudio-related import failure gets extra fallback suggestions.
        if "pyaudio" in failure.lower():
            failure += (
                "\n\n建议的备用方案:\n"
                "1. 使用在线TTS服务(Google TTS, Azure Speech等)\n"
                "2. 在本地环境部署Genie TTS\n"
                "3. 使用其他兼容Hugging Face Spaces的TTS模型"
            )
        logger.error(failure)
        return None, failure

    logger.info("Genie TTS导入成功")
    # The second element carries the installer's warning, if any.
    return genie, note