Spaces:
Sleeping
Sleeping
| [app] | |
| project_version="0.7.5" | |
| # LLM API 超时配置(秒) | |
| llm_vision_timeout = 120 # 视觉模型基础超时时间 | |
| llm_text_timeout = 180 # 文本模型基础超时时间(解说文案生成等复杂任务需要更长时间) | |
| llm_max_retries = 3 # API 重试次数(LiteLLM 会自动处理重试) | |
| ########################################## | |
| # 🚀 LLM 配置 - 使用 LiteLLM 统一接口 | |
| ########################################## | |
| # LiteLLM 是统一的 LLM 接口库,支持 100+ providers | |
| # 优势: | |
| # ✅ 代码量减少 80%,统一的 API 接口 | |
| # ✅ 自动重试和智能错误处理 | |
| # ✅ 内置成本追踪和 token 统计 | |
| # ✅ 支持更多 providers:OpenAI, Anthropic, Gemini, Qwen, DeepSeek, | |
| # Cohere, Together AI, Replicate, Groq, Mistral 等 | |
| # | |
| # 文档:https://docs.litellm.ai/ | |
| # 支持的模型:https://docs.litellm.ai/docs/providers | |
| # ===== 视觉模型配置 ===== | |
| vision_llm_provider = "litellm" | |
| # 模型格式:provider/model_name | |
| # 常用视觉模型示例: | |
| # - Gemini: gemini/gemini-2.0-flash-lite (推荐,速度快成本低) | |
| # - Gemini: gemini/gemini-1.5-pro (高精度) | |
| # - OpenAI: gpt-4o, gpt-4o-mini | |
| # - Qwen: qwen/qwen2.5-vl-32b-instruct | |
| # - SiliconFlow: siliconflow/Qwen/Qwen2.5-VL-32B-Instruct | |
| vision_litellm_model_name = "gemini/gemini-2.0-flash-lite" | |
| vision_litellm_api_key = "" # 填入对应 provider 的 API key | |
| vision_litellm_base_url = "" # 可选:自定义 API base URL | |
| # ===== 文本模型配置 ===== | |
| text_llm_provider = "litellm" | |
| # 常用文本模型示例: | |
| # - DeepSeek: deepseek/deepseek-chat (推荐,性价比高) | |
| # - DeepSeek: deepseek/deepseek-reasoner (推理能力强) | |
| # - Gemini: gemini/gemini-2.0-flash (速度快) | |
| # - OpenAI: gpt-4o, gpt-4o-mini, gpt-4-turbo | |
| # - Qwen: qwen/qwen-plus, qwen/qwen-turbo | |
| # - SiliconFlow: siliconflow/deepseek-ai/DeepSeek-R1 | |
| # - Moonshot: moonshot/moonshot-v1-8k | |
| text_litellm_model_name = "deepseek/deepseek-chat" | |
| text_litellm_api_key = "" # 填入对应 provider 的 API key | |
| text_litellm_base_url = "" # 可选:自定义 API base URL | |
| # ===== API Keys 参考 ===== | |
| # 主流 LLM Providers API Key 获取地址: | |
| # | |
| # OpenAI: https://platform.openai.com/api-keys | |
| # Gemini: https://makersuite.google.com/app/apikey | |
| # DeepSeek: https://platform.deepseek.com/api_keys | |
| # Qwen (阿里): https://bailian.console.aliyun.com/?tab=model#/api-key | |
| # SiliconFlow: https://cloud.siliconflow.cn/account/ak (手机号注册) | |
| # Moonshot: https://platform.moonshot.cn/console/api-keys | |
| # Anthropic: https://console.anthropic.com/settings/keys | |
| # Cohere: https://dashboard.cohere.com/api-keys | |
| # Together AI: https://api.together.xyz/settings/api-keys | |
| ########################################## | |
| # 🔧 高级配置(可选) | |
| ########################################## | |
| # WebUI 界面是否显示配置项 | |
| hide_config = true | |
| ########################################## | |
| # 📚 传统配置示例(仅供参考,不推荐使用) | |
| ########################################## | |
| # 如果需要使用传统的单独 provider 实现,可以参考以下配置 | |
| # 但强烈推荐使用上面的 LiteLLM 配置 | |
| # | |
| # 传统视觉模型配置示例: | |
| # vision_llm_provider = "gemini" # 可选:gemini, qwenvl, siliconflow | |
| # vision_gemini_api_key = "" | |
| # vision_gemini_model_name = "gemini-2.0-flash-lite" | |
| # | |
| # 传统文本模型配置示例: | |
| # text_llm_provider = "openai" # 可选:openai, gemini, qwen, deepseek, siliconflow, moonshot | |
| # text_openai_api_key = "" | |
| # text_openai_model_name = "gpt-4o-mini" | |
| # text_openai_base_url = "https://api.openai.com/v1" | |
| ########################################## | |
| # TTS (文本转语音) 配置 | |
| ########################################## | |
| [azure] | |
| # Azure TTS 配置 | |
| # 获取密钥:https://portal.azure.com | |
| speech_key = "" | |
| speech_region = "" | |
| [tencent] | |
| # 腾讯云 TTS 配置 | |
| # 访问 https://console.cloud.tencent.com/cam/capi 获取密钥 | |
| secret_id = "" | |
| secret_key = "" | |
| region = "ap-beijing" # 地域配置 | |
| [soulvoice] | |
| # SoulVoice TTS API 配置 | |
| api_key = "" | |
| voice_uri = "speech:mcg3fdnx:clzkyf4vy00e5qr6hywum4u84:bzznlkuhcjzpbosexitr" | |
| api_url = "https://tts.scsmtech.cn/tts" | |
| model = "FunAudioLLM/CosyVoice2-0.5B" | |
| [tts_qwen] | |
| # 通义千问 Qwen3 TTS 配置 | |
| # 访问 https://bailian.console.aliyun.com/?tab=model#/api-key 获取你的 API 密钥 | |
| api_key = "" | |
| model_name = "qwen3-tts-flash" | |
| [indextts2] | |
| # IndexTTS2 语音克隆配置 | |
| # 这是一个开源的零样本语音克隆项目,需要自行部署 | |
| # 项目地址:https://github.com/index-tts/index-tts | |
| # 默认 API 地址(本地部署) | |
| api_url = "http://127.0.0.1:8081/tts" | |
| # 默认参考音频路径(可选) | |
| # reference_audio = "/path/to/reference_audio.wav" | |
| # 推理模式:普通推理 / 快速推理 | |
| infer_mode = "普通推理" | |
| # 高级参数 | |
| temperature = 1.0 | |
| top_p = 0.8 | |
| top_k = 30 | |
| do_sample = true | |
| num_beams = 3 | |
| repetition_penalty = 10.0 | |
| [ui] | |
| # TTS 引擎选择 | |
| # 可选:edge_tts, azure_speech, soulvoice, tencent_tts, tts_qwen | |
| tts_engine = "edge_tts" | |
| # Edge TTS 配置 | |
| edge_voice_name = "zh-CN-XiaoyiNeural-Female" | |
| edge_volume = 80 | |
| edge_rate = 1.0 | |
| edge_pitch = 0 | |
| # Azure Speech Services 配置 | |
| azure_voice_name = "zh-CN-XiaoyiNeural-Female" | |
| azure_volume = 80 | |
| azure_rate = 1.0 | |
| azure_pitch = 0 | |
| ########################################## | |
| # 代理和网络配置 | |
| ########################################## | |
| [proxy] | |
| # HTTP/HTTPS 代理配置(如需要) | |
| # clash 默认地址:http://127.0.0.1:7890 | |
| http = "" | |
| https = "" | |
| enabled = false | |
| ########################################## | |
| # 视频处理配置 | |
| ########################################## | |
| [frames] | |
| # 提取关键帧的间隔时间(秒) | |
| frame_interval_input = 3 | |
| # 大模型单次处理的关键帧数量 | |
| vision_batch_size = 10 | |