Spaces:

TNOT
/

JinrikiHelper

Running

App Files Files Community

TNOT committed on Feb 1

Commit

86371bb

1 Parent(s): d824a9d

fix: 导出页面 UI 修复 2

Browse files

Files changed (6) hide show

docs/流程文档_AI用.md +5 -3
src/export_plugins/simple_export.py +98 -10
src/export_plugins/utau_oto_export.py +14 -0
src/gui_cloud.py +257 -135
tools/README.md +1 -1
tools/mfa_engine.7z +3 -0

docs/流程文档_AI用.md CHANGED Viewed

@@ -391,9 +391,11 @@ MFA 环境:
 - 音频未上传完成时禁用「开始制作」按钮，防止误操作
 - 导出页面提供「使用刚制作的音源」按钮，避免重复上传
 - Whisper 模型选项标注速度参考：small 约 4 秒/句，medium 约 12 秒/句（慢 2-3 倍但更准确）
-- **导出插件动态选项**: 切换导出插件时自动显示/隐藏对应的配置选项
-  - 简单单字导出: 基本设置（最大样本数、命名规则）
-  - UTAU oto.ini 导出: 额外显示质量评估维度、别名风格、Overlap 比例、文件编码等专用选项
 ### 平台差异

 - 音频未上传完成时禁用「开始制作」按钮，防止误操作
 - 导出页面提供「使用刚制作的音源」按钮，避免重复上传
 - Whisper 模型选项标注速度参考：small 约 4 秒/句，medium 约 12 秒/句（慢 2-3 倍但更准确）
+- **导出插件动态选项系统**:
+  - 插件选项完全动态化，根据 `ExportPlugin.get_options()` 自动生成 UI 组件
+  - 切换插件时自动显示/隐藏对应的配置选项组
+  - 支持的选项类型: TEXT(文本)、NUMBER(数字)、SWITCH(开关)、COMBO(下拉)、MULTI_SELECT(多选)、LABEL(说明文字)
+  - 新增插件无需修改 GUI 代码，只需在插件中定义 `get_options()` 即可自动生成界面
 ### 平台差异

src/export_plugins/simple_export.py CHANGED Viewed

@@ -41,6 +41,13 @@ class SimpleExportPlugin(ExportPlugin):
                 max_value=1000,
                 description="按时长排序，保留最长的N个"
             ),
             PluginOption(
                 key="naming_rule",
                 label="命名规则",
@@ -83,6 +90,57 @@ class SimpleExportPlugin(ExportPlugin):
         name = rule.replace("%p%", pinyin).replace("%n%", str(index))
         return name
     def export(
         self,
         source_name: str,
@@ -105,13 +163,19 @@ class SimpleExportPlugin(ExportPlugin):
             temp_base = os.path.join(bank_dir, ".temp_segments")
             segments_dir = os.path.join(temp_base, source_name)
             # 步骤1: 提取分词片段
             self._log("【提取分词片段】")
             success, msg, pinyin_counts = self._extract_segments(
                 paths["slices_dir"],
                 paths["textgrid_dir"],
                 segments_dir,
-                language
             )
             if not success:
                 return False, msg
@@ -146,13 +210,17 @@ class SimpleExportPlugin(ExportPlugin):
         slices_dir: str,
         textgrid_dir: str,
         segments_dir: str,
-        language: str
     ) -> Tuple[bool, str, Dict[str, int]]:
         """
         提取分词片段
         中文：使用words层按字切分，用char_to_pinyin获取拼音名称
         日语：使用phones层按音素切分，合并辅音+元音为音节
         """
         try:
             import textgrid
@@ -169,11 +237,11 @@ class SimpleExportPlugin(ExportPlugin):
             # 根据语言选择提取方法
             if language in ("japanese", "ja", "jp"):
                 return self._extract_japanese_segments(
-                    tg_files, slices_dir, segments_dir
                 )
             else:
                 return self._extract_chinese_segments(
-                    tg_files, slices_dir, segments_dir, language
                 )
         except Exception as e:
@@ -185,12 +253,16 @@ class SimpleExportPlugin(ExportPlugin):
         tg_files: List[str],
         slices_dir: str,
         segments_dir: str,
-        language: str
     ) -> Tuple[bool, str, Dict[str, int]]:
         """
         中文音频提取
         使用words层的时间边界，按字符切分，用char_to_pinyin获取拼音
         """
         import textgrid
         import soundfile as sf
@@ -208,6 +280,7 @@ class SimpleExportPlugin(ExportPlugin):
             tg = textgrid.TextGrid.fromFile(tg_path)
             audio, sr = sf.read(wav_path, dtype='float32')
             # 使用words层（第一层）
             words_tier = tg[0]
@@ -240,6 +313,11 @@ class SimpleExportPlugin(ExportPlugin):
                     char_start = start_time + i * char_duration
                     char_end = char_start + char_duration
                     pinyin_dir = os.path.join(segments_dir, pinyin)
                     os.makedirs(pinyin_dir, exist_ok=True)
@@ -247,8 +325,8 @@ class SimpleExportPlugin(ExportPlugin):
                     index = current_count + 1
                     pinyin_counts[pinyin] = index
-                    start_sample = int(round(char_start * sr))
-                    end_sample = int(round(char_end * sr))
                     segment = audio[start_sample:end_sample]
                     if len(segment) == 0:
@@ -267,12 +345,16 @@ class SimpleExportPlugin(ExportPlugin):
         self,
         tg_files: List[str],
         slices_dir: str,
-        segments_dir: str
     ) -> Tuple[bool, str, Dict[str, int]]:
         """
         日语音频提取
         使用phones层，将辅音+元音合并为音节
         """
         import textgrid
         import soundfile as sf
@@ -289,6 +371,7 @@ class SimpleExportPlugin(ExportPlugin):
             tg = textgrid.TextGrid.fromFile(tg_path)
             audio, sr = sf.read(wav_path, dtype='float32')
             # 查找phones层
             phones_tier = None
@@ -316,6 +399,11 @@ class SimpleExportPlugin(ExportPlugin):
                 if not normalized:
                     continue
                 phone_dir = os.path.join(segments_dir, normalized)
                 os.makedirs(phone_dir, exist_ok=True)
@@ -323,8 +411,8 @@ class SimpleExportPlugin(ExportPlugin):
                 index = current_count + 1
                 phone_counts[normalized] = index
-                start_sample = int(round(start_time * sr))
-                end_sample = int(round(end_time * sr))
                 segment = audio[start_sample:end_sample]
                 if len(segment) == 0:

                 max_value=1000,
                 description="按时长排序，保留最长的N个"
             ),
+            PluginOption(
+                key="extend_duration",
+                label="头尾拓展（秒）",
+                option_type=OptionType.TEXT,
+                default="0",
+                description="裁剪时头尾各拓展的时长，最大1.5秒。若一边到达边界，另一边继续拓展"
+            ),
             PluginOption(
                 key="naming_rule",
                 label="命名规则",
         name = rule.replace("%p%", pinyin).replace("%n%", str(index))
         return name
+    def _apply_extend(
+        self,
+        start_time: float,
+        end_time: float,
+        extend_duration: float,
+        audio_duration: float
+    ) -> Tuple[float, float]:
+        """
+        应用头尾拓展
+        头尾各拓展 extend_duration 秒，若一边到达边界则另一边继续拓展
+        参数:
+            start_time: 原始开始时间
+            end_time: 原始结束时间
+            extend_duration: 单边拓展时长
+            audio_duration: 音频总时长
+        返回:
+            (实际开始时间, 实际结束时间)
+        """
+        if extend_duration <= 0:
+            return start_time, end_time
+        total_extend = extend_duration * 2  # 总拓展量
+        # 先尝试头尾各拓展
+        head_extend = extend_duration
+        tail_extend = extend_duration
+        # 检查头部是否到达边界
+        if start_time - head_extend < 0:
+            head_actual = start_time  # 头部只能拓展到0
+            head_remaining = head_extend - head_actual  # 剩余量转给尾部
+            tail_extend += head_remaining
+            head_extend = head_actual
+        # 检查尾部是否到达边界
+        if end_time + tail_extend > audio_duration:
+            tail_actual = audio_duration - end_time  # 尾部只能拓展到边界
+            tail_remaining = tail_extend - tail_actual  # 剩余量转给头部
+            # 头部再次尝试拓展（如果还有空间）
+            additional_head = min(tail_remaining, start_time - (start_time - head_extend))
+            head_extend = min(start_time, head_extend + tail_remaining)
+            tail_extend = tail_actual
+        actual_start = max(0, start_time - head_extend)
+        actual_end = min(audio_duration, end_time + tail_extend)
+        return actual_start, actual_end
     def export(
         self,
         source_name: str,
             temp_base = os.path.join(bank_dir, ".temp_segments")
             segments_dir = os.path.join(temp_base, source_name)
+            # 获取头尾拓展参数
+            extend_duration = min(float(options.get("extend_duration", 0)), 1.5)
             # 步骤1: 提取分词片段
             self._log("【提取分词片段】")
+            if extend_duration > 0:
+                self._log(f"头尾拓展: {extend_duration}s（单边到达边界时另一边继续拓展）")
             success, msg, pinyin_counts = self._extract_segments(
                 paths["slices_dir"],
                 paths["textgrid_dir"],
                 segments_dir,
+                language,
+                extend_duration
             )
             if not success:
                 return False, msg
         slices_dir: str,
         textgrid_dir: str,
         segments_dir: str,
+        language: str,
+        extend_duration: float = 0.0
     ) -> Tuple[bool, str, Dict[str, int]]:
         """
         提取分词片段
         中文：使用words层按字切分，用char_to_pinyin获取拼音名称
         日语：使用phones层按音素切分，合并辅音+元音为音节
+        参数:
+            extend_duration: 头尾单边拓展时长（秒），单边到达边界时另一边继续拓展
         """
         try:
             import textgrid
             # 根据语言选择提取方法
             if language in ("japanese", "ja", "jp"):
                 return self._extract_japanese_segments(
+                    tg_files, slices_dir, segments_dir, extend_duration
                 )
             else:
                 return self._extract_chinese_segments(
+                    tg_files, slices_dir, segments_dir, language, extend_duration
                 )
         except Exception as e:
         tg_files: List[str],
         slices_dir: str,
         segments_dir: str,
+        language: str,
+        extend_duration: float = 0.0
     ) -> Tuple[bool, str, Dict[str, int]]:
         """
         中文音频提取
         使用words层的时间边界，按字符切分，用char_to_pinyin获取拼音
+        参数:
+            extend_duration: 头尾单边拓展时长（秒），单边到达边界时另一边继续拓展
         """
         import textgrid
         import soundfile as sf
             tg = textgrid.TextGrid.fromFile(tg_path)
             audio, sr = sf.read(wav_path, dtype='float32')
+            audio_duration = len(audio) / sr
             # 使用words层（第一层）
             words_tier = tg[0]
                     char_start = start_time + i * char_duration
                     char_end = char_start + char_duration
+                    # 应用头尾拓展，单边到达边界时另一边继续拓展
+                    actual_start, actual_end = self._apply_extend(
+                        char_start, char_end, extend_duration, audio_duration
+                    )
                     pinyin_dir = os.path.join(segments_dir, pinyin)
                     os.makedirs(pinyin_dir, exist_ok=True)
                     index = current_count + 1
                     pinyin_counts[pinyin] = index
+                    start_sample = int(round(actual_start * sr))
+                    end_sample = int(round(actual_end * sr))
                     segment = audio[start_sample:end_sample]
                     if len(segment) == 0:
         self,
         tg_files: List[str],
         slices_dir: str,
+        segments_dir: str,
+        extend_duration: float = 0.0
     ) -> Tuple[bool, str, Dict[str, int]]:
         """
         日语音频提取
         使用phones层，将辅音+元音合并为音节
+        参数:
+            extend_duration: 头尾单边拓展时长（秒），单边到达边界时另一边继续拓展
         """
         import textgrid
         import soundfile as sf
             tg = textgrid.TextGrid.fromFile(tg_path)
             audio, sr = sf.read(wav_path, dtype='float32')
+            audio_duration = len(audio) / sr
             # 查找phones层
             phones_tier = None
                 if not normalized:
                     continue
+                # 应用头尾拓展，单边到达边界时另一边继续拓展
+                actual_start, actual_end = self._apply_extend(
+                    start_time, end_time, extend_duration, audio_duration
+                )
                 phone_dir = os.path.join(segments_dir, normalized)
                 os.makedirs(phone_dir, exist_ok=True)
                 index = current_count + 1
                 phone_counts[normalized] = index
+                start_sample = int(round(actual_start * sr))
+                end_sample = int(round(actual_end * sr))
                 segment = audio[start_sample:end_sample]
                 if len(segment) == 0:

src/export_plugins/utau_oto_export.py CHANGED Viewed

@@ -238,6 +238,13 @@ class UTAUOtoExportPlugin(ExportPlugin):
                 label="从 TextGrid phones 层提取音素，生成 oto.ini（音频不裁剪）",
                 option_type=OptionType.LABEL
             ),
             PluginOption(
                 key="max_samples",
                 label="每个别名最大样本数",
@@ -286,6 +293,13 @@ class UTAUOtoExportPlugin(ExportPlugin):
                 max_value=0.5,
                 description="Overlap = Preutterance × 此比例"
             ),
             PluginOption(
                 key="encoding",
                 label="文件编码",

                 label="从 TextGrid phones 层提取音素，生成 oto.ini（音频不裁剪）",
                 option_type=OptionType.LABEL
             ),
+            PluginOption(
+                key="cross_language",
+                label="跨语种导出",
+                option_type=OptionType.SWITCH,
+                default=False,
+                description="【TODO】启用中跨日或日跨中的音素映射导出"
+            ),
             PluginOption(
                 key="max_samples",
                 label="每个别名最大样本数",
                 max_value=0.5,
                 description="Overlap = Preutterance × 此比例"
             ),
+            PluginOption(
+                key="auto_phoneme_combine",
+                label="自动拼字",
+                option_type=OptionType.SWITCH,
+                default=False,
+                description="【TODO】尽可能用已有的音素拆分拼接成缺失的音素"
+            ),
             PluginOption(
                 key="encoding",
                 label="文件编码",

src/gui_cloud.py CHANGED Viewed

@@ -534,31 +534,13 @@ def get_plugin_options_config(plugins: Dict[str, Any]) -> Dict[str, List[Dict]]:
                 "choices": opt.choices,
                 "min_value": opt.min_value,
                 "max_value": opt.max_value,
             }
             options.append(opt_config)
         config[name] = options
     return config
-def build_plugin_options_html(plugin_name: str, plugins_config: Dict) -> str:
-    """
-    根据插件选项生成 HTML 表单
-    这个方法生成一个简单的 HTML 表单，用于在 Gradio 中显示插件选项
-    """
-    if plugin_name not in plugins_config:
-        return "<p>未找到插件配置</p>"
-    options = plugins_config[plugin_name]
-    html_parts = []
-    for opt in options:
-        if opt["type"] == "label":
-            html_parts.append(f'<p style="color: #666; font-style: italic;">{opt["label"]}</p>')
-    return "\n".join(html_parts) if html_parts else ""
 def get_default_options_json(plugin_name: str, plugins_config: Dict) -> str:
     """获取插件的默认选项 JSON"""
     if plugin_name not in plugins_config:
@@ -573,6 +555,145 @@ def get_default_options_json(plugin_name: str, plugins_config: Dict) -> str:
     return json.dumps(defaults, ensure_ascii=False)
 # ==================== 构建界面 ====================
 def create_cloud_ui():
@@ -743,128 +864,126 @@ def create_cloud_ui():
                     label="导出插件"
                 )
-                # 插件描述
-                plugin_desc = gr.Markdown(
-                    value=f"> {plugins[plugin_names[0]].description}" if plugin_names and plugin_names[0] in plugins else ""
-                )
-                # 存储当前选项的 JSON（隐藏）
-                options_state = gr.State(
-                    value=get_default_options_json(plugin_names[0], plugins_config) if plugin_names else "{}"
-                )
                 # ===== 动态选项区域 =====
-                # 使用 gr.Group 包裹所有可能的选项组件，通过 visible 控制显示
-                # 通用选项（两个插件都有）
-                with gr.Group():
-                    gr.Markdown("#### 基本设置")
-                    with gr.Row():
-                        export_max_samples = gr.Number(
-                            label="每个拼音/别名最大样本数",
-                            value=10,
-                            minimum=1,
-                            maximum=1000
-                        )
-                    with gr.Row():
-                        export_naming = gr.Textbox(
-                            label="命名规则",
-                            value="%p%%n%",
-                            info="%p%=拼音/罗马音, %n%=序号"
-                        )
-                        export_first_naming = gr.Textbox(
-                            label="首个样本命名",
-                            value="%p%",
-                            info="第0个样本的特殊规则"
-                        )
-                # UTAU 专用选项
-                with gr.Group(visible=False) as utau_options_group:
-                    gr.Markdown("#### UTAU 专用设置")
-                    with gr.Row():
-                        export_quality_metrics = gr.Dropdown(
-                            label="质量评估维度",
-                            choices=["duration", "duration+rms", "duration+f0", "all"],
-                            value="duration+rms",
-                            info="duration=仅时长, +rms=音量稳定性, +f0=音高稳定性"
-                        )
-                        export_alias_style = gr.Dropdown(
-                            label="别名风格（日语）",
-                            choices=["romaji", "hiragana"],
-                            value="hiragana",
-                            info="日语音源的别名格式"
-                        )
-                    with gr.Row():
-                        export_overlap_ratio = gr.Number(
-                            label="Overlap 比例",
-                            value=0.3,
-                            minimum=0.1,
-                            maximum=0.5,
-                            info="Overlap = Preutterance × 此比例"
-                        )
-                        export_encoding = gr.Dropdown(
-                            label="文件编码",
-                            choices=["shift_jis", "utf-8", "gbk"],
-                            value="shift_jis",
-                            info="oto.ini 编码（UTAU 标准为 Shift_JIS）"
-                        )
-                    export_sanitize_filename = gr.Checkbox(
-                        label="文件名转拼音（防止 UTAU 识别故障）",
-                        value=False
-                    )
-                # 插件切换时更新选项显示
-                def on_plugin_change(plugin_name):
-                    """切换插件时更新选项区域"""
-                    is_utau = "UTAU" in plugin_name
-                    # 获取插件描述
-                    desc = ""
-                    if plugin_name in plugins:
-                        desc = f"> {plugins[plugin_name].description}"
-                    # 获取默认值
-                    default_max = 5 if is_utau else 10
-                    return (
-                        gr.update(visible=is_utau),  # utau_options_group
-                        desc,  # plugin_desc
-                        default_max,  # export_max_samples
-                    )
                 export_plugin.change(
                     fn=on_plugin_change,
                     inputs=[export_plugin],
-                    outputs=[utau_options_group, plugin_desc, export_max_samples]
                 )
                 # 收集选项并导出
-                def collect_and_export(
-                    zip_file, plugin_name,
-                    max_samples, naming_rule, first_naming_rule,
-                    quality_metrics, alias_style, overlap_ratio, encoding, sanitize_filename,
-                    progress=gr.Progress()
-                ):
-                    """收集所有选项并执行导出"""
-                    # 构建选项字典
-                    options = {
-                        "max_samples": int(max_samples),
-                        "naming_rule": naming_rule,
-                        "first_naming_rule": first_naming_rule,
-                    }
-                    # UTAU 专用选项
-                    if "UTAU" in plugin_name:
-                        options.update({
-                            "quality_metrics": quality_metrics,
-                            "alias_style": alias_style,
-                            "overlap_ratio": float(overlap_ratio),
-                            "encoding": encoding,
-                            "sanitize_filename": sanitize_filename,
-                        })
                     options_json = json.dumps(options, ensure_ascii=False)
                     return process_export_voicebank(zip_file, plugin_name, options_json, progress)
@@ -884,14 +1003,17 @@ def create_cloud_ui():
                 > - 导出为适配其他软件的音源格式
                 """)
                 export_btn.click(
                     fn=collect_and_export,
-                    inputs=[
-                        export_upload, export_plugin,
-                        export_max_samples, export_naming, export_first_naming,
-                        export_quality_metrics, export_alias_style,
-                        export_overlap_ratio, export_encoding, export_sanitize_filename
-                    ],
                     outputs=[export_status, export_log, export_download]
                 )

                 "choices": opt.choices,
                 "min_value": opt.min_value,
                 "max_value": opt.max_value,
+                "step": opt.step,
             }
             options.append(opt_config)
         config[name] = options
     return config
 def get_default_options_json(plugin_name: str, plugins_config: Dict) -> str:
     """获取插件的默认选项 JSON"""
     if plugin_name not in plugins_config:
     return json.dumps(defaults, ensure_ascii=False)
def create_dynamic_plugin_options(
    plugins: Dict[str, Any], plugins_config: Dict
) -> Tuple[Dict[str, Any], Dict[str, Dict[str, Any]]]:
    """
    Build one Gradio option group per export plugin.

    Must be called inside an active Gradio layout context, because the
    components are created as a side effect of the ``with gr.Group(...)``
    blocks below.

    Args:
        plugins: Mapping of plugin name to plugin object; only its
            ``description`` attribute is read here.
        plugins_config: Mapping of plugin name to a list of option dicts with
            the keys ``type``, ``key``, ``label``, ``default`` and optionally
            ``description``, ``choices``, ``min_value``, ``max_value``,
            ``step``.

    Returns:
        ``(all_groups, all_components)`` where ``all_groups`` maps
        plugin name -> ``gr.Group`` and ``all_components`` maps
        plugin name -> {option key -> input component}. ``label`` options are
        rendered as Markdown and are NOT included in ``all_components``.
    """
    all_groups = {}
    all_components = {}

    for index, (plugin_name, options) in enumerate(plugins_config.items()):
        plugin_components = {}

        # Only the first plugin's group starts visible; the others are shown
        # when the user switches plugin.
        with gr.Group(visible=(index == 0)) as plugin_group:
            if plugin_name in plugins:
                gr.Markdown(f"> {plugins[plugin_name].description}")

            for opt in options:
                opt_type = opt["type"]
                key = opt["key"]
                label = opt["label"]
                default = opt["default"]
                description = opt.get("description", "")
                choices = opt.get("choices", [])
                min_val = opt.get("min_value")
                max_val = opt.get("max_value")
                step = opt.get("step")

                if opt_type == "label":
                    # Static explanatory text: rendered, but not an input.
                    gr.Markdown(f"*{label}*")
                    continue
                elif opt_type == "text":
                    component = gr.Textbox(
                        label=label,
                        value=default or "",
                        info=description
                    )
                elif opt_type == "number":
                    component = gr.Number(
                        label=label,
                        value=default if default is not None else 0,
                        minimum=min_val,
                        maximum=max_val,
                        step=step or 1,
                        info=description
                    )
                elif opt_type == "switch":
                    component = gr.Checkbox(
                        label=label,
                        value=bool(default),
                        info=description
                    )
                elif opt_type == "combo":
                    # Fall back to the first choice when the default is not
                    # one of the offered choices.
                    component = gr.Dropdown(
                        label=label,
                        choices=choices,
                        value=default if default in choices else (choices[0] if choices else None),
                        info=description
                    )
                elif opt_type == "multi_select":
                    component = gr.CheckboxGroup(
                        label=label,
                        choices=choices,
                        value=default if isinstance(default, list) else [],
                        info=description
                    )
                else:
                    # Unknown option type: degrade to a plain text box.
                    component = gr.Textbox(
                        label=label,
                        value=str(default) if default else "",
                        info=description
                    )

                plugin_components[key] = component

        all_groups[plugin_name] = plugin_group
        all_components[plugin_name] = plugin_components

    return all_groups, all_components
def build_options_collector(plugins_config: Dict, all_components: Dict):
    """
    Build a function that picks one plugin's option values out of a flat list.

    The flat ``values`` sequence is expected to hold the values of every
    plugin's components back to back, in the iteration order of
    ``all_components``.

    Args:
        plugins_config: Not used by the collector; kept so the signature
            stays compatible with existing callers.
        all_components: Mapping of plugin name -> {option key -> component}.

    Returns:
        ``collect_options(plugin_name, *values) -> dict`` mapping each option
        key of ``plugin_name`` to its value. An unknown plugin yields ``{}``;
        keys whose position lies past the end of ``values`` are omitted.
    """
    component_keys = {
        name: list(components) for name, components in all_components.items()
    }

    # The position of each plugin's first value depends only on the component
    # layout, so compute it once here rather than on every call.
    offsets = {}
    position = 0
    for name, keys in component_keys.items():
        offsets[name] = position
        position += len(keys)

    def collect_options(plugin_name: str, *values) -> Dict[str, Any]:
        """Return ``{option key: value}`` for ``plugin_name``."""
        if plugin_name not in component_keys:
            return {}
        keys = component_keys[plugin_name]
        start = offsets[plugin_name]
        # zip stops at the shorter side, so missing trailing values are
        # simply left out of the result.
        return dict(zip(keys, values[start:start + len(keys)]))

    return collect_options
 # ==================== 构建界面 ====================
 def create_cloud_ui():
                     label="导出插件"
                 )
                 # ===== 动态选项区域 =====
+                # 为每个插件动态创建选项组件
+                all_plugin_groups = {}
+                all_plugin_components = {}
+                for idx, (pname, poptions) in enumerate(plugins_config.items()):
+                    is_first = (idx == 0)
+                    plugin_components = {}
+                    with gr.Group(visible=is_first) as plugin_group:
+                        # 插件描述
+                        if pname in plugins:
+                            gr.Markdown(f"> {plugins[pname].description}")
+                        # 动态创建选项组件
+                        for opt in poptions:
+                            opt_type = opt["type"]
+                            key = opt["key"]
+                            label = opt["label"]
+                            default = opt["default"]
+                            description = opt.get("description", "")
+                            choices = opt.get("choices", [])
+                            min_val = opt.get("min_value")
+                            max_val = opt.get("max_value")
+                            step = opt.get("step")
+                            if opt_type == "label":
+                                gr.Markdown(f"*{label}*")
+                                continue
+                            elif opt_type == "text":
+                                component = gr.Textbox(
+                                    label=label,
+                                    value=default or "",
+                                    info=description
+                                )
+                            elif opt_type == "number":
+                                component = gr.Number(
+                                    label=label,
+                                    value=default if default is not None else 0,
+                                    minimum=min_val,
+                                    maximum=max_val,
+                                    step=step or 1,
+                                    info=description
+                                )
+                            elif opt_type == "switch":
+                                component = gr.Checkbox(
+                                    label=label,
+                                    value=bool(default),
+                                    info=description
+                                )
+                            elif opt_type == "combo":
+                                component = gr.Dropdown(
+                                    label=label,
+                                    choices=choices,
+                                    value=default if default in choices else (choices[0] if choices else None),
+                                    info=description
+                                )
+                            elif opt_type == "multi_select":
+                                component = gr.CheckboxGroup(
+                                    label=label,
+                                    choices=choices,
+                                    value=default if isinstance(default, list) else [],
+                                    info=description
+                                )
+                            else:
+                                component = gr.Textbox(
+                                    label=label,
+                                    value=str(default) if default else "",
+                                    info=description
+                                )
+                            plugin_components[key] = component
+                    all_plugin_groups[pname] = plugin_group
+                    all_plugin_components[pname] = plugin_components
+                # 插件切换时更新选项组可见性
+                def on_plugin_change(selected_plugin):
+                    """切换插件时更新选项区域可见性"""
+                    updates = []
+                    for pname in plugins_config.keys():
+                        updates.append(gr.update(visible=(pname == selected_plugin)))
+                    return updates
+                # 绑定插件切换事件
                 export_plugin.change(
                     fn=on_plugin_change,
                     inputs=[export_plugin],
+                    outputs=list(all_plugin_groups.values())
                 )
                 # 收集选项并导出
+                def collect_and_export(zip_file, plugin_name, *all_values, progress=gr.Progress()):
+                    """收集当前插件的选项并执行导出"""
+                    # 根据插件名找到对应的选项配置
+                    if plugin_name not in plugins_config:
+                        return "❌ 未找到插件配置", "", None
+                    # 计算当前插件的值在 all_values 中的位置
+                    start_idx = 0
+                    for pname in plugins_config.keys():
+                        if pname == plugin_name:
+                            break
+                        # 统计该插件的非 label 选项数量
+                        start_idx += sum(1 for opt in plugins_config[pname] if opt["type"] != "label")
+                    # 提取当前插件的选项值
+                    options = {}
+                    current_idx = start_idx
+                    for opt in plugins_config[plugin_name]:
+                        if opt["type"] == "label":
+                            continue
+                        key = opt["key"]
+                        if current_idx < len(all_values):
+                            value = all_values[current_idx]
+                            # 类型转换
+                            if opt["type"] == "number":
+                                value = float(value) if value is not None else opt["default"]
+                            options[key] = value
+                        current_idx += 1
                     options_json = json.dumps(options, ensure_ascii=False)
                     return process_export_voicebank(zip_file, plugin_name, options_json, progress)
                 > - 导出为适配其他软件的音源格式
                 """)
+                # 收集所有插件的所有组件作为输入
+                all_option_components = []
+                for pname in plugins_config.keys():
+                    if pname in all_plugin_components:
+                        for opt in plugins_config[pname]:
+                            if opt["type"] != "label" and opt["key"] in all_plugin_components[pname]:
+                                all_option_components.append(all_plugin_components[pname][opt["key"]])
                 export_btn.click(
                     fn=collect_and_export,
+                    inputs=[export_upload, export_plugin] + all_option_components,
                     outputs=[export_status, export_log, export_download]
                 )

tools/README.md CHANGED Viewed

@@ -30,5 +30,5 @@ tools/
 ## 注意事项
 - MFA 引擎仅支持 Windows 64位系统
-- 解压后约占用 500MB 磁盘空间
 - 首次运行可能需要较长时间初始化

 ## 注意事项
 - MFA 引擎仅支持 Windows 64位系统
+- 解压后约占用 2GB 磁盘空间
 - 首次运行可能需要较长时间初始化

tools/mfa_engine.7z ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5ccbaac4541b3ae414ddecb8d6e092e622887b6a30155f01c3ecc84cd6aba86b
+size 395100074