DataEval committed on
Commit
28b65b3
·
verified ·
1 Parent(s): 95cc0d2

update v2.0

Browse files
Files changed (1) hide show
  1. app.py +279 -218
app.py CHANGED
@@ -14,17 +14,17 @@ from dingo.model import Model
14
 
15
  def dingo_demo(
16
  uploaded_file,
17
- dataset_source, data_format, input_path, max_workers, batch_size,
18
- column_id, column_prompt, column_content, column_image,
19
- rule_list, prompt_list, scene_list,
20
- model, key, api_url
 
21
  ):
22
  if not data_format:
23
  raise gr.Error('ValueError: data_format can not be empty, please input.')
24
- # if not column_content:
25
- # raise gr.Error('ValueError: column_content can not be empty, please input.')
26
- if not rule_list and not prompt_list:
27
- raise gr.Error('ValueError: rule_list and prompt_list can not be empty at the same time.')
28
 
29
  # Handle input path based on dataset source
30
  if dataset_source == "hugging_face":
@@ -47,42 +47,127 @@ def dingo_demo(
47
  raise gr.Error('Please input value > 0 in batch_size.')
48
 
49
  try:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
50
  input_data = {
51
  "input_path": final_input_path,
52
  "output_path": "" if dataset_source == 'hugging_face' else os.path.dirname(final_input_path),
53
  "dataset": {
54
  "source": dataset_source,
55
  "format": data_format,
56
- "field": {}
57
  },
58
  "executor": {
59
- "rule_list": rule_list,
60
- "prompt_list": prompt_list,
61
  "result_save": {
62
  "bad": True,
63
- "raw": True
64
  },
65
  "max_workers": max_workers,
66
  "batch_size": batch_size,
67
  },
68
- "evaluator": {
69
- "llm_config": {
70
- scene_list: {
71
- "model": model,
72
- "key": key,
73
- "api_url": api_url,
74
- }
75
  }
76
- }
77
  }
78
- if column_id:
79
- input_data['dataset']['field']['id'] = column_id
80
- if column_prompt:
81
- input_data['dataset']['field']['prompt'] = column_prompt
82
- if column_content:
83
- input_data['dataset']['field']['content'] = column_content
84
- if column_image:
85
- input_data['dataset']['field']['image'] = column_image
86
 
87
  # print(input_data)
88
  # exit(0)
@@ -91,28 +176,33 @@ def dingo_demo(
91
  executor = Executor.exec_map["local"](input_args)
92
  summary = executor.execute().to_dict()
93
  detail = executor.get_bad_info_list()
 
94
  new_detail = []
95
  for item in detail:
96
- new_detail.append(item)
 
 
97
  if summary['output_path']:
98
- shutil.rmtree(summary['output_path'])
 
 
99
 
100
- # 返回两个值:概要信息和详细信息
101
  return json.dumps(summary, indent=4), new_detail
102
  except Exception as e:
103
  raise gr.Error(str(e))
104
 
105
 
106
  def update_input_components(dataset_source):
107
- # 根据数据源的不同,返回不同的输入组件
108
  if dataset_source == "hugging_face":
109
- # 如果数据源是huggingface,返回一个可见的文本框和一个不可见的文件组件
110
  return [
111
  gr.Textbox(visible=True),
112
  gr.File(visible=False),
113
  ]
114
  else: # local
115
- # 如果数据源是本地,返回一个不可见的文本框和一个可见的文件组件
116
  return [
117
  gr.Textbox(visible=False),
118
  gr.File(visible=True),
@@ -123,72 +213,66 @@ def update_rule_list(rule_type_mapping, rule_type):
123
  return gr.CheckboxGroup(
124
  choices=rule_type_mapping.get(rule_type, []),
125
  value=[],
126
- label="rule_list"
 
127
  )
128
 
129
 
130
- def update_prompt_list(scene_prompt_mapping, scene):
131
- """根据选择的场景更新可用的prompt列表,并清空所有勾选"""
132
- return gr.CheckboxGroup(
133
- choices=scene_prompt_mapping.get(scene, []),
134
- value=[], # 清空所有勾选
135
- label="prompt_list"
136
- )
 
 
 
 
 
137
 
138
 
139
- # prompt_list变化时,动态控制model、key、api_url的显示
140
- def toggle_llm_fields(prompt_values):
141
- visible = bool(prompt_values)
142
- return (
143
- gr.update(visible=visible),
144
- gr.update(visible=visible),
145
- gr.update(visible=visible)
146
- )
 
147
 
 
148
 
149
- # 控制column_id、column_prompt、column_content、column_image的显示
150
- def update_column_fields(rule_list, prompt_list):
 
 
 
 
151
  rule_type_mapping = get_rule_type_mapping()
152
- scene_prompt_mapping = get_scene_prompt_mapping()
153
  data_column_mapping = get_data_column_mapping()
154
- status_mapping = {
155
- 'id': False,
156
- 'prompt': False,
157
- 'content': False,
158
- 'image': False,
159
- }
160
 
161
- res = (
162
- gr.update(visible=status_mapping['id']),
163
- gr.update(visible=status_mapping['prompt']),
164
- gr.update(visible=status_mapping['content']),
165
- gr.update(visible=status_mapping['image'])
166
- )
167
- if not rule_list and not prompt_list:
168
- return res
169
 
170
- key_list = []
171
- key_list += get_key_by_mapping(rule_type_mapping, rule_list)
172
- key_list += get_key_by_mapping(scene_prompt_mapping, prompt_list)
 
 
173
 
174
- data_column = []
175
- for key in key_list:
176
- if not data_column:
177
- data_column = data_column_mapping[key]
178
- else:
179
- new_data_column = data_column_mapping[key]
180
- if data_column != new_data_column:
181
- raise gr.Error(f'ConflictError: {key} need data type is different from other.')
182
-
183
- for c in data_column:
184
- status_mapping[c] = True
185
- res = (
186
- gr.update(visible=status_mapping['id']),
187
- gr.update(visible=status_mapping['prompt']),
188
- gr.update(visible=status_mapping['content']),
189
- gr.update(visible=status_mapping['image'])
190
- )
191
- return res
192
 
193
 
194
  def get_rule_type_mapping():
@@ -208,50 +292,32 @@ def get_rule_type_mapping():
208
  return process_map
209
 
210
 
211
- def get_scene_prompt_mapping():
212
- origin_map = Model.get_scenario_prompt_map()
213
- process_map = {'LLMTextQualityModelBase': [], 'LLMTextQualityPromptBase': []} # can adjust the order
214
- for k, v in origin_map.items():
215
- for p in v:
216
- if k not in process_map:
217
- process_map[k] = []
218
- process_map[k].append(p.__name__)
219
- # print(process_map)
220
-
221
- return process_map
222
-
223
-
224
- def get_key_by_mapping(map_dict: dict, value_list: list):
225
- key_list = []
226
- for k, v in map_dict.items():
227
- if bool(set(v) & set(value_list)):
228
- key_list.append(k)
229
-
230
- return key_list
 
231
 
232
 
233
  def get_data_column_mapping():
234
  return {
235
- # llm
236
- 'LLMTextQualityPromptBase': ['content'],
237
- 'LLMTextQualityModelBase': ['content'],
238
- 'LLMSecurityPolitics': ['content'],
239
- 'LLMSecurityProhibition': ['content'],
240
- 'LLMText3HHarmless': ['content'],
241
- 'LLMText3HHelpful': ['content'],
242
- 'LLMText3HHonest': ['content'],
243
- 'LLMClassifyTopic': ['content'],
244
- 'LLMClassifyQR': ['content'],
245
- 'LLMDatamanAssessment': ['content'],
246
- 'VLMImageRelevant': ['prompt', 'content'],
247
-
248
- # rule
249
- # 'QUALITY_BAD_COMPLETENESS': ['content'],
250
- # 'QUALITY_BAD_EFFECTIVENESS': ['content'],
251
- # 'QUALITY_BAD_FLUENCY': ['content'],
252
- # 'QUALITY_BAD_RELEVANCE': ['content'],
253
- # 'QUALITY_BAD_SIMILARITY': ['content'],
254
- # 'QUALITY_BAD_UNDERSTANDABILITY': ['content'],
255
  'Rule-Based TEXT Quality Metrics': ['content'],
256
  'QUALITY_BAD_SECURITY': ['content'],
257
  'QUALITY_BAD_IMG_EFFECTIVENESS': ['image'],
@@ -264,8 +330,7 @@ if __name__ == '__main__':
264
  rule_type_mapping = get_rule_type_mapping()
265
  rule_type_options = list(rule_type_mapping.keys())
266
 
267
- scene_prompt_mapping = get_scene_prompt_mapping()
268
- scene_options = list(scene_prompt_mapping.keys())
269
 
270
  current_dir = Path(__file__).parent
271
  with open(os.path.join(current_dir, 'header.html'), "r") as file:
@@ -291,10 +356,16 @@ if __name__ == '__main__':
291
  visible=False
292
  )
293
 
294
- data_format = gr.Dropdown(
295
- ["jsonl", "json", "plaintext", "listjson","image"],
296
- label="data_format"
297
- )
 
 
 
 
 
 
298
  with gr.Row():
299
  max_workers = gr.Number(
300
  value=1,
@@ -313,84 +384,72 @@ if __name__ == '__main__':
313
  rule_type = gr.Dropdown(
314
  choices=rule_type_options,
315
  value=rule_type_options[0],
316
- label="rule_type",
317
  interactive=True
318
  )
319
  rule_list = gr.CheckboxGroup(
320
  choices=rule_type_mapping.get(rule_type_options[0], []),
321
- label="rule_list"
 
322
  )
323
- # 添加场景选择下拉框
324
- scene_list = gr.Dropdown(
325
- choices=scene_options,
326
- value=scene_options[0],
327
- label="scenario_list",
328
- interactive=True
329
  )
330
- prompt_list = gr.CheckboxGroup(
331
- choices=scene_prompt_mapping.get(scene_options[0], []),
332
- label="prompt_list"
333
- )
334
- # LLM模型名
335
- model = gr.Textbox(
336
- placeholder="If want to use llm, please input model, such as: deepseek-chat",
337
- label="model",
338
- visible=False
339
- )
340
- # LLM API KEY
341
- key = gr.Textbox(
342
- placeholder="If want to use llm, please input key, such as: 123456789012345678901234567890xx",
343
- label="API KEY",
344
- visible=False
345
  )
346
- # LLM API URL
347
- api_url = gr.Textbox(
348
- placeholder="If want to use llm, please input api_url, such as: https://api.deepseek.com/v1",
349
- label="API URL",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
350
  visible=False
351
  )
352
 
353
- with gr.Row():
354
- # 字段映射说明文本,带示例链接
355
- with gr.Column():
356
- gr.Markdown(
357
- "Please input the column name of dataset in the input boxes below ( [examples](https://github.com/MigoXLab/dingo/tree/main/examples) )")
358
-
359
- column_id = gr.Textbox(
360
- value="",
361
- placeholder="Column name of id in the input file. If exists multiple levels, use '.' separate",
362
- label="column_id",
363
- visible=False
364
- )
365
- column_prompt = gr.Textbox(
366
- value="",
367
- placeholder="Column name of prompt in the input file. If exists multiple levels, use '.' separate",
368
- label="column_prompt",
369
- visible=False
370
- )
371
- column_content = gr.Textbox(
372
- value="content",
373
- placeholder="Column name of content in the input file. If exists multiple levels, use '.' separate",
374
- label="column_content",
375
- visible=False
376
- )
377
- column_image = gr.Textbox(
378
- value="",
379
- placeholder="Column name of image in the input file. If exists multiple levels, use '.' separate",
380
- label="column_image",
381
- visible=False
382
- )
383
-
384
  with gr.Row():
385
  submit_single = gr.Button(value="Submit", interactive=True, variant="primary")
386
 
387
  with gr.Column():
388
- # 修改输出组件部分,使用Tabs
389
  with gr.Tabs():
390
  with gr.Tab("Result Summary"):
391
- summary_output = gr.JSON(label="summary", max_height=800)
392
  with gr.Tab("Result Detail"):
393
- detail_output = gr.JSON(label="detail", max_height=800) # 使用JSON组件来更好地展示结构化数据
394
 
395
  dataset_source.change(
396
  fn=update_input_components,
@@ -404,38 +463,40 @@ if __name__ == '__main__':
404
  outputs=rule_list
405
  )
406
 
407
- # 场景变化时更新prompt列表
408
- scene_list.change(
409
- fn=partial(update_prompt_list, scene_prompt_mapping),
410
- inputs=scene_list,
411
- outputs=prompt_list
412
- )
413
-
414
- prompt_list.change(
415
- fn=toggle_llm_fields,
416
- inputs=prompt_list,
417
- outputs=[model, key, api_url]
 
418
  )
419
 
420
- # column字段显示控制
421
- for comp in [rule_list, prompt_list]:
422
  comp.change(
423
- fn=update_column_fields,
424
- inputs=[rule_list, prompt_list],
425
- outputs=[column_id, column_prompt, column_content, column_image]
426
  )
427
 
428
  submit_single.click(
429
  fn=dingo_demo,
430
  inputs=[
431
  uploaded_file,
432
- dataset_source, data_format, input_path, max_workers, batch_size,
433
- column_id, column_prompt, column_content, column_image,
434
- rule_list, prompt_list, scene_list,
435
- model, key, api_url
 
436
  ],
437
- outputs=[summary_output, detail_output] # 修改输出为两个组件
438
  )
439
 
440
- # 启动界面
441
- demo.launch(share=True)
 
14
 
15
  def dingo_demo(
16
  uploaded_file,
17
+ dataset_source, data_format, remove_output, input_path, max_workers, batch_size,
18
+ fields_data,
19
+ rule_list, llm_list,
20
+ # rule_config_data,
21
+ llm_config_data
22
  ):
23
  if not data_format:
24
  raise gr.Error('ValueError: data_format can not be empty, please input.')
25
+
26
+ if not rule_list and not llm_list:
27
+ raise gr.Error('ValueError: rule_list and llm_list can not be empty at the same time.')
 
28
 
29
  # Handle input path based on dataset source
30
  if dataset_source == "hugging_face":
 
47
  raise gr.Error('Please input value > 0 in batch_size.')
48
 
49
  try:
50
+ # Parse fields from dataframe
51
+ fields = {}
52
+ if fields_data is not None and len(fields_data) > 0:
53
+ for row in fields_data.values.tolist():
54
+ if len(row) >= 2 and row[0] and row[1]: # Both key and value are not empty
55
+ fields[row[0]] = row[1]
56
+
57
+ # Parse rule configs from dataframe
58
+ rule_configs = {}
59
+ # if rule_config_data is not None and len(rule_config_data) > 0:
60
+ # for row in rule_config_data.values.tolist():
61
+ # if len(row) >= 6 and row[0]: # Rule name exists
62
+ # rule_name = row[0]
63
+ # config = {}
64
+ #
65
+ # # threshold
66
+ # if row[1] is not None and str(row[1]).strip():
67
+ # try:
68
+ # config['threshold'] = float(row[1])
69
+ # except:
70
+ # pass
71
+ #
72
+ # # pattern
73
+ # if row[2] and str(row[2]).strip():
74
+ # config['pattern'] = str(row[2])
75
+ #
76
+ # # key_list
77
+ # if row[3] and str(row[3]).strip():
78
+ # try:
79
+ # val = str(row[3])
80
+ # config['key_list'] = json.loads(val) if val.startswith('[') else [k.strip() for k in val.split(',') if k.strip()]
81
+ # except:
82
+ # config['key_list'] = [k.strip() for k in str(row[3]).split(',') if k.strip()]
83
+ #
84
+ # # refer_path
85
+ # if row[4] and str(row[4]).strip():
86
+ # try:
87
+ # val = str(row[4])
88
+ # config['refer_path'] = json.loads(val) if val.startswith('[') else [p.strip() for p in val.split(',') if p.strip()]
89
+ # except:
90
+ # config['refer_path'] = [p.strip() for p in str(row[4]).split(',') if p.strip()]
91
+ #
92
+ # # parameters
93
+ # if row[5] and str(row[5]).strip():
94
+ # try:
95
+ # config['parameters'] = json.loads(str(row[5]))
96
+ # except:
97
+ # pass
98
+ #
99
+ # if config:
100
+ # rule_configs[rule_name] = config
101
+
102
+ # Parse llm configs from dataframe
103
+ llm_configs = {}
104
+ if llm_config_data is not None and len(llm_config_data) > 0:
105
+ for row in llm_config_data.values.tolist():
106
+ if len(row) >= 5 and row[0]: # LLM name exists
107
+ llm_name = row[0]
108
+ config = {}
109
+
110
+ # model
111
+ if row[1] and str(row[1]).strip():
112
+ config['model'] = str(row[1])
113
+
114
+ # key
115
+ if row[2] and str(row[2]).strip():
116
+ config['key'] = str(row[2])
117
+
118
+ # api_url
119
+ if row[3] and str(row[3]).strip():
120
+ config['api_url'] = str(row[3])
121
+
122
+ # parameters
123
+ if row[4] and str(row[4]).strip():
124
+ try:
125
+ config['parameters'] = json.loads(str(row[4]))
126
+ except json.JSONDecodeError as e:
127
+ raise gr.Error(f"Invalid JSON in 'parameters' for LLM '{llm_name}': {e}")
128
+
129
+ if config:
130
+ llm_configs[llm_name] = config
131
+
132
+ # Build evals array
133
+ evals = []
134
+
135
+ # Add rule evaluators and their configurations
136
+ for rule in rule_list:
137
+ eval_item = {"name": rule}
138
+ if rule in rule_configs:
139
+ eval_item["config"] = rule_configs[rule]
140
+ evals.append(eval_item)
141
+
142
+ # Add LLM evaluators and their configurations
143
+ for llm in llm_list:
144
+ eval_item = {"name": llm}
145
+ if llm in llm_configs:
146
+ eval_item["config"] = llm_configs[llm]
147
+ evals.append(eval_item)
148
+
149
  input_data = {
150
  "input_path": final_input_path,
151
  "output_path": "" if dataset_source == 'hugging_face' else os.path.dirname(final_input_path),
152
  "dataset": {
153
  "source": dataset_source,
154
  "format": data_format,
 
155
  },
156
  "executor": {
 
 
157
  "result_save": {
158
  "bad": True,
159
+ # "raw": True
160
  },
161
  "max_workers": max_workers,
162
  "batch_size": batch_size,
163
  },
164
+ "evaluator": [
165
+ {
166
+ "fields": fields,
167
+ "evals": evals
 
 
 
168
  }
169
+ ]
170
  }
 
 
 
 
 
 
 
 
171
 
172
  # print(input_data)
173
  # exit(0)
 
176
  executor = Executor.exec_map["local"](input_args)
177
  summary = executor.execute().to_dict()
178
  detail = executor.get_bad_info_list()
179
+ dingo_id_set = set()
180
  new_detail = []
181
  for item in detail:
182
+ if item['dingo_id'] not in dingo_id_set:
183
+ dingo_id_set.add(item['dingo_id'])
184
+ new_detail.append(item)
185
  if summary['output_path']:
186
+ if remove_output == "true":
187
+ shutil.rmtree(summary['output_path'])
188
+ summary['output_path'] = ""
189
 
190
+ # Return summary and detail information
191
  return json.dumps(summary, indent=4), new_detail
192
  except Exception as e:
193
  raise gr.Error(str(e))
194
 
195
 
196
  def update_input_components(dataset_source):
197
+ # Return different input components based on data source
198
  if dataset_source == "hugging_face":
199
+ # If data source is huggingface, return a visible textbox and an invisible file component
200
  return [
201
  gr.Textbox(visible=True),
202
  gr.File(visible=False),
203
  ]
204
  else: # local
205
+ # If data source is local, return an invisible textbox and a visible file component
206
  return [
207
  gr.Textbox(visible=False),
208
  gr.File(visible=True),
 
213
  return gr.CheckboxGroup(
214
  choices=rule_type_mapping.get(rule_type, []),
215
  value=[],
216
+ label="rule_list",
217
+ elem_classes="limited-height-checkboxgroup"
218
  )
219
 
220
 
221
+ # Generate configuration dataframes based on selected evaluators
222
+ # def generate_rule_config_dataframe(rule_list):
223
+ # """Generate rule configuration dataframe based on selected rules"""
224
+ # if not rule_list:
225
+ # return gr.update(value=[], visible=False)
226
+ #
227
+ # # Create rows for each rule
228
+ # rows = []
229
+ # for rule in rule_list:
230
+ # rows.append([rule, None, "", "", "", ""])
231
+ #
232
+ # return gr.update(value=rows, visible=True)
233
 
234
 
235
+ def generate_llm_config_dataframe(llm_list):
236
+ """Generate LLM configuration dataframe based on selected LLMs"""
237
+ if not llm_list:
238
+ return gr.update(value=[], visible=False)
239
+
240
+ # Create rows for each LLM
241
+ rows = []
242
+ for llm in llm_list:
243
+ rows.append([llm, "deepseek-chat", "your-api-key", "https://api.deepseek.com/v1", ""])
244
 
245
+ return gr.update(value=rows, visible=True)
246
 
247
+
248
+ def suggest_fields_dataframe(rule_list, llm_list):
249
+ """Suggest required field mappings based on selected evaluators"""
250
+ suggested_fields = set()
251
+
252
+ # Fields required by rule evaluators
253
  rule_type_mapping = get_rule_type_mapping()
 
254
  data_column_mapping = get_data_column_mapping()
 
 
 
 
 
 
255
 
256
+ for rule in rule_list:
257
+ # Find which type this rule belongs to
258
+ for rule_type, rules in rule_type_mapping.items():
259
+ if rule in rules:
260
+ if rule_type in data_column_mapping:
261
+ suggested_fields.update(data_column_mapping[rule_type])
262
+ break
 
263
 
264
+ # Fields required by LLM evaluators
265
+ llm_column_mapping = get_llm_column_mapping()
266
+ for llm in llm_list:
267
+ if llm in llm_column_mapping:
268
+ suggested_fields.update(llm_column_mapping[llm])
269
 
270
+ # Generate suggested fields rows
271
+ rows = []
272
+ for field in sorted(suggested_fields):
273
+ rows.append([field, field])
274
+
275
+ return gr.update(value=rows if rows else [["content", "content"]])
 
 
 
 
 
 
 
 
 
 
 
 
276
 
277
 
278
  def get_rule_type_mapping():
 
292
  return process_map
293
 
294
 
295
+ def get_llm_list():
296
+ """Get LLM list from Model.llm_name_map"""
297
+ llm_name_map = Model.get_llm_name_map()
298
+ return list(llm_name_map.keys())
299
+
300
+
301
+ def get_llm_column_mapping():
302
+ """Get column mapping required by each LLM"""
303
+ # Define columns required by each LLM based on actual needs
304
+ # Can be dynamically obtained from Model information, using default configuration for now
305
+ llm_list = get_llm_list()
306
+ mapping = {}
307
+ for llm_name in llm_list:
308
+ # Specify different field requirements based on specific LLM type
309
+ if 'VLM' in llm_name or 'Image' in llm_name:
310
+ mapping[llm_name] = ['content', 'image']
311
+ elif 'Relevant' in llm_name:
312
+ mapping[llm_name] = ['prompt', 'content']
313
+ else:
314
+ mapping[llm_name] = ['content']
315
+ return mapping
316
 
317
 
318
  def get_data_column_mapping():
319
  return {
320
+ # Rule mapping
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
321
  'Rule-Based TEXT Quality Metrics': ['content'],
322
  'QUALITY_BAD_SECURITY': ['content'],
323
  'QUALITY_BAD_IMG_EFFECTIVENESS': ['image'],
 
330
  rule_type_mapping = get_rule_type_mapping()
331
  rule_type_options = list(rule_type_mapping.keys())
332
 
333
+ llm_options = get_llm_list()
 
334
 
335
  current_dir = Path(__file__).parent
336
  with open(os.path.join(current_dir, 'header.html'), "r") as file:
 
356
  visible=False
357
  )
358
 
359
+ with gr.Row():
360
+ data_format = gr.Dropdown(
361
+ ["jsonl", "json", "plaintext", "listjson","image"],
362
+ label="data_format"
363
+ )
364
+ remove_output = gr.Dropdown(
365
+ ["true"],
366
+ value="true",
367
+ label="remove_output"
368
+ )
369
  with gr.Row():
370
  max_workers = gr.Number(
371
  value=1,
 
384
  rule_type = gr.Dropdown(
385
  choices=rule_type_options,
386
  value=rule_type_options[0],
387
+ label="Rule Type",
388
  interactive=True
389
  )
390
  rule_list = gr.CheckboxGroup(
391
  choices=rule_type_mapping.get(rule_type_options[0], []),
392
+ label="Rule List",
393
+ elem_classes="limited-height-checkboxgroup"
394
  )
395
+ # LLM evaluator list
396
+ llm_list = gr.CheckboxGroup(
397
+ choices=llm_options,
398
+ label="LLM List",
399
+ elem_classes="limited-height-checkboxgroup"
 
400
  )
401
+
402
+ gr.Markdown("### EvalPipline Configuration")
403
+ gr.Markdown("Configure field mappings and evaluator parameters based on selected evaluators ([Examples](https://github.com/MigoXLab/dingo/tree/main/examples))")
404
+
405
+ # Field mapping configuration
406
+ gr.Markdown("**EvalPipline.fields** - Field Mapping")
407
+ fields_dataframe = gr.Dataframe(
408
+ value=[["content", "content"]],
409
+ headers=["Field Key", "Dataset Column"],
410
+ datatype=["str", "str"],
411
+ column_count=(2, "fixed"),
412
+ row_count=(1, "dynamic"),
413
+ label="Field Mappings (add/remove rows as needed)",
414
+ interactive=True
 
415
  )
416
+
417
+ # Rule configuration
418
+ # gr.Markdown("**Rule Config** - EvalPiplineConfig.config for Rules")
419
+ # rule_config_dataframe = gr.Dataframe(
420
+ # value=[],
421
+ # headers=["Rule Name", "threshold", "pattern", "key_list", "refer_path", "parameters"],
422
+ # datatype=["str", "number", "str", "str", "str", "str"],
423
+ # column_count=(6, "fixed"),
424
+ # row_count=(0, "dynamic"),
425
+ # label="Rule Configurations (auto-generated based on rule_list selection)",
426
+ # interactive=True,
427
+ # visible=False
428
+ # )
429
+
430
+ # LLM configuration
431
+ gr.Markdown("**LLM Config** - EvalPiplineConfig.config for LLMs")
432
+ llm_config_dataframe = gr.Dataframe(
433
+ value=[],
434
+ headers=["LLM Name", "model", "key", "api_url", "parameters"],
435
+ datatype=["str", "str", "str", "str", "str"],
436
+ column_count=(5, "fixed"),
437
+ row_count=(0, "dynamic"),
438
+ label="LLM Configurations (auto-generated based on llm_list selection)",
439
+ interactive=True,
440
  visible=False
441
  )
442
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
443
  with gr.Row():
444
  submit_single = gr.Button(value="Submit", interactive=True, variant="primary")
445
 
446
  with gr.Column():
447
+ # Output component section, using Tabs
448
  with gr.Tabs():
449
  with gr.Tab("Result Summary"):
450
+ summary_output = gr.JSON(label="Summary", max_height=800)
451
  with gr.Tab("Result Detail"):
452
+ detail_output = gr.JSON(label="Detail", max_height=800) # Use JSON component for better structured data display
453
 
454
  dataset_source.change(
455
  fn=update_input_components,
 
463
  outputs=rule_list
464
  )
465
 
466
+ # Auto-generate configuration dataframes when rule_list changes
467
+ # rule_list.change(
468
+ # fn=generate_rule_config_dataframe,
469
+ # inputs=rule_list,
470
+ # outputs=rule_config_dataframe
471
+ # )
472
+
473
+ # Auto-generate configuration dataframes when llm_list changes
474
+ llm_list.change(
475
+ fn=generate_llm_config_dataframe,
476
+ inputs=llm_list,
477
+ outputs=llm_config_dataframe
478
  )
479
 
480
+ # Suggest field mappings when evaluators change
481
+ for comp in [rule_list, llm_list]:
482
  comp.change(
483
+ fn=suggest_fields_dataframe,
484
+ inputs=[rule_list, llm_list],
485
+ outputs=fields_dataframe
486
  )
487
 
488
  submit_single.click(
489
  fn=dingo_demo,
490
  inputs=[
491
  uploaded_file,
492
+ dataset_source, data_format, remove_output, input_path, max_workers, batch_size,
493
+ fields_dataframe,
494
+ rule_list, llm_list,
495
+ # rule_config_dataframe,
496
+ llm_config_dataframe
497
  ],
498
+ outputs=[summary_output, detail_output]
499
  )
500
 
501
+ # Launch interface
502
+ demo.launch(share=False)