maxiaolong03 committed on
Commit
85fc2c3
·
1 Parent(s): bc61229

add files

Browse files
Files changed (1) hide show
  1. app.py +86 -13
app.py CHANGED
@@ -51,28 +51,53 @@ def get_args() -> argparse.Namespace:
51
  parser.add_argument("--server-name", type=str, default="0.0.0.0", help="Demo server name.")
52
  parser.add_argument("--max_char", type=int, default=8000, help="Maximum character limit for messages.")
53
  parser.add_argument("--max_retry_num", type=int, default=3, help="Maximum retry number for request.")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
54
  parser.add_argument(
55
  "--model_map",
56
  type=str,
57
  default="""{
58
- "ernie-4.5-turbo-128k-preview": "https://qianfan.baidubce.com/v2",
59
- "ernie-4.5-21b-a3b": "https://qianfan.baidubce.com/v2",
60
- "ernie-4.5-0.3b": "https://qianfan.baidubce.com/v2",
61
- "ernie-4.5-turbo-vl-preview": "https://qianfan.baidubce.com/v2",
62
- "ernie-4.5-vl-28b-a3b": "https://qianfan.baidubce.com/v2"
63
  }""",
64
  help="""JSON string defining model name to endpoint mappings.
65
  Required Format:
66
  {"model_name": "http://localhost:port/v1", ...}
67
 
68
  Note:
 
69
  - All endpoints must be valid HTTP URLs
70
  - At least one model must be specified
71
- - Prefix determines model capabilities:
72
  * ERNIE-4.5[-*]: Text-only model
73
  * ERNIE-4.5-VL[-*]: Multimodal models (image+text)
74
  """,
75
  )
 
76
 
77
  args = parser.parse_args()
78
  try:
@@ -82,7 +107,20 @@ def get_args() -> argparse.Namespace:
82
  if len(args.model_map) < 1:
83
  raise ValueError("model_map must contain at least one model configuration")
84
  except json.JSONDecodeError as e:
85
- raise ValueError("Invalid JSON format for --model-map") from e
 
 
 
 
 
 
 
 
 
 
 
 
 
86
 
87
  return args
88
 
@@ -132,6 +170,7 @@ class GradioEvents:
132
  max_tokens: int,
133
  temperature: float,
134
  top_p: float,
 
135
  bot_client: BotClient,
136
  ) -> str:
137
  """
@@ -150,6 +189,7 @@ class GradioEvents:
150
  max_tokens (int): Maximum tokens.
151
  temperature (float): Temperature.
152
  top_p (float): Top p.
 
153
  bot_client (BotClient): Bot client.
154
 
155
  Yields:
@@ -181,6 +221,7 @@ class GradioEvents:
181
 
182
  try:
183
  req_data = {"messages": conversation}
 
184
  for chunk in bot_client.process_stream(model_name, req_data, max_tokens, temperature, top_p):
185
  if "error" in chunk:
186
  raise Exception(chunk["error"])
@@ -206,6 +247,7 @@ class GradioEvents:
206
  max_tokens: int,
207
  temperature: float,
208
  top_p: float,
 
209
  bot_client: BotClient,
210
  ) -> list:
211
  """
@@ -225,6 +267,7 @@ class GradioEvents:
225
  max_tokens (int): The maximum token length of the generated response.
226
  temperature (float): The temperature parameter used by the model.
227
  top_p (float): The top_p parameter used by the model.
 
228
  bot_client (BotClient): The bot client.
229
 
230
  Returns:
@@ -238,7 +281,17 @@ class GradioEvents:
238
  yield chatbot
239
 
240
  new_texts = GradioEvents.chat_stream(
241
- query, task_history, image_history, model, file_url, system_msg, max_tokens, temperature, top_p, bot_client
 
 
 
 
 
 
 
 
 
 
242
  )
243
 
244
  response = ""
@@ -268,6 +321,7 @@ class GradioEvents:
268
  max_tokens: int,
269
  temperature: float,
270
  top_p: float,
 
271
  bot_client: BotClient,
272
  ) -> list:
273
  """
@@ -285,6 +339,7 @@ class GradioEvents:
285
  max_tokens (int): The maximum token length of the generated response.
286
  temperature (float): The temperature parameter used by the model.
287
  top_p (float): The top_p parameter used by the model.
 
288
  bot_client (BotClient): The bot client.
289
 
290
  Yields:
@@ -312,6 +367,7 @@ class GradioEvents:
312
  max_tokens,
313
  temperature,
314
  top_p,
 
315
  bot_client,
316
  )
317
 
@@ -365,7 +421,7 @@ class GradioEvents:
365
  Returns:
366
  gr.update: An update object representing the visibility of the file button.
367
  """
368
- return gr.update(visible='vl' in model_name) # file_btn
369
 
370
 
371
  def launch_demo(args: argparse.Namespace, bot_client: BotClient):
@@ -377,6 +433,11 @@ def launch_demo(args: argparse.Namespace, bot_client: BotClient):
377
  bot_client (BotClient): Bot client instance
378
  """
379
  css = """
 
 
 
 
 
380
  /* Hide original Chinese text */
381
  #file-upload .wrap {
382
  font-size: 0 !important;
@@ -404,12 +465,20 @@ def launch_demo(args: argparse.Namespace, bot_client: BotClient):
404
  )
405
  gr.Markdown(
406
  """\
 
 
 
 
 
 
 
 
407
  <center><font size=3>This demo is based on ERNIE models. \
408
  (本演示基于文心大模型实现。)</center>"""
409
  )
410
 
411
  chatbot = gr.Chatbot(label="ERNIE", elem_classes="control-height", type="messages")
412
- model_names = list(args.model_map.keys())
413
  with gr.Row():
414
  model_name = gr.Dropdown(
415
  label="Select Model", choices=model_names, value=model_names[0], allow_custom_value=True
@@ -418,7 +487,7 @@ def launch_demo(args: argparse.Namespace, bot_client: BotClient):
418
  label="Image upload (Active only for multimodal models. Accepted formats: PNG, JPEG, JPG)",
419
  height="80px",
420
  visible=True,
421
- file_types=[".png", ".jpeg", "jpg"],
422
  elem_id="file-upload",
423
  )
424
  query = gr.Textbox(label="Input", elem_id="text_input")
@@ -444,8 +513,12 @@ def launch_demo(args: argparse.Namespace, bot_client: BotClient):
444
  model_name.change(
445
  GradioEvents.reset_state, outputs=[chatbot, task_history, image_history, file_btn], show_progress=True
446
  )
447
- predict_with_clients = partial(GradioEvents.predict_stream, bot_client=bot_client)
448
- regenerate_with_clients = partial(GradioEvents.regenerate, bot_client=bot_client)
 
 
 
 
449
  query.submit(
450
  predict_with_clients,
451
  inputs=[query, chatbot, task_history, image_history, model_name, file_btn] + additional_inputs,
 
51
  parser.add_argument("--server-name", type=str, default="0.0.0.0", help="Demo server name.")
52
  parser.add_argument("--max_char", type=int, default=8000, help="Maximum character limit for messages.")
53
  parser.add_argument("--max_retry_num", type=int, default=3, help="Maximum retry number for request.")
54
+ parser.add_argument(
55
+ "--model_name_map",
56
+ type=str,
57
+ default="""{
58
+ "ERNIE-4.5-300B-A47B": "ernie-4.5-turbo-128k-preview",
59
+ "ERNIE-4.5-21B-A3B": "ernie-4.5-21b-a3b",
60
+ "ERNIE-4.5-0.3B": "ernie-4.5-0.3b",
61
+ "ERNIE-4.5-VL-424B-A47B": "ernie-4.5-turbo-vl-preview",
62
+ "ERNIE-4.5-VL-28B-A3B": "ernie-4.5-vl-28b-a3b"
63
+ }""",
64
+ help="""JSON string defining model name to internal name mappings.
65
+ Required Format:
66
+ {"model_name": "internal_model_name", ...}
67
+
68
+ Note:
69
+ - When specified, model_name must exist in model_map
70
+ - All names must be unique
71
+ - Defaults to the built-in mapping above if not provided
72
+ - model_name MUST follow prefix rules:
73
+ * ERNIE-4.5[-*]: Text-only model
74
+ * ERNIE-4.5-VL[-*]: Multimodal models (image+text)
75
+ """,
76
+ )
77
  parser.add_argument(
78
  "--model_map",
79
  type=str,
80
  default="""{
81
+ "ERNIE-4.5-300B-A47B": "https://qianfan.baidubce.com/v2",
82
+ "ERNIE-4.5-21B-A3B": "https://qianfan.baidubce.com/v2",
83
+ "ERNIE-4.5-0.3B": "https://qianfan.baidubce.com/v2",
84
+ "ERNIE-4.5-VL-424B-A47B": "https://qianfan.baidubce.com/v2",
85
+ "ERNIE-4.5-VL-28B-A3B": "https://qianfan.baidubce.com/v2"
86
  }""",
87
  help="""JSON string defining model name to endpoint mappings.
88
  Required Format:
89
  {"model_name": "http://localhost:port/v1", ...}
90
 
91
  Note:
92
+ - When specified, model_name must exist in model_name_map
93
  - All endpoints must be valid HTTP URLs
94
  - At least one model must be specified
95
+ - model_name MUST follow prefix rules:
96
  * ERNIE-4.5[-*]: Text-only model
97
  * ERNIE-4.5-VL[-*]: Multimodal models (image+text)
98
  """,
99
  )
100
+ parser.add_argument("--api_key", type=str, default="bce-v3/xxx", help="Model service API key.")
101
 
102
  args = parser.parse_args()
103
  try:
 
107
  if len(args.model_map) < 1:
108
  raise ValueError("model_map must contain at least one model configuration")
109
  except json.JSONDecodeError as e:
110
+ raise ValueError("Invalid JSON format for --model_map") from e
111
+
112
+ try:
113
+ args.model_name_map = json.loads(args.model_name_map)
114
+ except json.JSONDecodeError as e:
115
+ raise ValueError("Invalid JSON format for --model_name_map") from e
116
+
117
+ if args.model_name_map:
118
+ for model_name in list(args.model_map.keys()):
119
+ internal_model = args.model_name_map.get(model_name, model_name)
120
+ args.model_map[internal_model] = args.model_map.pop(model_name)
121
+ else:
122
+ for key in args.model_map:
123
+ args.model_name_map[key] = key
124
 
125
  return args
126
 
 
170
  max_tokens: int,
171
  temperature: float,
172
  top_p: float,
173
+ model_name_map: dict,
174
  bot_client: BotClient,
175
  ) -> str:
176
  """
 
189
  max_tokens (int): Maximum tokens.
190
  temperature (float): Temperature.
191
  top_p (float): Top p.
192
+ model_name_map (dict): Model name map.
193
  bot_client (BotClient): Bot client.
194
 
195
  Yields:
 
221
 
222
  try:
223
  req_data = {"messages": conversation}
224
+ model_name = model_name_map.get(model_name, model_name)
225
  for chunk in bot_client.process_stream(model_name, req_data, max_tokens, temperature, top_p):
226
  if "error" in chunk:
227
  raise Exception(chunk["error"])
 
247
  max_tokens: int,
248
  temperature: float,
249
  top_p: float,
250
+ model_name_map: dict,
251
  bot_client: BotClient,
252
  ) -> list:
253
  """
 
267
  max_tokens (int): The maximum token length of the generated response.
268
  temperature (float): The temperature parameter used by the model.
269
  top_p (float): The top_p parameter used by the model.
270
+ model_name_map (dict): The model name map.
271
  bot_client (BotClient): The bot client.
272
 
273
  Returns:
 
281
  yield chatbot
282
 
283
  new_texts = GradioEvents.chat_stream(
284
+ query,
285
+ task_history,
286
+ image_history,
287
+ model,
288
+ file_url,
289
+ system_msg,
290
+ max_tokens,
291
+ temperature,
292
+ top_p,
293
+ model_name_map,
294
+ bot_client,
295
  )
296
 
297
  response = ""
 
321
  max_tokens: int,
322
  temperature: float,
323
  top_p: float,
324
+ model_name_map: dict,
325
  bot_client: BotClient,
326
  ) -> list:
327
  """
 
339
  max_tokens (int): The maximum token length of the generated response.
340
  temperature (float): The temperature parameter used by the model.
341
  top_p (float): The top_p parameter used by the model.
342
+ model_name_map (dict): The model name map.
343
  bot_client (BotClient): The bot client.
344
 
345
  Yields:
 
367
  max_tokens,
368
  temperature,
369
  top_p,
370
+ model_name_map,
371
  bot_client,
372
  )
373
 
 
421
  Returns:
422
  gr.update: An update object representing the visibility of the file button.
423
  """
424
+ return gr.update(visible=model_name.upper().startswith(MULTI_MODEL_PREFIX)) # file_btn
425
 
426
 
427
  def launch_demo(args: argparse.Namespace, bot_client: BotClient):
 
433
  bot_client (BotClient): Bot client instance
434
  """
435
  css = """
436
+ #file-upload {
437
+ height: 90px !important;
438
+ min-height: 90px !important;
439
+ max-height: 90px !important;
440
+ }
441
  /* Hide original Chinese text */
442
  #file-upload .wrap {
443
  font-size: 0 !important;
 
465
  )
466
  gr.Markdown(
467
  """\
468
+ <center><font size=3> <a href="https://ernie.baidu.com/">ERNIE Bot</a> | \
469
+ <a href="https://github.com/PaddlePaddle/ERNIE">GitHub</a> | \
470
+ <a href="https://huggingface.co/baidu">Hugging Face</a> | \
471
+ <a href="https://aistudio.baidu.com/modelsoverview">BAIDU AI Studio</a> | \
472
+ <a href="https://yiyan.baidu.com/blog/publication/">Technical Report</a></center>"""
473
+ )
474
+ gr.Markdown(
475
+ """\
476
  <center><font size=3>This demo is based on ERNIE models. \
477
  (本演示基于文心大模型实现。)</center>"""
478
  )
479
 
480
  chatbot = gr.Chatbot(label="ERNIE", elem_classes="control-height", type="messages")
481
+ model_names = list(args.model_name_map.keys())
482
  with gr.Row():
483
  model_name = gr.Dropdown(
484
  label="Select Model", choices=model_names, value=model_names[0], allow_custom_value=True
 
487
  label="Image upload (Active only for multimodal models. Accepted formats: PNG, JPEG, JPG)",
488
  height="80px",
489
  visible=True,
490
+ file_types=[".png", ".jpeg", ".jpg"],
491
  elem_id="file-upload",
492
  )
493
  query = gr.Textbox(label="Input", elem_id="text_input")
 
513
  model_name.change(
514
  GradioEvents.reset_state, outputs=[chatbot, task_history, image_history, file_btn], show_progress=True
515
  )
516
+ predict_with_clients = partial(
517
+ GradioEvents.predict_stream, model_name_map=args.model_name_map, bot_client=bot_client
518
+ )
519
+ regenerate_with_clients = partial(
520
+ GradioEvents.regenerate, model_name_map=args.model_name_map, bot_client=bot_client
521
+ )
522
  query.submit(
523
  predict_with_clients,
524
  inputs=[query, chatbot, task_history, image_history, model_name, file_btn] + additional_inputs,