elfsong committed on
Commit
2b717f1
·
1 Parent(s): c5dc144

refactor: Simplify bot_response function by improving message handling and UI updates for user interactions.

Browse files
Files changed (1) hide show
  1. app.py +17 -19
app.py CHANGED
@@ -8,31 +8,28 @@ MODELS = [
8
 
9
  def bot_response(user_message, history, model_name, system_message, max_tokens, temperature, top_p, oauth_token: gr.OAuthToken | None):
10
  if not user_message:
11
- yield history
12
  return
13
 
14
- # 获取 Token (如果是本地运行,请确保已登录 HF)
15
  token = oauth_token.token if oauth_token else None
16
- if not token:
17
- history.append({"role": "assistant", "content": "⚠️ 请先在侧边栏登录 Hugging Face。"})
18
- yield history
19
- return
20
-
21
- # 初始化客户端
22
  client = InferenceClient(token=token, model=model_name)
23
 
24
- # 构建消息列表:系统提示词 + 历史记录 + 当前用户输入
25
- messages = [{"role": "system", "content": system_message}] + history + [{"role": "user", "content": user_message}]
 
26
 
27
- # UI 更新:先在界面显示用户发送的消息
28
- history.append({"role": "user", "content": user_message})
29
- history.append({"role": "assistant", "content": ""})
30
- yield history, "" # 返回 history 更新 UI,并清空对应的输入框
 
 
 
31
 
32
  try:
33
  response_text = ""
34
  stream = client.chat_completion(
35
- messages,
36
  max_tokens=max_tokens,
37
  stream=True,
38
  temperature=temperature,
@@ -42,12 +39,13 @@ def bot_response(user_message, history, model_name, system_message, max_tokens,
42
  for chunk in stream:
43
  token_content = chunk.choices[0].delta.content or ""
44
  response_text += token_content
45
- history[-1]["content"] = response_text
46
- yield history, "" # 持续流式输出
 
47
 
48
  except Exception as e:
49
- history[-1]["content"] = f"**Error:** {str(e)}"
50
- yield history, ""
51
 
52
  with gr.Blocks() as demo:
53
  with gr.Sidebar():
 
8
 
9
  def bot_response(user_message, history, model_name, system_message, max_tokens, temperature, top_p, oauth_token: gr.OAuthToken | None):
10
  if not user_message:
11
+ yield history, ""
12
  return
13
 
 
14
  token = oauth_token.token if oauth_token else None
 
 
 
 
 
 
15
  client = InferenceClient(token=token, model=model_name)
16
 
17
+ # 1. 构造发送给 API 的消息序列
18
+ # 注意:history Gradio 6 中已经是 [{"role": "...", "content": "..."}] 格式
19
+ api_messages = [{"role": "system", "content": system_message}] + history + [{"role": "user", "content": user_message}]
20
 
21
+ # 2. 更新 UI 的历史记录
22
+ # 先添加用户的消息,再添加一个空的助手消息用于流式占位
23
+ new_history = history + [
24
+ {"role": "user", "content": user_message},
25
+ {"role": "assistant", "content": ""}
26
+ ]
27
+ yield new_history, "" # 立即更新 UI 显示用户消息
28
 
29
  try:
30
  response_text = ""
31
  stream = client.chat_completion(
32
+ api_messages,
33
  max_tokens=max_tokens,
34
  stream=True,
35
  temperature=temperature,
 
39
  for chunk in stream:
40
  token_content = chunk.choices[0].delta.content or ""
41
  response_text += token_content
42
+ # 更新最后一条消息的内容
43
+ new_history[-1]["content"] = response_text
44
+ yield new_history, ""
45
 
46
  except Exception as e:
47
+ new_history[-1]["content"] = f"**Error:** {str(e)}"
48
+ yield new_history, ""
49
 
50
  with gr.Blocks() as demo:
51
  with gr.Sidebar():