Spaces:

Datangtang
/

iris

Sleeping

App Files Community

Datangtang committed on Dec 4, 2025

Commit

f19f181

verified ·

1 Parent(s): c55e754

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -25

app.py CHANGED Viewed

@@ -3,13 +3,10 @@ import gradio as gr
 from huggingface_hub import hf_hub_download
 from llama_cpp import Llama
-print("Gradio version:", gr.__version__)
-# ============ 环境变量中读取 token ==============
 HF_TOKEN = os.environ.get("HF_Token")
-# ============ 模型配置 ==============
 REPO_ID = "Datangtang/GGUF3B"
 FILE_NAME = "llama-3.2-3b-instruct.Q4_K_M.gguf"
@@ -20,7 +17,7 @@ model_path = hf_hub_download(
     token=HF_TOKEN
 )
-# 加载模型（llama_cpp）
 llm = Llama(
     model_path=model_path,
     n_ctx=4096,
@@ -28,44 +25,45 @@ llm = Llama(
     chat_format="llama-3",
 )
-# ============ 核心对话函数 ==============
-def chat_fn(history, user_input):
     """
-    history: List[{"role": "...", "content": "..."}]
-    user_input: 当前用户的输入
     """
-    # 将用户输入添加到历史
-    history.append({"role": "user", "content": user_input})
-    # 调用 LLM
-    response = llm.create_chat_completion(
-        messages=history,
         max_tokens=512,
         temperature=0.7,
-        top_p=0.95
     )
-    assistant_msg = response["choices"][0]["message"]["content"]
-    # 添加模型回复到历史
-    history.append({"role": "assistant", "content": assistant_msg})
-    return history, ""
-# ============ Gradio 界面 ==============
 with gr.Blocks() as demo:
-    gr.Markdown("# 💬 Chat with Your Finetuned LLM")
-    chatbot = gr.Chatbot(height=500, type="messages")  # ⭐ 注意 type="messages"
-    user_input = gr.Textbox(show_label=False, placeholder="Ask your model...")
     submit = gr.Button("Send")
     submit.click(
         fn=chat_fn,
         inputs=[chatbot, user_input],
-        outputs=[chatbot, user_input]
     )
 if __name__ == "__main__":

 from huggingface_hub import hf_hub_download
 from llama_cpp import Llama
+# ============ 读取 HF Token ==============
 HF_TOKEN = os.environ.get("HF_Token")
+# ============ 模型信息 ==============
 REPO_ID = "Datangtang/GGUF3B"
 FILE_NAME = "llama-3.2-3b-instruct.Q4_K_M.gguf"
     token=HF_TOKEN
 )
+# 加载模型
 llm = Llama(
     model_path=model_path,
     n_ctx=4096,
     chat_format="llama-3",
 )
+# ============ 核心对话函数（Gradio 6 消息格式） ==============
+def chat_fn(messages, user_input):
     """
+    messages: List of {"role": "...", "content": "..."}
+    user_input: 当前用户输入
     """
+    # 添加用户输入
+    messages.append({"role": "user", "content": user_input})
+    # llama_cpp 调用
+    result = llm.create_chat_completion(
+        messages=messages,
         max_tokens=512,
         temperature=0.7,
+        top_p=0.95,
     )
+    bot_reply = result["choices"][0]["message"]["content"]
+    # 添加模型回复
+    messages.append({"role": "assistant", "content": bot_reply})
+    return messages, ""
+# ============ Gradio UI (6.0.2) ==============
 with gr.Blocks() as demo:
+    gr.Markdown("# 💬 Chat with Your Finetuned LLM (Gradio 6)")
+    chatbot = gr.Chatbot(height=500, type="messages")
+    user_input = gr.Textbox(show_label=False, placeholder="Type something...")
     submit = gr.Button("Send")
     submit.click(
         fn=chat_fn,
         inputs=[chatbot, user_input],
+        outputs=[chatbot, user_input],
     )
 if __name__ == "__main__":