Spaces:

Datangtang
/

iris

Sleeping

App Files Files Community

Datangtang committed on Dec 4, 2025

Commit

d658b72

verified ·

1 Parent(s): 654c34c

继续修改bug，没有回复

Browse files

Files changed (1) hide show

app.py +33 -54

app.py CHANGED Viewed

@@ -6,7 +6,7 @@ import os
 # ----------------------------------------
 # Global model cache
 # ----------------------------------------
-loaded_models = {}   # Cache loaded Llama models
 current_model_name = None
 MODEL_CONFIGS = {
@@ -15,7 +15,7 @@ MODEL_CONFIGS = {
         "filename": "llama-3.2-1b-instruct.Q4_K_M.gguf"
     },
     "3B Model (Datangtang/GGUF3B)": {
-        "repo_id": "Datangtang/GGUF3B",   # FIXED typo here
         "filename": "llama-3.2-3b-instruct.Q4_K_M.gguf"
     }
 }
@@ -27,13 +27,9 @@ MODEL_CONFIGS = {
 def load_model(model_choice):
     global loaded_models, current_model_name
-    # Use cache
     if model_choice in loaded_models:
-        print(f"Reusing already loaded model: {model_choice}")
-        current_model_name = model_choice
         return loaded_models[model_choice]
-    print(f"Downloading model: {model_choice}")
     cfg = MODEL_CONFIGS[model_choice]
     model_path = hf_hub_download(
@@ -43,9 +39,6 @@ def load_model(model_choice):
         token=os.environ["HF_TOKEN"]
     )
-    print(f"Model downloaded to: {model_path}")
-    print("Loading GGUF model into memory...")
     llm = Llama(
         model_path=model_path,
         n_ctx=1024,
@@ -59,29 +52,31 @@ def load_model(model_choice):
     loaded_models[model_choice] = llm
     current_model_name = model_choice
-    print("Model loaded successfully!")
     return llm
 # ----------------------------------------
-# Chat function (works with Chatbot)
 # ----------------------------------------
-def chat(message, history, model_choice):
     llm = load_model(model_choice)
-    # Build conversation string
     conversation = "System: You are a helpful assistant.\n"
-    # Handle Chatbot list-of-lists format
-    for human, assistant in history[-3:]:
-        conversation += f"User: {human}\n"
-        if assistant:
-            conversation += f"Assistant: {assistant}\n"
-    conversation += f"User: {message}\nAssistant:"
-    # Call model
     response = llm(
         conversation,
         max_tokens=128,
@@ -89,60 +84,44 @@ def chat(message, history, model_choice):
         top_p=0.9,
         top_k=40,
         repeat_penalty=1.1,
-        stop=["User:", "Assistant:"],
-        echo=False,
     )
     return response["choices"][0]["text"].strip()
 # ----------------------------------------
-# Gradio UI (Blocks + Chatbot)
 # ----------------------------------------
 with gr.Blocks() as demo:
-    gr.Markdown("# 🦙 Datangtang GGUF Model Demo")
-    gr.Markdown("Switch between **1B** and **3B** GGUF models in real-time.")
-    # Dropdown for model selection
     model_choice = gr.Dropdown(
         label="Select Model",
         choices=list(MODEL_CONFIGS.keys()),
         value="1B Model (Datangtang/GGUF1B)",
     )
-    chatbot = gr.Chatbot()
-    msg_box = gr.Textbox(label="Type your message:")
-    # Add user message to chatbot
-    def user_send(message, history):
-        history = history + [[message, None]]
-        return history, ""
-    # Generate bot reply
-    def bot_reply(history, model_name):
-        user_msg = history[-1][0]
-        bot_msg = chat(user_msg, history[:-1], model_name)
-        history[-1][1] = bot_msg
-        return history
-    # Wire functions
     msg_box.submit(
-        user_send,
-        [msg_box, chatbot],
-        [chatbot, msg_box]
     ).then(
-        bot_reply,
-        [chatbot, model_choice],
-        chatbot
-    )
-    model_choice.change(
-        fn=lambda x: f"🔄 Switched to: {x}",
-        inputs=[model_choice],
-        outputs=[],
     )
-if __name__ == "__main__":
-    demo.launch()

 # ----------------------------------------
 # Global model cache
 # ----------------------------------------
+loaded_models = {}
 current_model_name = None
 MODEL_CONFIGS = {
         "filename": "llama-3.2-1b-instruct.Q4_K_M.gguf"
     },
     "3B Model (Datangtang/GGUF3B)": {
+        "repo_id": "Datangtang/GGUF3B",
         "filename": "llama-3.2-3b-instruct.Q4_K_M.gguf"
     }
 }
 def load_model(model_choice):
     global loaded_models, current_model_name
     if model_choice in loaded_models:
         return loaded_models[model_choice]
     cfg = MODEL_CONFIGS[model_choice]
     model_path = hf_hub_download(
         token=os.environ["HF_TOKEN"]
     )
     llm = Llama(
         model_path=model_path,
         n_ctx=1024,
     loaded_models[model_choice] = llm
     current_model_name = model_choice
     return llm
 # ----------------------------------------
+# Chat function (Gradio 4.x message format)
 # ----------------------------------------
+def chat(messages, model_choice):
     llm = load_model(model_choice)
+    # Construct conversation
     conversation = "System: You are a helpful assistant.\n"
+    for msg in messages[-3:]:
+        role = msg["role"]
+        text = msg["content"]
+        if role == "user":
+            conversation += f"User: {text}\n"
+        elif role == "assistant":
+            conversation += f"Assistant: {text}\n"
+    conversation += "Assistant:"
+    # LLM output
     response = llm(
         conversation,
         max_tokens=128,
         top_p=0.9,
         top_k=40,
         repeat_penalty=1.1,
+        stop=["User:", "Assistant:"]
     )
     return response["choices"][0]["text"].strip()
 # ----------------------------------------
+# Gradio UI (Gradio 4.x messages format)
 # ----------------------------------------
 with gr.Blocks() as demo:
+    gr.Markdown("# 🦙 Datangtang GGUF Model Demo (Gradio 4.x Compatible)")
     model_choice = gr.Dropdown(
         label="Select Model",
         choices=list(MODEL_CONFIGS.keys()),
         value="1B Model (Datangtang/GGUF1B)",
     )
+    chatbot = gr.Chatbot(label="Chat", type="messages")
+    msg_box = gr.Textbox(label="Message")
+    # User sends message
+    def add_user_message(user_msg, messages):
+        messages = messages + [{"role": "user", "content": user_msg}]
+        return messages, ""
+    # Bot replies
+    def add_bot_reply(messages, model_choice):
+        reply = chat(messages, model_choice)
+        messages = messages + [{"role": "assistant", "content": reply}]
+        return messages
     msg_box.submit(
+        add_user_message, [msg_box, chatbot], [chatbot, msg_box]
     ).then(
+        add_bot_reply, [chatbot, model_choice], chatbot
     )
+demo.launch()