Update app.py
app.py CHANGED
@@ -6,35 +6,32 @@ from huggingface_hub import InferenceClient
 model_id = "Qwen/Qwen2.5-Coder-32B-Instruct"
 
 def respond(message, history, system_message, temperature, request: gr.Request):
+    # --- 1. Authentication Logic ---
     token = None
-
-    # 1. Safely try to get the user's token (works on HF Spaces if logged in)
+    # Safely access token (handles both Local run and Spaces)
     if request:
-        # We use getattr() to avoid the "AttributeError" if running locally
         token = getattr(request, "token", None)
 
-    # 2. If no user token, fall back to the Space's secret token (HF_TOKEN)
     if token is None:
         token = os.getenv("HF_TOKEN")
 
-    # 3. If still no token, stop.
     if token is None:
-        yield "Error: No authentication token found. Please add 'HF_TOKEN' to Space Secrets"
+        yield "Error: No authentication token found. Please add 'HF_TOKEN' to Space Secrets."
         return
 
-    #
+    # --- 2. Setup Client ---
     client = InferenceClient(model_id, token=token)
 
-    # Build
+    # --- 3. Build Messages (handling history correctly) ---
     messages = [{"role": "system", "content": system_message}]
 
-    #
-    for user_msg, bot_msg in history:
-        messages.append({"role": "user", "content": user_msg})
-        messages.append({"role": "assistant", "content": bot_msg})
+    # We use type="messages" in ChatInterface, so history is already a list of dicts
+    for msg in history:
+        messages.append(msg)
 
     messages.append({"role": "user", "content": message})
 
+    # --- 4. Generate Response ---
     try:
         stream = client.chat_completion(
             messages,
@@ -43,15 +40,22 @@ def respond(message, history, system_message, temperature, request: gr.Request):
             temperature=temperature,
             top_p=0.9
         )
+
         response_text = ""
         for chunk in stream:
+            # FIX: Check if choices exist before accessing index [0]
+            if not chunk.choices:
+                continue
+
             content = chunk.choices[0].delta.content
             if content:
                 response_text += content
                 yield response_text
+
     except Exception as e:
         yield f"Error: {str(e)}"
 
+# --- 5. Build UI ---
 with gr.Blocks(fill_height=True) as demo:
     with gr.Sidebar():
         gr.Markdown("# AI Coding Assistant")
@@ -60,6 +64,8 @@ with gr.Blocks(fill_height=True) as demo:
 
     gr.ChatInterface(
         respond,
+        # 'type="messages"' fixes the deprecation warning and makes parsing easier
+        type="messages",
         additional_inputs=[
             gr.Textbox(value="You are a helpful assistant.", label="System Instruction", lines=2),
             gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature")
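
For context on the history change above: with type="messages", Gradio passes respond the chat history as a list of role/content dictionaries rather than the older (user, bot) tuple pairs, so the loop can forward each entry to chat_completion unchanged. Below is a minimal sketch of that message-building step; the example turns are invented for illustration and are not taken from this Space.

# Illustrative only: example turns are made up, not from the commit.
system_message = "You are a helpful assistant."
message = "Now add a docstring."

# Old default (tuple) history looked like: [("user text", "bot reply"), ...]
# With type="messages", history already arrives in chat-completion format:
history = [
    {"role": "user", "content": "Write hello world in Python."},
    {"role": "assistant", "content": 'print("hello world")'},
]

messages = [{"role": "system", "content": system_message}]
for msg in history:
    messages.append(msg)  # each entry is already {"role": ..., "content": ...}
messages.append({"role": "user", "content": message})

# messages now holds [system, user, assistant, user], ready for client.chat_completion(...)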