Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -177,13 +177,9 @@ def export_chat_history(history):
|
|
| 177 |
export = {
|
| 178 |
"exported_at": datetime.now().isoformat(),
|
| 179 |
"tool": "Axon v6 Chat",
|
| 180 |
-
"messages":
|
| 181 |
}
|
| 182 |
|
| 183 |
-
for user_msg, assistant_msg in history:
|
| 184 |
-
export["messages"].append({"role": "user", "content": user_msg})
|
| 185 |
-
export["messages"].append({"role": "assistant", "content": assistant_msg})
|
| 186 |
-
|
| 187 |
filename = f"/tmp/axon_chat_{datetime.now().strftime('%Y%m%d_%H%M%S')}.json"
|
| 188 |
with open(filename, "w") as f:
|
| 189 |
json.dump(export, f, indent=2)
|
|
@@ -209,41 +205,62 @@ def export_code(code, language):
|
|
| 209 |
|
| 210 |
return filename, f"✅ Exported as .{ext}!"
|
| 211 |
|
| 212 |
-
# ===== STREAMING =====
|
| 213 |
|
| 214 |
def chat_stream(message, history, model_name, temperature, max_tokens):
|
|
|
|
|
|
|
|
|
|
| 215 |
valid, error = validate_input(message, "Message")
|
| 216 |
if not valid:
|
| 217 |
-
|
|
|
|
|
|
|
|
|
|
| 218 |
return
|
| 219 |
|
| 220 |
llm = load_model(model_name)
|
| 221 |
if not llm:
|
| 222 |
-
|
|
|
|
|
|
|
| 223 |
return
|
| 224 |
|
|
|
|
| 225 |
if "deepseek" in model_name.lower():
|
| 226 |
conv = "### Instruction:\nYou are an expert coding assistant. Use markdown code blocks.\n\n"
|
| 227 |
-
for
|
| 228 |
-
|
|
|
|
|
|
|
|
|
|
| 229 |
conv += f"User: {message}\n\n### Response:\n"
|
| 230 |
stop_tokens = ["### Instruction:", "User:"]
|
| 231 |
else:
|
| 232 |
conv = "<|im_start|>system\nYou are an expert coding assistant. Use markdown code blocks.<|im_end|>\n"
|
| 233 |
-
for
|
| 234 |
-
|
| 235 |
-
|
| 236 |
-
|
| 237 |
conv += f"<|im_start|>user\n{message}<|im_end|>\n<|im_start|>assistant\n"
|
| 238 |
stop_tokens = ["<|im_end|>", "<|im_start|>"]
|
| 239 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 240 |
try:
|
| 241 |
full = ""
|
| 242 |
for chunk in llm(conv, max_tokens=max_tokens, temperature=temperature, top_p=0.9, stop=stop_tokens, stream=True):
|
| 243 |
-
|
| 244 |
-
|
|
|
|
|
|
|
|
|
|
| 245 |
except Exception as e:
|
| 246 |
-
|
|
|
|
| 247 |
|
| 248 |
def generate_stream(prompt, language, model_name, temperature, max_tokens):
|
| 249 |
valid, error = validate_input(prompt, "Description")
|
|
@@ -573,7 +590,7 @@ with gr.Blocks(title="Axon v6", theme=dark_theme) as demo:
|
|
| 573 |
|
| 574 |
# ===== CHAT =====
|
| 575 |
with gr.TabItem("💬 Chat"):
|
| 576 |
-
chatbot = gr.Chatbot(height=400, type="
|
| 577 |
with gr.Row():
|
| 578 |
msg = gr.Textbox(placeholder="Ask anything...", show_label=False, scale=8)
|
| 579 |
send = gr.Button("Send", variant="primary", scale=1)
|
|
@@ -812,7 +829,7 @@ with gr.Blocks(title="Axon v6", theme=dark_theme) as demo:
|
|
| 812 |
# ===== EVENTS =====
|
| 813 |
|
| 814 |
def respond(message, history, model, temp, tokens):
|
| 815 |
-
|
| 816 |
for updated in chat_stream(message, history, model, temp, tokens):
|
| 817 |
yield updated, ""
|
| 818 |
|
|
|
|
| 177 |
export = {
|
| 178 |
"exported_at": datetime.now().isoformat(),
|
| 179 |
"tool": "Axon v6 Chat",
|
| 180 |
+
"messages": history # Direct dump for Gradio 5 format
|
| 181 |
}
|
| 182 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 183 |
filename = f"/tmp/axon_chat_{datetime.now().strftime('%Y%m%d_%H%M%S')}.json"
|
| 184 |
with open(filename, "w") as f:
|
| 185 |
json.dump(export, f, indent=2)
|
|
|
|
| 205 |
|
| 206 |
return filename, f"✅ Exported as .{ext}!"
|
| 207 |
|
| 208 |
+
# ===== STREAMING (UPDATED FOR GRADIO 5) =====
|
| 209 |
|
| 210 |
def chat_stream(message, history, model_name, temperature, max_tokens):
    """Stream an assistant reply for *message*, yielding Gradio-5 style history.

    history is a list of {"role", "content"} dicts (Chatbot ``type="messages"``
    format) and may arrive as None. The full history list is yielded after
    every streamed token so the UI can repaint incrementally.
    """
    # Gradio 5 sometimes hands us None on first load.
    history = history if history else []

    valid, error = validate_input(message, "Message")
    if not valid:
        # Surface the validation failure inline as an assistant turn.
        history += [
            {"role": "user", "content": message},
            {"role": "assistant", "content": error},
        ]
        yield history
        return

    llm = load_model(model_name)
    if not llm:
        history += [
            {"role": "user", "content": message},
            {"role": "assistant", "content": "❌ Model not available."},
        ]
        yield history
        return

    # Render the dict-based history into the model's native prompt format.
    if "deepseek" in model_name.lower():
        parts = ["### Instruction:\nYou are an expert coding assistant. Use markdown code blocks.\n\n"]
        for turn in history:
            if turn['role'] == 'user':
                parts.append(f"User: {turn['content']}\n")
            else:
                parts.append(f"Assistant: {turn['content']}\n\n")
        parts.append(f"User: {message}\n\n### Response:\n")
        stop_tokens = ["### Instruction:", "User:"]
    else:
        # ChatML-style prompt for non-DeepSeek models.
        parts = ["<|im_start|>system\nYou are an expert coding assistant. Use markdown code blocks.<|im_end|>\n"]
        for turn in history:
            parts.append(f"<|im_start|>{turn['role']}\n{turn['content']}<|im_end|>\n")
        parts.append(f"<|im_start|>user\n{message}<|im_end|>\n<|im_start|>assistant\n")
        stop_tokens = ["<|im_end|>", "<|im_start|>"]
    conv = "".join(parts)

    # Record the new user turn plus an empty assistant turn we will fill in.
    history += [
        {"role": "user", "content": message},
        {"role": "assistant", "content": ""},
    ]

    try:
        full = ""
        for chunk in llm(conv, max_tokens=max_tokens, temperature=temperature, top_p=0.9, stop=stop_tokens, stream=True):
            full += chunk["choices"][0]["text"]
            # Grow the trailing assistant message token by token.
            history[-1]['content'] = full
            yield history
    except Exception as e:
        # UI boundary: show a truncated error message instead of crashing.
        history[-1]['content'] = f"❌ Error: {str(e)[:100]}"
        yield history
| 264 |
|
| 265 |
def generate_stream(prompt, language, model_name, temperature, max_tokens):
|
| 266 |
valid, error = validate_input(prompt, "Description")
|
|
|
|
| 590 |
|
| 591 |
    # ===== CHAT =====
    with gr.TabItem("💬 Chat"):
        # type="messages" selects Gradio 5's dict-based history format
        # ({"role": ..., "content": ...}), matching what chat_stream yields.
        chatbot = gr.Chatbot(height=400, type="messages")
        with gr.Row():
            # Wide input next to a narrow send button (8:1 width ratio).
            msg = gr.Textbox(placeholder="Ask anything...", show_label=False, scale=8)
            send = gr.Button("Send", variant="primary", scale=1)
|
|
|
|
| 829 |
# ===== EVENTS =====
|
| 830 |
|
| 831 |
def respond(message, history, model, temp, tokens):
    """Gradio event handler: relay chat_stream updates and clear the input box.

    Yields (updated_history, "") pairs — the empty string resets the message
    textbox on every streamed update. Gradio 5 tracks history state itself.
    """
    yield from (
        (updated, "")
        for updated in chat_stream(message, history, model, temp, tokens)
    )
|
| 835 |
|