Spaces:

beyoru
/

Simple-chatbot

Running

App Files Files Community

beyoru committed on Dec 12, 2025

Commit

8e33e20

verified ·

1 Parent(s): b0da11a

Update app.py

Browse files

Files changed (1) hide show

app.py +233 -42

app.py CHANGED Viewed

@@ -1,11 +1,14 @@
 import os
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM, TextIteratorStreamer
 from threading import Thread
 import gradio as gr
 MODEL_NAME = os.getenv('MODEL_ID')
 TOKEN = os.getenv('TOKEN')
 print("Loading model...")
 tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, trust_remote_code=True, token=TOKEN)
@@ -18,28 +21,132 @@ model = AutoModelForCausalLM.from_pretrained(
 )
 print("Model loaded.")
 def playground(
     message,
     history,
     system_prompt,
     max_new_tokens,
     temperature,
     repetition_penalty,
     top_k,
-    top_p
 ):
     if not isinstance(message, str) or not message.strip():
         yield ""
         return
-    # Build conversation với system prompt
     conversation = []
-    # Thêm system prompt nếu có
     if system_prompt and system_prompt.strip():
         conversation.append({"role": "system", "content": system_prompt.strip()})
-    # Thêm lịch sử chat
     for user_msg, bot_msg in history:
         conversation.append({"role": "user", "content": user_msg})
         if bot_msg:
@@ -47,56 +154,130 @@ def playground(
     conversation.append({"role": "user", "content": message})
-    if hasattr(tokenizer, "apply_chat_template"):
-        prompt = tokenizer.apply_chat_template(conversation, tokenize=False, add_generation_prompt=True)
-    else:
-        prompt = "\n".join([f"{msg['role']}: {msg['content']}" for msg in conversation]) + "\nassistant:"
-    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
-    streamer = TextIteratorStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)
-    generation_kwargs = dict(
-        **inputs,
-        streamer=streamer,
-        max_new_tokens=int(max_new_tokens),
-        temperature=float(temperature),
-        top_k=int(top_k) if top_k > 0 else None,
-        top_p=float(top_p),
-        repetition_penalty=float(repetition_penalty),
-        do_sample=True if temperature > 0 else False,
-        pad_token_id=tokenizer.eos_token_id
-    )
-    thread = Thread(target=model.generate, kwargs=generation_kwargs)
-    thread.start()
     generated_text = ""
-    for new_text in streamer:
-        generated_text += new_text
-        yield generated_text
-    thread.join()
 with gr.Blocks(fill_height=True, fill_width=True) as app:
     with gr.Sidebar():
-        gr.Markdown("## Playground by UltimaX Intelligence")
         gr.HTML("""
         Runs <b><a href="https://huggingface.co/beyoru/Qwen3-0.9B-A0.6B" target="_blank">
-        beyoru/Qwen3-0.9B-A0.6B</a></b> via <b>Hugging Face Transformers</b>.<br><br>
-        <b>Support me at:</b>.<br><br>
         <a href="https://www.buymeacoffee.com/ductransa0g" target="_blank">
             <img src="https://cdn.buymeacoffee.com/buttons/v2/default-yellow.png" alt="Buy Me A Coffee" width="150px">
         </a>
         """)
         gr.Markdown("---")
         gr.Markdown("## System Prompt")
         system_prompt = gr.Textbox(
             label="System Prompt",
-            placeholder="Enter custom system instructions here (optional)...",
             lines=4,
-            value="You are a helpful AI assistant.",
-            info="AI role custome"
         )
         gr.Markdown("---")
@@ -109,16 +290,26 @@ with gr.Blocks(fill_height=True, fill_width=True) as app:
     gr.ChatInterface(
         fn=playground,
-        additional_inputs=[system_prompt, max_new_tokens, temperature, repetition_penalty, top_k, top_p],
         chatbot=gr.Chatbot(
-            label="Qwen3-0.9B-A0.6B",
             show_copy_button=True,
             allow_tags=["think"],
         ),
         examples=[
-            ["Hello who are you?"],
-            ["How to solve 2x+1=3."],
-            ["Example python code for async"]
         ],
         cache_examples=False,
         show_api=False

 import os
+import json
 import torch
+import requests
 from transformers import AutoTokenizer, AutoModelForCausalLM, TextIteratorStreamer
 from threading import Thread
 import gradio as gr
 MODEL_NAME = os.getenv('MODEL_ID')
 TOKEN = os.getenv('TOKEN')
+MCP_URL = "https://beyoru-clone-tools.hf.space/gradio_api/mcp/"
 print("Loading model...")
 tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, trust_remote_code=True, token=TOKEN)
 )
 print("Model loaded.")
+# Define MCP tools schema
+# Function-calling schemas for the remote tools. The list is passed as
+# ``tools=`` to ``tokenizer.apply_chat_template`` when tools are enabled.
+# Every name carries the ``clone_tools_`` prefix, which ``call_mcp_tool``
+# strips to obtain the endpoint under ``MCP_URL``.
+# NOTE: the "default" values below are schema hints only; nothing in this
+# file fills them in before the arguments are sent.
+TOOLS = [
+    # Web search.
+    {
+        "type": "function",
+        "function": {
+            "name": "clone_tools_Web_Search",
+            "description": "Run a DuckDuckGo-backed search across text, news, images, videos, or books.",
+            "parameters": {
+                "type": "object",
+                "properties": {
+                    "query": {"type": "string", "description": "The search query"},
+                    "max_results": {"type": "number", "description": "Number of results to return (1-20)", "default": 5},
+                    "search_type": {"type": "string", "enum": ["text", "news", "images", "videos", "books"], "default": "text"}
+                },
+                "required": ["query"]
+            }
+        }
+    },
+    # Web page fetch.
+    {
+        "type": "function",
+        "function": {
+            "name": "clone_tools_Web_Fetch",
+            "description": "Fetch a webpage and return clean Markdown, raw HTML, or a list of links.",
+            "parameters": {
+                "type": "object",
+                "properties": {
+                    "url": {"type": "string", "description": "The absolute URL to fetch"},
+                    "max_chars": {"type": "number", "description": "Maximum characters to return (0 = no limit)", "default": 0},
+                    "mode": {"type": "string", "enum": ["markdown", "html", "url_scraper"], "default": "markdown"}
+                },
+                "required": ["url"]
+            }
+        }
+    },
+    # Python code execution.
+    {
+        "type": "function",
+        "function": {
+            "name": "clone_tools_Code_Interpreter",
+            "description": "Execute Python code and return the output.",
+            "parameters": {
+                "type": "object",
+                "properties": {
+                    "code": {"type": "string", "description": "Python source code to run"}
+                },
+                "required": ["code"]
+            }
+        }
+    },
+    # Text-to-image generation.
+    {
+        "type": "function",
+        "function": {
+            "name": "clone_tools_Generate_Image",
+            "description": "Generate an image from a text prompt via Hugging Face inference.",
+            "parameters": {
+                "type": "object",
+                "properties": {
+                    "prompt": {"type": "string", "description": "Text description of the image to generate"},
+                    "model_id": {"type": "string", "default": "black-forest-labs/FLUX.1-dev"},
+                    "steps": {"type": "number", "default": 30},
+                    "width": {"type": "number", "default": 1024},
+                    "height": {"type": "number", "default": 1024}
+                },
+                "required": ["prompt"]
+            }
+        }
+    }
+]
+def call_mcp_tool(tool_name, parameters):
+    """Call MCP tool via HTTP endpoint"""
+    try:
+        # MCP endpoint format: tool name without clone_tools_ prefix
+        tool_endpoint = tool_name.replace("clone_tools_", "")
+        url = f"{MCP_URL}{tool_endpoint}"
+        response = requests.post(url, json=parameters, timeout=30)
+        response.raise_for_status()
+        return response.json()
+    except Exception as e:
+        return {"error": str(e)}
+def process_tool_calls(tool_calls):
+    """Process tool calls and return results"""
+    results = []
+    for tool_call in tool_calls:
+        if isinstance(tool_call, dict):
+            func_name = tool_call.get("name")
+            func_args = tool_call.get("arguments", {})
+            if isinstance(func_args, str):
+                try:
+                    func_args = json.loads(func_args)
+                except:
+                    pass
+            result = call_mcp_tool(func_name, func_args)
+            results.append({
+                "tool_call_id": tool_call.get("id", "call_0"),
+                "role": "tool",
+                "name": func_name,
+                "content": json.dumps(result, ensure_ascii=False)
+            })
+    return results
 def playground(
     message,
     history,
     system_prompt,
+    enable_tools,
     max_new_tokens,
     temperature,
     repetition_penalty,
     top_k,
+    top_p,
+    max_tool_iterations
 ):
+    """Stream a chat reply, optionally running tool calls between rounds.
+
+    Generator used as the ``fn`` of ``gr.ChatInterface``; each yielded
+    string is the full text to display so far for the current round.
+
+    Args:
+        message: Latest user message. A non-string or blank value yields ""
+            and ends the generator.
+        history: Earlier turns, iterated as ``(user_msg, bot_msg)`` pairs.
+        system_prompt: Added as a leading system message when non-blank.
+        enable_tools: When truthy, ``TOOLS`` is passed to the chat template
+            and parsed tool calls are executed.
+        max_new_tokens: Forwarded to ``model.generate`` as an int.
+        temperature: Forwarded as a float; sampling is on only when > 0.
+        repetition_penalty: Forwarded as a float.
+        top_k: Forwarded as an int, or ``None`` when not positive.
+        top_p: Forwarded as a float.
+        max_tool_iterations: Upper bound on generation rounds.
+
+    Yields:
+        The accumulated output of the current round, followed by tool
+        status text when a tool call is executed.
+    """
     if not isinstance(message, str) or not message.strip():
         yield ""
         return
+    # Build conversation
     conversation = []
     if system_prompt and system_prompt.strip():
         conversation.append({"role": "system", "content": system_prompt.strip()})
     for user_msg, bot_msg in history:
         conversation.append({"role": "user", "content": user_msg})
         if bot_msg:
     conversation.append({"role": "user", "content": message})
+    # Tool calling loop
+    # Each pass is one generation round; a round that ends in a tool call
+    # appends the results to the conversation and triggers another pass.
+    iteration = 0
     generated_text = ""
+    while iteration < max_tool_iterations:
+        iteration += 1
+        # Apply chat template with tools if enabled
+        # NOTE(review): the else branch calls apply_chat_template without the
+        # hasattr check, so the guard only decides whether tools are passed.
+        if enable_tools and hasattr(tokenizer, "apply_chat_template"):
+            prompt = tokenizer.apply_chat_template(
+                conversation,
+                tools=TOOLS,
+                tokenize=False,
+                add_generation_prompt=True
+            )
+        else:
+            prompt = tokenizer.apply_chat_template(
+                conversation,
+                tokenize=False,
+                add_generation_prompt=True
+            )
+        inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
+        # NOTE(review): tool-call detection below needs the <tool_call> tags
+        # to survive skip_special_tokens=True; confirm for this tokenizer.
+        streamer = TextIteratorStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)
+        generation_kwargs = dict(
+            **inputs,
+            streamer=streamer,
+            max_new_tokens=int(max_new_tokens),
+            temperature=float(temperature),
+            top_k=int(top_k) if top_k > 0 else None,
+            top_p=float(top_p),
+            repetition_penalty=float(repetition_penalty),
+            do_sample=True if temperature > 0 else False,
+            pad_token_id=tokenizer.eos_token_id
+        )
+        # generate() runs in a worker thread so this generator can consume
+        # the streamer and yield partial text while generation is running.
+        thread = Thread(target=model.generate, kwargs=generation_kwargs)
+        thread.start()
+        current_output = ""
+        for new_text in streamer:
+            current_output += new_text
+            generated_text = current_output
+            yield generated_text
+        thread.join()
+        # Check for tool calls
+        tool_calls = None
+        try:
+            # Try to parse tool calls from output
+            if "<tool_call>" in current_output:
+                # Extract tool call JSON
+                # NOTE(review): re.search takes only the first <tool_call>
+                # block; any further blocks in the same output are ignored.
+                import re
+                tool_match = re.search(r'<tool_call>(.*?)</tool_call>', current_output, re.DOTALL)
+                if tool_match:
+                    tool_calls = json.loads(tool_match.group(1))
+        except:
+            # NOTE(review): bare except; any error here, including invalid
+            # JSON, leaves tool_calls as None and the round counts as final.
+            pass
+        if not enable_tools or not tool_calls:
+            # No tool calls, return final response
+            break
+        # Process tool calls
+        generated_text += "\n\n🔧 **Executing tools...**\n"
+        yield generated_text
+        tool_results = process_tool_calls(tool_calls if isinstance(tool_calls, list) else [tool_calls])
+        # Add assistant message with tool calls
+        conversation.append({
+            "role": "assistant",
+            "content": current_output,
+            "tool_calls": tool_calls if isinstance(tool_calls, list) else [tool_calls]
+        })
+        # Add tool results
+        for result in tool_results:
+            conversation.append(result)
+            # Only the first 200 characters of each result are displayed.
+            generated_text += f"\n✓ {result['name']}: {result['content'][:200]}...\n"
+            yield generated_text
+        generated_text += "\n**Processing results...**\n\n"
+        yield generated_text
+        # Continue conversation with tool results
+        # Reset generated_text for next iteration
+        # NOTE(review): if this was the last allowed iteration the loop ends
+        # here, so the last thing yielded is the status text, not an answer.
+        generated_text = ""
 with gr.Blocks(fill_height=True, fill_width=True) as app:
     with gr.Sidebar():
+        gr.Markdown("## Playground with MCP Tools")
         gr.HTML("""
         Runs <b><a href="https://huggingface.co/beyoru/Qwen3-0.9B-A0.6B" target="_blank">
+        beyoru/Qwen3-0.9B-A0.6B</a></b> with <b>MCP Tools Integration</b>.<br><br>
+        <b>Support me at:</b><br><br>
         <a href="https://www.buymeacoffee.com/ductransa0g" target="_blank">
             <img src="https://cdn.buymeacoffee.com/buttons/v2/default-yellow.png" alt="Buy Me A Coffee" width="150px">
         </a>
         """)
+        gr.Markdown("---")
+        gr.Markdown("## Tools Settings")
+        enable_tools = gr.Checkbox(
+            label="Enable MCP Tools",
+            value=True,
+            info="Allow model to call external tools (search, code, images)"
+        )
+        max_tool_iterations = gr.Slider(
+            1, 5, value=3, step=1,
+            label="Max Tool Iterations",
+            info="Maximum number of tool calling rounds"
+        )
         gr.Markdown("---")
         gr.Markdown("## System Prompt")
         system_prompt = gr.Textbox(
             label="System Prompt",
+            placeholder="Enter custom system instructions...",
             lines=4,
+            value="You are a helpful AI assistant with access to tools for web search, code execution, and image generation. Use tools when needed to provide accurate and helpful responses.",
+            info="AI role and behavior"
         )
         gr.Markdown("---")
     gr.ChatInterface(
         fn=playground,
+        additional_inputs=[
+            system_prompt,
+            enable_tools,
+            max_new_tokens,
+            temperature,
+            repetition_penalty,
+            top_k,
+            top_p,
+            max_tool_iterations
+        ],
         chatbot=gr.Chatbot(
+            label="Qwen3-0.9B-A0.6B with MCP Tools",
             show_copy_button=True,
             allow_tags=["think"],
         ),
         examples=[
+            ["Search for the latest news about AI"],
+            ["Calculate the fibonacci sequence up to 10 using code"],
+            ["Generate an image of a cute robot"],
+            ["What's the weather like today?"]
         ],
         cache_examples=False,
         show_api=False