First_agent_template

Sleeping

App Files Files Community

mwill-AImission committed on Feb 16, 2025

Commit

1c98c9a

verified ·

1 Parent(s): ae7a494

Update app.py

Browse files

Files changed (1) hide show

app.py +152 -41

app.py CHANGED Viewed

@@ -1,69 +1,180 @@
-from smolagents import CodeAgent,DuckDuckGoSearchTool, HfApiModel,load_tool,tool
-import datetime
 import requests
-import pytz
 import yaml
-from tools.final_answer import FinalAnswerTool
 from Gradio_UI import GradioUI
-# Below is an example of a tool that does nothing. Amaze us with your creativity !
 @tool
-def my_custom_tool(arg1:str, arg2:int)-> str: #it's import to specify the return type
-    #Keep this format for the description / args / args description but feel free to modify the tool
-    """A tool that does nothing yet
     Args:
-        arg1: the first argument
-        arg2: the second argument
     """
-    return "What magic will you build ?"
 @tool
-def get_current_time_in_timezone(timezone: str) -> str:
-    """A tool that fetches the current local time in a specified timezone.
     Args:
-        timezone: A string representing a valid timezone (e.g., 'America/New_York').
     """
     try:
-        # Create timezone object
-        tz = pytz.timezone(timezone)
-        # Get current time in that timezone
-        local_time = datetime.datetime.now(tz).strftime("%Y-%m-%d %H:%M:%S")
-        return f"The current local time in {timezone} is: {local_time}"
     except Exception as e:
-        return f"Error fetching time for timezone '{timezone}': {str(e)}"
-final_answer = FinalAnswerTool()
-# If the agent does not answer, the model is overloaded, please use another model or the following Hugging Face Endpoint that also contains qwen2.5 coder:
-# model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'
 model = HfApiModel(
-max_tokens=2096,
-temperature=0.5,
-model_id='Qwen/Qwen2.5-Coder-32B-Instruct',# it is possible that this model may be overloaded
-custom_role_conversions=None,
 )
-# Import tool from Hub
-image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)
 with open("prompts.yaml", 'r') as stream:
     prompt_templates = yaml.safe_load(stream)
 agent = CodeAgent(
     model=model,
-    tools=[final_answer], ## add your tools here (don't remove final answer)
-    max_steps=6,
-    verbosity_level=1,
-    grammar=None,
-    planning_interval=None,
-    name=None,
-    description=None,
     prompt_templates=prompt_templates
 )
-GradioUI(agent).launch()

+# app.py
+# AI Agent Framework Imports
+from smolagents import CodeAgent, HfApiModel, tool, load_tool
+# Web Scraping and Parsing
 import requests
+from bs4 import BeautifulSoup
+# Selenium & webdriver-manager for Browser Automation
+from selenium import webdriver
+from selenium.webdriver.chrome.options import Options
+from selenium.webdriver.chrome.service import Service
+from selenium.webdriver.common.by import By
+from webdriver_manager.chrome import ChromeDriverManager
+import time
+import os
+# NLP and Text Processing (Optional for Future Enhancements)
+import nltk
+from nltk.tokenize import sent_tokenize
+import spacy
+# Code Parsing and Explanation
+import ast
+from pygments import highlight
+from pygments.lexers import PythonLexer
+from pygments.formatters import HtmlFormatter
+# UI Overlay & Interaction
+import gradio as gr
+import cv2  # Optional: for visual highlights
 import yaml
+# Final Answer and UI Handling
+from tools.final_answer import FinalAnswerTool
 from Gradio_UI import GradioUI
+# Helper function to automatically obtain and configure the Selenium driver
+def get_driver():
+    """Build a headless Chrome WebDriver using an auto-installed ChromeDriver.
+
+    Returns:
+        The ``webdriver.Chrome`` instance configured with the flags below.
+        It is handed back still running; this function never quits it.
+    """
+    chrome_flags = (
+        "--headless",  # Run browser in headless mode
+        "--disable-gpu",
+        "--no-sandbox",
+        "--disable-dev-shm-usage",
+    )
+    chrome_options = Options()
+    for flag in chrome_flags:
+        chrome_options.add_argument(flag)
+    # Automatically install and use the appropriate ChromeDriver
+    chromedriver_service = Service(ChromeDriverManager().install())
+    return webdriver.Chrome(service=chromedriver_service, options=chrome_options)
+# Tool to analyze a webpage or document and simplify its content
+@tool
+def analyze_and_simplify(url: str) -> str:
+    """Fetches webpage content, extracts text, and provides a simplified summary.
+    Args:
+        url: The webpage URL to analyze.
+    """
+    # NOTE(review): docstring kept verbatim -- @tool presumably reads it at
+    # runtime to describe the tool and its arguments; confirm before rewording.
+    #
+    # Returns the first 500 characters of the page's <p> text wrapped in a
+    # fixed "Simplified Summary" template, or an error/empty-page message.
+    # Never raises: every exception is converted into the returned string.
+    try:
+        driver = get_driver()
+        try:
+            driver.get(url)
+            time.sleep(5)  # Wait for content to load
+            page_html = driver.page_source
+        finally:
+            # Always shut the browser down, even when loading the page fails,
+            # so a failed call does not leave a Chrome process behind.
+            driver.quit()
+        soup = BeautifulSoup(page_html, "html.parser")
+        text = ' '.join(p.get_text() for p in soup.find_all("p"))
+        # strip(): several empty <p> tags join into a whitespace-only string,
+        # which carries no readable text either.
+        if not text.strip():
+            return "No readable text found on the page."
+        return f"Simplified Summary: {text[:500]}... (summary continues)"
+    except Exception as e:
+        return f"Error analyzing webpage: {str(e)}"
+# Tool to detect ambiguous directions and suggest clarification
+@tool
+def detect_ambiguity(content: str) -> str:
+    """Checks for vague instructions and suggests clarifications.
+    Args:
+        content: Text to analyze.
+    """
+    # Placeholder: `content` is not inspected yet, so every call returns the
+    # same fixed prompt.
+    ambiguity_prompt = "Ambiguity detected. Click 'Is this ambiguous?' for help."
+    return ambiguity_prompt
+# Tool to explain technical terms or assumed knowledge in simple language
 @tool
+def explain_assumed_knowledge(term: str) -> str:
+    """Defines difficult or technical terms in a simple way.
     Args:
+        term: The term to explain.
     """
+    # Placeholder: the term is only echoed inside a fixed template; no actual
+    # definition is looked up.
+    definition = f"Definition of '{term}': [Detailed beginner-friendly explanation here]"
+    return definition
+# Tool to highlight a UI element and optionally automate its interaction
 @tool
+def highlight_elements(step: str, element: str, auto_execute: bool = False) -> str:
+    """Highlights a UI element and optionally performs an action.
     Args:
+        step: The current step in the guide.
+        element: The UI element to highlight (expected as an XPath).
+        auto_execute: If True, the agent will click the element automatically.
     """
+    # NOTE(review): docstring kept verbatim -- @tool presumably reads it at
+    # runtime to describe the tool and its arguments; confirm before rewording.
+    #
+    # Returns a per-step message (auto-clicked vs. manual instruction), or an
+    # error string; exceptions are never propagated to the caller.
     try:
+        driver = get_driver()
+        try:
+            # Navigate to a placeholder page; replace "about:blank" with the actual URL if needed
+            driver.get("about:blank")
+            if auto_execute:
+                target = driver.find_element(By.XPATH, element)
+                target.click()
+                result = f"Step {step}: Auto-clicked '{element}'."
+            else:
+                result = f"Step {step}: Please click on '{element}'."
+        finally:
+            # Element lookup/click can raise; quit here so the browser is
+            # closed on the failure path as well as on success.
+            driver.quit()
+        return result
     except Exception as e:
+        return f"Error in highlight_elements: {str(e)}"
+# Tool to explain a single line of code in simple terms
+@tool
+def explain_code_line(line: str) -> str:
+    """Explains what a line of code does in simple terms.
+    Args:
+        line: The code to explain.
+    """
+    # Placeholder: the line is embedded in a fixed template; it is not parsed.
+    explanation = f"Explanation for: {line} [Insert explanation here]"
+    return explanation
+# Tool to provide an interactive teacher box for user queries
+@tool
+def teacher_box_query(question: str) -> str:
+    """Allows users to ask the AI questions while browsing.
+    Args:
+        question: User's query.
+    """
+    # Placeholder: echoes the question inside a fixed answer template.
+    answer = f"AI Answer: [Response for '{question}']"
+    return answer
+# Tool to toggle between manual and automatic navigation modes
+@tool
+def toggle_auto_execution(enable: bool) -> str:
+    """Lets the user turn automatic navigation on or off.
+    Args:
+        enable: True for auto-mode, False for manual steps.
+    """
+    # Only reports the selected mode as text; no setting is stored here.
+    if enable:
+        return "Auto-execution enabled."
+    return "Manual step-by-step mode enabled."
+# Configure the AI Model
 model = HfApiModel(
+    max_tokens=2096,       # Maximum response length
+    temperature=0.5,       # Controls response randomness
+    model_id='Qwen/Qwen2.5-Coder-32B-Instruct',  # Selected model
+    custom_role_conversions=None
 )
+# Load prompt templates from a YAML configuration file
+# Explicit UTF-8 so parsing does not depend on the platform's default encoding
+with open("prompts.yaml", 'r', encoding="utf-8") as stream:
     prompt_templates = yaml.safe_load(stream)
+# Create the AI agent with the defined tools
 agent = CodeAgent(
     model=model,
+    tools=[
+        FinalAnswerTool(),
+        analyze_and_simplify,
+        detect_ambiguity,
+        explain_assumed_knowledge,
+        highlight_elements,
+        explain_code_line,
+        teacher_box_query,
+        toggle_auto_execution
+    ],
+    max_steps=6,             # Maximum number of reasoning steps
+    verbosity_level=1,       # Level of detail in agent responses
     prompt_templates=prompt_templates
 )
+# Launch the interactive UI using Gradio
+GradioUI(agent).launch()