First_agent_template

Sleeping

App Files Files Community

mwill-AImission committed on Feb 16, 2025

Commit

ef94807

verified ·

1 Parent(s): 5b8115e

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -94

app.py CHANGED Viewed

@@ -1,17 +1,10 @@
 # AI Agent Framework Imports
 from smolagents import CodeAgent, HfApiModel, tool, load_tool
-# Selenium & webdriver-manager for Browser Automation
-from selenium import webdriver
-from selenium.webdriver.chrome.options import Options
-from selenium.webdriver.chrome.service import Service
-from selenium.webdriver.common.by import By
-from webdriver_manager.chrome import ChromeDriverManager
-import re
-import time
 # Standard Library Imports (allowed)
 import time
 import yaml
@@ -21,48 +14,7 @@ from tools.final_answer import FinalAnswerTool
 from Gradio_UI import GradioUI
 # --------------------------------------------
-# Helper function to obtain and configure the Selenium driver automatically.
-def get_driver():
-    options = Options()
-    options.add_argument("--headless")            # Run in headless mode
-    options.add_argument("--disable-gpu")
-    options.add_argument("--no-sandbox")
-    options.add_argument("--disable-dev-shm-usage")
-    # Use webdriver-manager to install the proper ChromeDriver
-    service = Service(ChromeDriverManager().install())
-    driver = webdriver.Chrome(service=service, options=options)
-    return driver
-# --------------------------------------------
-# Tool to analyze a webpage or document and provide a simplified summary.
-@tool
-def analyze_and_simplify(url: str) -> str:
-    """Fetches webpage content using Selenium, strips HTML tags, and provides a simplified summary.
-    Args:
-        url: The webpage URL to analyze.
-    """
-    try:
-        driver = get_driver()
-        driver.get(url)
-        time.sleep(5)  # Wait for content to load
-        # Fetch page source and use regex to strip HTML tags.
-        page_source = driver.page_source
-        driver.quit()
-        # Remove HTML tags (very simple approach)
-        text = re.sub(r'<[^>]+>', '', page_source)
-        text = text.strip()
-        if not text:
-            return "No readable text found on the page."
-        # Return a truncated summary of the text.
-        summary = f"Simplified Summary: {text[:500]}..."
-        return summary
-    except Exception as e:
-        return f"Error analyzing webpage: {str(e)}"
-# --------------------------------------------
-# Tool to detect ambiguous instructions.
 @tool
 def detect_ambiguity(content: str) -> str:
     """Checks for vague instructions and suggests clarifications.
@@ -70,11 +22,10 @@ def detect_ambiguity(content: str) -> str:
     Args:
         content: Text to analyze.
     """
-    # Placeholder logic for ambiguity detection.
     return "Ambiguity detected. Click 'Is this ambiguous?' for help."
 # --------------------------------------------
-# Tool to explain technical terms in simple language.
 @tool
 def explain_assumed_knowledge(term: str) -> str:
     """Defines technical terms in a simple way.
@@ -85,33 +36,20 @@ def explain_assumed_knowledge(term: str) -> str:
     return f"Definition of '{term}': [Detailed beginner-friendly explanation here]"
 # --------------------------------------------
-# Tool to highlight a UI element and optionally perform a click.
 @tool
 def highlight_elements(step: str, element: str, auto_execute: bool = False) -> str:
-    """Highlights a UI element and optionally performs an action.
     Args:
         step: The current step in the guide.
-        element: The UI element to highlight (as an XPath).
-        auto_execute: If True, the agent will automatically click the element.
     """
-    try:
-        driver = get_driver()
-        # Here we simply navigate to a blank page (or a given URL if needed).
-        driver.get("about:blank")
-        if auto_execute:
-            elem = driver.find_element(By.XPATH, element)
-            elem.click()
-            result = f"Step {step}: Auto-clicked '{element}'."
-        else:
-            result = f"Step {step}: Please click on '{element}'."
-        driver.quit()
-        return result
-    except Exception as e:
-        return f"Error in highlight_elements: {str(e)}"
 # --------------------------------------------
-# Tool to explain a single line of code.
 @tool
 def explain_code_line(line: str) -> str:
     """Explains what a line of code does in simple terms.
@@ -122,7 +60,7 @@ def explain_code_line(line: str) -> str:
     return f"Explanation for: {line} [Insert explanation here]"
 # --------------------------------------------
-# Tool to provide an interactive teacher box for user queries.
 @tool
 def teacher_box_query(question: str) -> str:
     """Allows users to ask the AI questions while browsing.
@@ -133,7 +71,7 @@ def teacher_box_query(question: str) -> str:
     return f"AI Answer: [Response for '{question}']"
 # --------------------------------------------
-# Tool to toggle between manual and automatic navigation modes.
 @tool
 def toggle_auto_execution(enable: bool) -> str:
     """Lets the user turn automatic navigation on or off.
@@ -156,24 +94,5 @@ model = HfApiModel(
 with open("prompts.yaml", 'r') as stream:
     prompt_templates = yaml.safe_load(stream)
-# Create the AI agent with the defined tools.
-agent = CodeAgent(
-    model=model,
-    tools=[
-        FinalAnswerTool(),
-        analyze_and_simplify,
-        detect_ambiguity,
-        explain_assumed_knowledge,
-        highlight_elements,
-        explain_code_line,
-        teacher_box_query,
-        toggle_auto_execution
-    ],
-    max_steps=6,             # Maximum number of reasoning steps.
-    verbosity_level=1,       # Level of detail in agent responses.
-    prompt_templates=prompt_templates
-)
-# Launch the interactive UI using Gradio.
-GradioUI(agent).launch()

+# app.py
 # AI Agent Framework Imports
 from smolagents import CodeAgent, HfApiModel, tool, load_tool
 # Standard Library Imports (allowed)
 import time
 import yaml
 from Gradio_UI import GradioUI
 # --------------------------------------------
+# Tool: detect_ambiguity
 @tool
 def detect_ambiguity(content: str) -> str:
     """Checks for vague instructions and suggests clarifications.
     Args:
         content: Text to analyze.
     """
     return "Ambiguity detected. Click 'Is this ambiguous?' for help."
 # --------------------------------------------
+# Tool: explain_assumed_knowledge
 @tool
 def explain_assumed_knowledge(term: str) -> str:
     """Defines technical terms in a simple way.
     return f"Definition of '{term}': [Detailed beginner-friendly explanation here]"
 # --------------------------------------------
+# Tool: highlight_elements (modified to a placeholder)
 @tool
 def highlight_elements(step: str, element: str, auto_execute: bool = False) -> str:
+    """(Placeholder) Highlights a UI element and optionally performs an action.
     Args:
         step: The current step in the guide.
+        element: The UI element to highlight (as an identifier).
+        auto_execute: If True, the agent would auto-click the element.
     """
+    return "Highlight functionality is currently not available."
 # --------------------------------------------
+# Tool: explain_code_line
 @tool
 def explain_code_line(line: str) -> str:
     """Explains what a line of code does in simple terms.
     return f"Explanation for: {line} [Insert explanation here]"
 # --------------------------------------------
+# Tool: teacher_box_query
 @tool
 def teacher_box_query(question: str) -> str:
     """Allows users to ask the AI questions while browsing.
     return f"AI Answer: [Response for '{question}']"
 # --------------------------------------------
+# Tool: toggle_auto_execution
 @tool
 def toggle_auto_execution(enable: bool) -> str:
     """Lets the user turn automatic navigation on or off.
 with open("prompts.yaml", 'r') as stream:
     prompt_templates = yaml.safe_load(stream)
+#