Sborole-Final-Assignment

Runtime error

App Files Files Community

Sborole committed on Dec 1, 2025

Commit

7de8b44

verified ·

1 Parent(s): b0cdee0

Update tools/SemanticScholar.py

Browse files

Files changed (1) hide show

tools/SemanticScholar.py +30 -57

tools/SemanticScholar.py CHANGED Viewed

@@ -2,73 +2,46 @@ import os
 from smolagents import Tool
 from googleapiclient.discovery import build
-class GoogleAcademicSearchTool(Tool):
     """
-    A specialized search tool that uses the Google Custom Search Engine (CSE)
-    API to find academic papers by applying strong search filters (e.g., site:scholar.google.com).
-    This replaces the Semantic Scholar tool which was experiencing timeouts.
     """
-    name = "academic_paper_search"
-    description = "Searches for academic papers by restricting the Google search to academic domains (like Google Scholar) and returns relevant titles, snippets, and source links."
     inputs = {
-        "query": {"type": "string", "description": "Search query for academic papers (title, keywords, author, etc.)"}
     }
     output_type = "string"
     def __init__(self, **kwargs):
         super().__init__(**kwargs)
-        # Retrieve credentials from environment variables
-        self.api_key = os.getenv("GOOGLE_API_KEY")
-        self.cse_id = os.getenv("GOOGLE_CSE_ID")
-        if not self.api_key or not self.cse_id:
-            raise ValueError("GOOGLE_API_KEY or GOOGLE_CSE_ID secret not found.")
-        # Initialize the Google Custom Search service
-        self.service = build(
-            "customsearch", "v1", developerKey=self.api_key
-        )
     def forward(self, query: str) -> str:
-        """
-        Executes a Google search query, restricting results to academic domains.
-        """
-        print(f"Executing Google Academic search for: '{query}'")
-        # Modify the query to prioritize academic sources
-        # We use OR to check multiple popular domains for better coverage
-        academic_filter = "site:scholar.google.com OR site:researchgate.net OR site:pubmed.ncbi.nlm.nih.gov"
-        google_academic_query = f"{query} {academic_filter}"
         try:
-            # Execute the search request for up to 3 results
-            res = self.service.cse().list(
-                q=google_academic_query,
-                cx=self.cse_id,
-                num=3
-            ).execute()
-            items = res.get('items', [])
-            if not items:
-                return "XX record info: No academic results found using Google search filters."
-            search_results = []
-            for i, item in enumerate(items):
-                title = item.get('title', 'N/A')
-                snippet = item.get('snippet', 'No snippet available.')
-                link = item.get('link', 'N/A')
-                # Format similar to the previous academic tool
-                search_results.append(
-                    f"RESULT {i+1}: **{title}**\n"
-                    f"CONTENT: {snippet}\n"
-                    f"SOURCE: {link}"
                 )
-            return "\n\n---SEPARATOR---\n\n".join(search_results)
         except Exception as e:
-            return f"Error during Google Academic Search API call: {e}"

 from smolagents import Tool
 from googleapiclient.discovery import build
+class TavilyResearchTool(Tool):
     """
+    Tavily deep-research search tool.
+    Use this when the question needs academic papers,
+    scientific background or research-level accuracy.
     """
+    name = "tavily_research"
+    description = (
+        "Use Tavily deep research mode to find academic-level content "
+        "including papers, research summaries, and high-quality sources."
+    )
     inputs = {
+        "query": {"type": "string", "description": "Research topic to search"}
     }
     output_type = "string"
     def __init__(self, **kwargs):
+        """Read TAVILY_API_KEY from the environment and build the Tavily client.
+
+        Raises:
+            ValueError: if TAVILY_API_KEY is unset or empty.
+        """
         super().__init__(**kwargs)
+        # TavilyClient is not imported at module level in this file, so it is
+        # imported here; without it, constructing the tool raises NameError.
+        from tavily import TavilyClient
+        api_key = os.getenv("TAVILY_API_KEY")
+        if not api_key:
+            raise ValueError("Missing TAVILY_API_KEY.")
+        self.client = TavilyClient(api_key=api_key)
     def forward(self, query: str) -> str:
+        """Search Tavily for `query` and return the results as formatted text.
+
+        Requests at most 5 results with search_depth="advanced". Each result
+        is rendered as TITLE / CONTENT / SOURCE lines, and results are joined
+        by a separator line. Any exception is caught and returned as an error
+        string instead of being raised.
+        """
         try:
+            response = self.client.search(
+                query=query,
+                search_depth="advanced",     # <-- academic/longform mode
+                max_results=5
+            )
+            out = []
+            for r in response.get("results", []):
+                out.append(
+                    f"TITLE: {r.get('title')}\n"
+                    f"CONTENT: {r.get('content')}\n"
+                    f"SOURCE: {r.get('url')}"
                 )
+            return "\n\n---SEPARATOR---\n\n".join(out)
         except Exception as e:
+            return f"Tavily research error: {e}"