Replaced the DuckDuckGo Instant Answer search backend with a Wikipedia API search.
Browse files
app.py
CHANGED
|
@@ -1,6 +1,7 @@
|
|
| 1 |
import os
|
| 2 |
import gradio as gr
|
| 3 |
import requests
|
|
|
|
| 4 |
import pandas as pd
|
| 5 |
|
| 6 |
# (Keep Constants as is)
|
|
@@ -15,7 +16,7 @@ class BasicAgent:
|
|
| 15 |
|
| 16 |
def search_internet(self, query: str) -> str:
|
| 17 |
"""
|
| 18 |
-
Search the internet for information using
|
| 19 |
This is a simple implementation that returns search results as text.
|
| 20 |
|
| 21 |
Args:
|
|
@@ -26,32 +27,56 @@ class BasicAgent:
|
|
| 26 |
"""
|
| 27 |
print(f"Searching internet for: {query}")
|
| 28 |
try:
|
| 29 |
-
#
|
| 30 |
headers = {
|
| 31 |
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'
|
| 32 |
}
|
| 33 |
-
search_url = f"https://api.duckduckgo.com/?q={query}&format=json&no_html=1&no_redirect=1&skip_disambig=1"
|
| 34 |
|
| 35 |
-
|
| 36 |
-
|
| 37 |
-
|
|
|
|
|
|
|
| 38 |
|
| 39 |
-
#
|
| 40 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 41 |
|
| 42 |
-
#
|
| 43 |
-
|
| 44 |
-
|
|
|
|
|
|
|
| 45 |
|
| 46 |
-
# Extract
|
| 47 |
-
|
| 48 |
-
|
| 49 |
-
results.append(f"- {topic['Text']}")
|
| 50 |
|
| 51 |
-
if
|
| 52 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 53 |
else:
|
| 54 |
-
return "
|
| 55 |
|
| 56 |
except Exception as e:
|
| 57 |
print(f"Error searching internet: {e}")
|
|
|
|
| 1 |
import os
|
| 2 |
import gradio as gr
|
| 3 |
import requests
|
| 4 |
+
import inspect
|
| 5 |
import pandas as pd
|
| 6 |
|
| 7 |
# (Keep Constants as is)
|
|
|
|
| 16 |
|
| 17 |
def search_internet(self, query: str) -> str:
|
| 18 |
"""
|
| 19 |
+
Search the internet for information using Wikipedia's API.
|
| 20 |
This is a simple implementation that returns search results as text.
|
| 21 |
|
| 22 |
Args:
|
|
|
|
| 27 |
"""
|
| 28 |
print(f"Searching internet for: {query}")
|
| 29 |
try:
|
| 30 |
+
# Use Wikipedia API to search for information
|
| 31 |
headers = {
|
| 32 |
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'
|
| 33 |
}
|
|
|
|
| 34 |
|
| 35 |
+
# Step 1: Search for relevant articles
|
| 36 |
+
search_url = f"https://en.wikipedia.org/w/api.php?action=query&list=search&srsearch={query}&format=json"
|
| 37 |
+
search_response = requests.get(search_url, headers=headers, timeout=10)
|
| 38 |
+
search_response.raise_for_status()
|
| 39 |
+
search_data = search_response.json()
|
| 40 |
|
| 41 |
+
# Check if we found any search results
|
| 42 |
+
if 'query' not in search_data or 'search' not in search_data['query'] or not search_data['query']['search']:
|
| 43 |
+
return "No relevant information found."
|
| 44 |
+
|
| 45 |
+
# Get the title of the first (most relevant) result
|
| 46 |
+
first_result = search_data['query']['search'][0]
|
| 47 |
+
page_title = first_result['title']
|
| 48 |
|
| 49 |
+
# Step 2: Fetch the content of the most relevant article
|
| 50 |
+
content_url = f"https://en.wikipedia.org/w/api.php?action=query&prop=extracts&exintro=1&explaintext=1&titles={page_title}&format=json"
|
| 51 |
+
content_response = requests.get(content_url, headers=headers, timeout=10)
|
| 52 |
+
content_response.raise_for_status()
|
| 53 |
+
content_data = content_response.json()
|
| 54 |
|
| 55 |
+
# Extract the page content
|
| 56 |
+
pages = content_data['query']['pages']
|
| 57 |
+
page_id = list(pages.keys())[0]
|
|
|
|
| 58 |
|
| 59 |
+
if 'extract' in pages[page_id]:
|
| 60 |
+
extract = pages[page_id]['extract']
|
| 61 |
+
# Limit extract length to avoid very long responses
|
| 62 |
+
if len(extract) > 1000:
|
| 63 |
+
extract = extract[:1000] + "..."
|
| 64 |
+
|
| 65 |
+
result = f"Wikipedia article: {page_title}\n\n{extract}"
|
| 66 |
+
|
| 67 |
+
# Also get a few more related article titles
|
| 68 |
+
related_titles = []
|
| 69 |
+
for item in search_data['query']['search'][1:4]: # Get next 3 results
|
| 70 |
+
related_titles.append(item['title'])
|
| 71 |
+
|
| 72 |
+
if related_titles:
|
| 73 |
+
result += "\n\nRelated topics:\n"
|
| 74 |
+
for title in related_titles:
|
| 75 |
+
result += f"- {title}\n"
|
| 76 |
+
|
| 77 |
+
return result
|
| 78 |
else:
|
| 79 |
+
return "Found a relevant page, but couldn't extract its content."
|
| 80 |
|
| 81 |
except Exception as e:
|
| 82 |
print(f"Error searching internet: {e}")
|