Final_Assignment_Template

Configuration error

App Files Files Community

oremaz committed on Jun 15, 2025

Commit

e0b6833

1 Parent(s): c361079

Update agent.py

Browse files

Files changed (1) hide show

agent.py +6 -9

agent.py CHANGED Viewed

@@ -31,7 +31,6 @@ from llama_index.readers.json import JSONReader
 from llama_index.readers.web import BeautifulSoupWebReader
 from llama_index.readers.youtube_transcript import YoutubeTranscriptReader
 from llama_index.tools.arxiv import ArxivToolSpec
-from llama_index.tools.duckduckgo import DuckDuckGoSearchToolSpec
 from llama_index.core.agent.workflow import AgentWorkflow
 from llama_index.llms.vllm import Vllm
@@ -45,6 +44,7 @@ from llama_index.readers.file import (
     VideoAudioReader  # Adding VideoAudioReader for handling audio/video without API
 )
 from pydantic import PrivateAttr
 # Optional API-based imports (conditionally loaded)
 try:
@@ -486,7 +486,6 @@ dynamic_qe_manager = DynamicQueryEngineManager()
 # 1. Create the base DuckDuckGo search tool from the official spec.
 # This tool returns text summaries of search results, not just URLs.
-base_duckduckgo_tool = DuckDuckGoSearchToolSpec().to_tool_list()[1]
 def search_and_extract_content_from_url(query: str) -> List[Document]:
     """
@@ -494,14 +493,12 @@ def search_and_extract_content_from_url(query: str) -> List[Document]:
     Returns a list of Document objects containing the extracted content.
     """
     # Get URL from search
-    search_results = base_duckduckgo_tool(query, max_results=1)
-    url_match = re.search(r"https?://\\S+", str(search_results))
-    if not url_match:
-        return [Document(text="No URL could be extracted from the search results.")]
-    url = url_match.group(0)[:-2]
-    print(url)
     documents = []

 from llama_index.readers.web import BeautifulSoupWebReader
 from llama_index.readers.youtube_transcript import YoutubeTranscriptReader
 from llama_index.tools.arxiv import ArxivToolSpec
 from llama_index.core.agent.workflow import AgentWorkflow
 from llama_index.llms.vllm import Vllm
     VideoAudioReader  # Adding VideoAudioReader for handling audio/video without API
 )
 from pydantic import PrivateAttr
+from duckduckgo_search import DDGS
 # Optional API-based imports (conditionally loaded)
 try:
 # 1. Search DuckDuckGo directly through the duckduckgo_search DDGS client.
 # The first result's 'href' field supplies the URL used below.
 def search_and_extract_content_from_url(query: str) -> List[Document]:
     """
     Returns a list of Document objects containing the extracted content.
     """
     # Get URL from search
+    with DDGS() as ddgs:
+        results = list(ddgs.text(query, max_results=1))
+    if not results:
+        return []
+    url = results[0]['href']
     documents = []