Final_Assignment_Template

Configuration error

oremaz commited on Jun 15, 2025

Commit

8012613

1 Parent(s): 81a79f6

Update agent.py

Files changed (1) hide show

agent.py CHANGED Viewed

@@ -33,7 +33,7 @@ from llama_index.readers.youtube_transcript import YoutubeTranscriptReader
 from llama_index.tools.arxiv import ArxivToolSpec
 from llama_index.core.agent.workflow import AgentWorkflow
 from llama_index.llms.vllm import Vllm
 # Import all required official LlamaIndex Readers
 from llama_index.readers.file import (
@@ -494,16 +494,23 @@ dynamic_qe_manager = DynamicQueryEngineManager()
 # 1. Create the base DuckDuckGo search tool from the official spec.
 # This tool returns text summaries of search results, not just URLs.
 def search_and_extract_content_from_url(query: str) -> List[Document]:
     """
     Searches web, gets top URL, and extracts both text content and images.
     Returns a list of Document objects containing the extracted content.
     """
     # Get URL from search
-    results = search_ddg(query)
-    url = results["AbstractURL"]
     print(url)
     documents = []
     try:

 from llama_index.tools.arxiv import ArxivToolSpec
 from llama_index.core.agent.workflow import AgentWorkflow
 from llama_index.llms.vllm import Vllm
+from llama_index.tools.duckduckgo import DuckDuckGoSearchToolSpec
 # Import all required official LlamaIndex Readers
 from llama_index.readers.file import (
 # 1. Create the base DuckDuckGo search tool from the official spec.
 # This tool returns text summaries of search results, not just URLs.
+base_duckduckgo_tool = DuckDuckGoSearchToolSpec().to_tool_list()[1]
 def search_and_extract_content_from_url(query: str) -> List[Document]:
     """
     Searches web, gets top URL, and extracts both text content and images.
     Returns a list of Document objects containing the extracted content.
     """
     # Get URL from search
+    #search_results = base_duckduckgo_tool(query, max_results=1)
+    #url_match = re.search(r"https?://\S+", str(search_results))
+    #if not url_match:
+        #return [Document(text="No URL could be extracted from the search results.")]
+    #url = url_match.group(0)[:-2]
+    url = "https://en.wikipedia.org/wiki/Mercedes_Sosa"
     print(url)
     documents = []
     try: