First_agent_template_2

Sleeping

Gabandino committed on Feb 13, 2025

Commit

04a75c1

verified ·

1 Parent(s): 225253c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -24,7 +24,8 @@ def search_news_headlines(source: str) -> str:
     """Searches for recent news headlines from specified source using DuckDuckGo.
     Args:
-        source: News source from supported list (BBC, CNN, etc.)
     Returns:
         Formatted news results or error message
@@ -45,8 +46,8 @@ def search_news_headlines(source: str) -> str:
         if not domain:
             return f"Error: {source} is not a supported news source"
-        # Modified search query to better target actual news articles
-        search_query = f"site:{domain} -inurl:video -inurl:about -inurl:contact -inurl:search news article when:7d"
         # Use existing DuckDuckGoSearchTool implementation
         ddg_tool = DuckDuckGoSearchTool(max_results=5)
@@ -56,10 +57,10 @@ def search_news_headlines(source: str) -> str:
         import re
         headlines = re.findall(r'\[(.*?)\]\((.*?)\)', raw_results)
-        # Filter out navigation/section pages
         filtered_headlines = []
         for title, link in headlines:
-            if not any(x in title.lower() for x in ['breaking news updates', 'latest news headlines', 'news video', 'video clips', 'news article', 'breaking news', 'news']):
                 filtered_headlines.append((title, link))
         # Format the results

     """Searches for recent news headlines from specified source using DuckDuckGo.
     Args:
+        source: News source from supported list (BBC News, CNN, Reuters, AP,
+               Fox News, CBS News, Wall Street Journal, Daily Mail)
     Returns:
         Formatted news results or error message
         if not domain:
             return f"Error: {source} is not a supported news source"
+        # Simplified search query
+        search_query = f"site:{domain} when:7d"
         # Use existing DuckDuckGoSearchTool implementation
         ddg_tool = DuckDuckGoSearchTool(max_results=5)
         import re
         headlines = re.findall(r'\[(.*?)\]\((.*?)\)', raw_results)
+        # Filter out navigation/section pages but with fewer restrictions
         filtered_headlines = []
         for title, link in headlines:
+            if not any(x in title.lower() for x in ['video clips', 'contact us', 'about us']):
                 filtered_headlines.append((title, link))
         # Format the results