First_agent_template

Sleeping

App Files Files Community

mhattingpete committed on Feb 12, 2025

Commit

3118bd6

verified ·

1 Parent(s): d638726

Added arXiv search tool

Browse files

Files changed (1) hide show

app.py +66 -8

app.py CHANGED Viewed

@@ -3,20 +3,78 @@ import datetime
 import requests
 import pytz
 import yaml
-from tools.final_answer import FinalAnswerTool, VisitWebpageTool
 from Gradio_UI import GradioUI
-# Below is an example of a tool that does nothing. Amaze us with your creativity!
 @tool
-def my_cutom_tool(arg1:str, arg2:int)-> str: # it's important to specify the return type
-    # Keep this format for the description / args / args description but feel free to modify the tool
-    """A tool that does nothing yet
     Args:
-        arg1: the first argument
-        arg2: the second argument
     """
-    return "What magic will you build ?"
 @tool
 def get_current_time_in_timezone(timezone: str) -> str:

 import requests
 import pytz
 import yaml
+from tools.final_answer import FinalAnswerTool
+from tools.visit_webpage import VisitWebpageTool
 from Gradio_UI import GradioUI
+import arxiv
+from transformers import pipeline
+# Summarization pipeline, built once at import time and shared by _summarize_text.
+# The checkpoint is named explicitly: when no `model` is given, transformers picks
+# a task default and logs a warning that relying on it is not recommended.
+# NOTE(review): this is the checkpoint transformers currently selects by default
+# for the "summarization" task, so output should be unchanged - confirm on upgrade.
+summarizer = pipeline("summarization", model="sshleifer/distilbart-cnn-12-6")
+def _search_arxiv(query: str, max_results: int = 5) -> list[dict[str, str | list[str]]]:
+    """
+    Search arXiv for papers matching a query, sorted by submission date.
+    Args:
+        query (str): The search query, passed to arXiv unchanged.
+        max_results (int): Maximum number of results to retrieve.
+    Returns:
+        list[dict[str, str | list[str]]]: One dict per paper with the keys
+        'title', 'authors' (list of author names), 'summary' (the abstract),
+        'published' (formatted as YYYY-MM-DD) and 'url' (the result's entry_id).
+    """
+    search = arxiv.Search(
+        query=query,
+        max_results=max_results,
+        sort_by=arxiv.SortCriterion.SubmittedDate,
+    )
+    # Search.results() is deprecated in arxiv 2.x; fetching through a Client is
+    # the supported path and yields the same Result objects.
+    client = arxiv.Client()
+    return [
+        {
+            'title': paper.title,
+            'authors': [author.name for author in paper.authors],
+            'summary': paper.summary,
+            'published': paper.published.strftime("%Y-%m-%d"),
+            'url': paper.entry_id,
+        }
+        for paper in client.results(search)
+    ]
+def _summarize_text(text: str) -> str:
+    """
+    Condense a piece of text with the module-level summarization pipeline.
+    Args:
+        text (str): The text to condense.
+    Returns:
+        str: The 'summary_text' field of the first pipeline output.
+    """
+    # Sampling is disabled and the output length is bounded (min 30, max 130).
+    # Long inputs are passed through as-is; no chunking is done here.
+    outputs = summarizer(text, max_length=130, min_length=30, do_sample=False)
+    first_output = outputs[0]
+    return first_output['summary_text']
 @tool
+def personalized_research_assistant(query: str) -> str:
+    """A tool that fetches relevant articles from arxiv and returns their title, authors, date, URL and a short summary of each abstract.
     Args:
+        query: The research query to search for in arxiv.
     """
+    articles = _search_arxiv(query)
+    if not articles:
+        # Give the calling agent an explicit signal rather than an empty string.
+        return f"No arXiv articles found for query: {query}"
+    separator = "-" * 80
+    sections = []
+    for idx, article in enumerate(articles, start=1):
+        # The helper is defined as _summarize_text; the previous call to
+        # summarize_text raised NameError on the first article.
+        abstract_summary = _summarize_text(article['summary'])
+        sections.append(
+            f"\nArticle {idx}:\n"
+            f"\nTitle: {article['title']}\n"
+            f"Authors: {', '.join(article['authors'])}\n"
+            f"Published on: {article['published']}\n"
+            f"URL: {article['url']}\n"
+            "Abstract Summary:\n"
+            f"{abstract_summary}\n"
+            f"{separator}"
+        )
+    # Each section starts with a newline, so the separator of one article is
+    # followed directly by the header of the next, as before.
+    return "".join(sections)
 @tool
 def get_current_time_in_timezone(timezone: str) -> str: