beitemian committed on
Commit
1b66ea9
·
1 Parent(s): 3a496d9

updated tools and req

Browse files
Files changed (3) hide show
  1. agent.py +28 -4
  2. requirements.txt +3 -1
  3. tools.py +27 -2
agent.py CHANGED
@@ -13,9 +13,10 @@ project_root = str(Path(__file__).parent)
13
  if project_root not in sys.path:
14
  sys.path.insert(0, project_root)
15
  import os
16
- from tools import web_search, math_tools
17
  #from memory import set_memory
18
  from llama_index.core.agent.workflow import FunctionAgent, AgentWorkflow, ToolCall, ToolCallResult, ReActAgent
 
19
  #from llama_index.core.memory import Memory
20
  import asyncio
21
  from datetime import datetime
@@ -39,6 +40,26 @@ llm_deepseek_r1 = DeepSeek(
39
  #test the llm
40
  #answerr = llm_deepseek_r1.complete("What is the capital of France?")
41
  #print(answerr)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
 
43
  researcher_agent = FunctionAgent(
44
  llm=llm_deepseek_r1,
@@ -85,7 +106,8 @@ Response Guidelines:
85
  - STRICT!!! Only answer the question directly, concisely. For example, if the question is "What is the capital of France?", the answer should be "Paris".
86
  - No elaboration or explanation, only straight answer to the question.
87
  - Plain text response formatting.
88
- """,
 
89
  tools = [
90
  web_search,
91
  math_tools.add,
@@ -93,8 +115,10 @@ Response Guidelines:
93
  math_tools.multiply,
94
  math_tools.divide,
95
  math_tools.modulus
96
- ]
 
 
97
  )
98
 
99
- workflow_agent = AgentWorkflow(agents = [researcher_agent], root_agent=researcher_agent.name, verbose=True)
100
 
 
13
  if project_root not in sys.path:
14
  sys.path.insert(0, project_root)
15
  import os
16
+ from tools import web_search, math_tools, file_management_tools
17
  #from memory import set_memory
18
  from llama_index.core.agent.workflow import FunctionAgent, AgentWorkflow, ToolCall, ToolCallResult, ReActAgent
19
+ from llama_index.llms.openai import OpenAI
20
  #from llama_index.core.memory import Memory
21
  import asyncio
22
  from datetime import datetime
 
40
  #test the llm
41
  #answerr = llm_deepseek_r1.complete("What is the capital of France?")
42
  #print(answerr)
43
# GPT-4o client backing the media-analysis agent.
# NOTE(review): assumes OPENAI_API_KEY is present in the environment — confirm
# deployment configuration before running.
gpt_4o = OpenAI(
    model="gpt-4o",
    api_key=os.getenv("OPENAI_API_KEY"),
    temperature=0.2,   # low temperature for consistent, factual summaries
    max_retries=5,
    timeout=100,
)
50
# Image and video understanding agent
# TODO: Add tools for video, audio analysis.
# NOTE(review): the TOOLS / PLAN / OUTPUT FORMATTING sections of the system
# prompt are empty placeholders — fill them in before relying on this agent.
media_agent = FunctionAgent(
    llm=gpt_4o,
    name="Luna",
    description="An agent that analyzes videos, audio, and images to provide a summary of the content.",
    # Plain string: the prompt contains no {placeholders}, so the f-prefix was
    # unnecessary (and risky — any literal braces added later would raise).
    system_prompt="""Luna is an expert at analyzing videos, images, audio. Luna concisely leverages tools to analyze these modalities.
TOOLS:
PLAN:
OUTPUT FORMATTING: """,
    tools=[file_management_tools.read_youtube_video],
    allow_parallel_tool_calls=True,
)
63
 
64
  researcher_agent = FunctionAgent(
65
  llm=llm_deepseek_r1,
 
106
  - STRICT!!! Only answer the question directly, concisely. For example, if the question is "What is the capital of France?", the answer should be "Paris".
107
  - No elaboration or explanation, only straight answer to the question.
108
  - Plain text response formatting.
109
+ """,
110
+ #TODO: Add tools for wikipedia, and document processing (csv, code, pdf, etc.)
111
  tools = [
112
  web_search,
113
  math_tools.add,
 
115
  math_tools.multiply,
116
  math_tools.divide,
117
  math_tools.modulus
118
+ ],
119
+ allow_parallel_tool_calls=True,
120
+ can_handoff_to=media_agent
121
  )
122
 
123
# Top-level workflow: the researcher agent is the root and may hand off to the
# media agent (Luna) for video/audio/image questions.
workflow_agent = AgentWorkflow(
    agents=[researcher_agent, media_agent],
    root_agent=researcher_agent.name,
    verbose=True,
    handoff_prompt="Please handoff to the media agent to analyze videos, audio, images.",
)
124
 
requirements.txt CHANGED
@@ -6,4 +6,6 @@ llama-index-core
6
  linkup-sdk
7
  python-dotenv
8
  requests
9
- pandas
 
 
 
6
  linkup-sdk
7
  python-dotenv
8
  requests
9
+ pandas
10
+ llama-index-readers-youtube-transcript
11
+ llama-hub-youtube-transcript
tools.py CHANGED
@@ -1,5 +1,8 @@
1
  from linkup import LinkupClient
2
  from dotenv import load_dotenv
 
 
 
3
  import os
4
  load_dotenv()
5
  linkup_client = LinkupClient(api_key=os.getenv("LINKUP_API_KEY"))
@@ -85,5 +88,27 @@ class MathTools:
85
  # Create an instance for easy importing
86
  math_tools = MathTools()
87
 
88
-
89
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  from linkup import LinkupClient
2
  from dotenv import load_dotenv
3
+ from llama_index.readers.youtube_transcript import YoutubeTranscriptReader
4
+ from llama_index.readers.youtube_transcript.utils import is_youtube_video
5
+ from llama_index.core import Document
6
  import os
7
  load_dotenv()
8
  linkup_client = LinkupClient(api_key=os.getenv("LINKUP_API_KEY"))
 
88
  # Create an instance for easy importing
89
  math_tools = MathTools()
90
 
91
# File management tools
class FileManagementTools:
    """A class for interacting with files (csv, jpeg, png, pdf, etc.)"""

    def __init__(self):  # TODO: Add proper init
        # Placeholder state for future file handling; none of these attributes
        # are read or written yet.
        self.file_path = None
        self.file_type = None
        self.file_name = None
        self.file_size = None
        self.file_content = None

    # TODO: Finish the class with proper source handling and additional file type reading.
    def read_youtube_video(self, urls: list[str]) -> list[Document]:
        """Read a youtube video and return the transcript.

        Args:
            urls: Candidate YouTube URLs; non-YouTube URLs are silently dropped.

        Returns:
            One ``Document`` per transcript loaded from the valid URLs.

        Raises:
            ValueError: If no valid YouTube URL is given, or if transcript
                loading fails for any reason.
        """
        valid_urls = [url for url in urls if is_youtube_video(url)]

        if not valid_urls:
            raise ValueError("No valid YouTube URLs provided")
        # Load transcripts for valid URLs
        try:
            loader = YoutubeTranscriptReader()
            return loader.load_data(ytlinks=valid_urls)
        except Exception as e:
            # Chain the original exception so the root cause stays visible
            # in tracebacks instead of being swallowed by the re-raise.
            raise ValueError(f"Error loading YouTube transcripts: {e}") from e


# Create an instance for easy importing
file_management_tools = FileManagementTools()