Spaces:
Sleeping
Sleeping
| import os | |
| from dotenv import load_dotenv | |
| from typing import TypedDict, List, Dict, Any, Optional | |
| from langgraph.graph import StateGraph, START, END, MessagesState | |
| from langchain.agents import create_tool_calling_agent, AgentExecutor, initialize_agent, create_react_agent | |
| from langchain_google_genai import ChatGoogleGenerativeAI | |
| from langchain_groq import ChatGroq | |
| from langchain_core.tools import tool | |
| from langchain_core.messages import HumanMessage, SystemMessage | |
| from langchain_core.prompts import ChatPromptTemplate, PromptTemplate | |
| from langgraph.prebuilt import ToolNode | |
| from langgraph.prebuilt import tools_condition | |
| # 1. Web Browsing | |
| from langchain_community.tools import DuckDuckGoSearchResults | |
| from langchain_community.document_loaders import ImageCaptionLoader | |
| import requests, time | |
| import pandas as pd | |
| from pathlib import Path | |
| from langchain_community.tools import WikipediaQueryRun | |
| from langchain_community.utilities import WikipediaAPIWrapper | |
| from langchain_community.document_loaders import YoutubeLoader | |
| from langchain_community.document_loaders import UnstructuredExcelLoader | |
| from langchain_community.document_loaders import AssemblyAIAudioTranscriptLoader | |
| from langchain.text_splitter import CharacterTextSplitter | |
| from langchain_community.utilities import GoogleSerperAPIWrapper | |
| load_dotenv() | |
| DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space" | |
| def duckduck_websearch(query: str) -> str: | |
| """Allows search through DuckDuckGo. | |
| Args: | |
| query: what you want to search | |
| """ | |
| search = DuckDuckGoSearchResults() | |
| results = search.invoke(query) | |
| return "\n".join(results) | |
| def serper_websearch(query: str) -> str: | |
| """Allows search through Serper. | |
| Args: | |
| query: what you want to search | |
| """ | |
| search = GoogleSerperAPIWrapper(serper_api_key=os.getenv("SERPER_API_KEY")) | |
| results = search.run(query) | |
| return results | |
| def visit_webpage(url: str) -> str: | |
| """Fetches raw HTML content of a web page. | |
| Args: | |
| url: the webpage url | |
| """ | |
| try: | |
| response = requests.get(url, timeout=5) | |
| return response.text[:5000] | |
| except Exception as e: | |
| return f"[ERROR fetching {url}]: {str(e)}" | |
| def wiki_search(query: str) -> str: | |
| """Wiki search tools. | |
| Args: | |
| query: what you want to wiki | |
| """ | |
| api_wrapper = WikipediaAPIWrapper(top_k_results=1, doc_content_chars_max=100) | |
| wikipediatool = WikipediaQueryRun(api_wrapper=api_wrapper) | |
| return wikipediatool.run({"query": query}) | |
| def text_splitter(text: str) -> List[str]: | |
| """Splits text into chunks using LangChain's CharacterTextSplitter. | |
| Args: | |
| text: A string of text to split. | |
| """ | |
| splitter = CharacterTextSplitter(chunk_size=450, chunk_overlap=10) | |
| return splitter.split_text(text) | |
| def youtube_transcript(video_url: str) -> str: | |
| """Fetched youtube transcript | |
| Args: | |
| video_url: YouTube video url | |
| """ | |
| try: | |
| loader = YoutubeLoader.from_youtube_url(video_url) | |
| # video_id = video_url.split("v=")[-1].split("&")[0] | |
| # transcript = YouTubeTranscriptApi.get_transcript(video_id) | |
| return loader.load() | |
| except Exception as e: | |
| return f"Error fetching transcript: {str(e)}" | |
| # 4. File Reading | |
| def read_file(task_id: str) -> str: | |
| """First download the file, then read its content | |
| Args: | |
| dir: the task_id | |
| """ | |
| file_url = f'{DEFAULT_API_URL}/files/{task_id}' | |
| r = requests.get(file_url, timeout=15, allow_redirects=True) | |
| with open('temp', "wb") as fp: | |
| fp.write(r.content) | |
| with open('temp') as f: | |
| return f.read() | |
| def excel_read(task_id: str) -> str: | |
| """First download the excel file, then read its content | |
| Args: | |
| dir: the task_id | |
| """ | |
| try: | |
| file_url = f'{DEFAULT_API_URL}/files/{task_id}' | |
| r = requests.get(file_url, timeout=15, allow_redirects=True) | |
| with open('temp.xlsx', "wb") as fp: | |
| fp.write(r.content) | |
| # Read the Excel file | |
| df = pd.read_excel('temp.xlsx') | |
| # Run various analyses based on the query | |
| result = ( | |
| f"Excel file loaded with {len(df)} rows and {len(df.columns)} columns.\n" | |
| ) | |
| result += f"Columns: {', '.join(df.columns)}\n\n" | |
| # Add summary statistics | |
| result += "Summary statistics:\n" | |
| result += str(df.describe()) | |
| return result | |
| except Exception as e: | |
| return f"Error analyzing Excel file: {str(e)}" | |
| def csv_read(task_id: str) -> str: | |
| """First download the csv file, then read its content | |
| Args: | |
| dir: the task_id | |
| """ | |
| try: | |
| file_url = f'{DEFAULT_API_URL}/files/{task_id}' | |
| r = requests.get(file_url, timeout=15, allow_redirects=True) | |
| with open('temp.csv', "wb") as fp: | |
| fp.write(r.content) | |
| # Read the CSV file | |
| df = pd.read_csv(temp.csv) | |
| # Run various analyses based on the query | |
| result = ( | |
| f"Excel file loaded with {len(df)} rows and {len(df.columns)} columns.\n" | |
| ) | |
| result += f"Columns: {', '.join(df.columns)}\n\n" | |
| # Add summary statistics | |
| result += "Summary statistics:\n" | |
| result += str(df.describe()) | |
| return result | |
| except Exception as e: | |
| return f"Error analyzing CSV file: {str(e)}" | |
| def mp3_listen(task_id: str) -> str: | |
| """First download the mp3 file, then listen to it | |
| Args: | |
| dir: the task_id | |
| """ | |
| file_url = f'{DEFAULT_API_URL}/files/{task_id}' | |
| r = requests.get(file_url, timeout=15, allow_redirects=True) | |
| with open('temp.mp3', "wb") as fp: | |
| fp.write(r.content) | |
| loader = AssemblyAIAudioTranscriptLoader(file_path="temp.mp3", api_key=os.getenv("AssemblyAI_API_KEY")) | |
| docs = loader.load() | |
| contents = [doc.page_content for doc in docs] | |
| return "\n".join(contents) | |
| # 5. Image Open | |
| def image_caption(dir: str) -> str: | |
| """Understand the content of the provided image | |
| Args: | |
| dir: the image url link | |
| """ | |
| loader = ImageCaptionLoader(images=[dir]) | |
| metadata = loader.load() | |
| return metadata[0].page_content | |
| # 2. Coding | |
| from langchain_experimental.tools import PythonREPLTool | |
| def run_python(code: str): | |
| """ Run the given python code | |
| Args: | |
| code: the python code | |
| """ | |
| return PythonREPLTool().run(code) | |
| def multiply(a: float, b: float) -> float: | |
| """Multiply two numbers. | |
| Args: | |
| a: first float | |
| b: second float | |
| """ | |
| return a * b | |
| def add(a: float, b: float) -> float: | |
| """Add two numbers. | |
| Args: | |
| a: first float | |
| b: second float | |
| """ | |
| return a + b | |
| def subtract(a: float, b: float) -> float: | |
| """Subtract two numbers. | |
| Args: | |
| a: first float | |
| b: second float | |
| """ | |
| return a - b | |
| def divide(a: float, b: float) -> float: | |
| """Divide two numbers. | |
| Args: | |
| a: first float | |
| b: second float | |
| """ | |
| if b == 0: | |
| raise ValueError("Cannot divide by zero.") | |
| return a / b | |
| # 3. Multi-Modality | |
| # - multiply: multiply two numbers, A and B | |
| # - add: add two numbers, A and B | |
| # - subtract: Subtract A by B with passing A as the first argument | |
| # - divide: Divide A by B with passing A as the first argument | |
| # You have access to the following tools: | |
| # - serper_websearch: web search the content of the query by passing the query as input with Serper Search Engine | |
| # - duckduck_websearch: web search the content of the query by passing the query as input with DuckDuckGo Search Engine | |
| # - visit_webpage: visit the given webpage url by passing the url as input | |
| # - wiki_search: wiki search the content of the query by passing the query as input if the question asks for wiki search it | |
| # - text_splitter: split text into chunks | |
| # - youtube_transcript: fetch the transcript of the Youtube video by passing the video url as input if the question asks for watching a Youtube video | |
| # - read_file: read the content of the attached file by passing the TASK-ID as input | |
| # - excel_read: read the content of the attached excel file by passing the TASK-ID as input | |
| # - csv_read: read the content of the attached csv file by passing the TASK-ID as input | |
| # - mp3_listen: listen to the content of the attached mp3 file by passing the TASK-ID as input | |
| # - image_caption: understand the visual content of the attached image by passing the TASK-ID as input | |
| # - run_python: run the python code | |
| # ("human", f"Question: {question}\nReport to validate: {final_answer}") | |
| class BasicAgent: | |
| def __init__(self): | |
| self.model = ChatGoogleGenerativeAI( | |
| model="gemini-2.0-flash-lite", | |
| temperature=0, | |
| max_tokens=128, | |
| timeout=None, | |
| max_retries=2, | |
| google_api_key=os.getenv("GEMINI_API_KEY"), | |
| # other params... | |
| ) | |
| # self.model = ChatGroq( | |
| # model="qwen-qwq-32b", | |
| # temperature=0, | |
| # max_tokens=128, | |
| # timeout=None, | |
| # max_retries=2, | |
| # groq_api_key=os.getenv("GROQ_API_KEY") | |
| # # other params... | |
| # ) | |
| # System Prompt for few shot prompting | |
| self.sys_prompt = """" | |
| You are a general AI assistant. I will ask you a question. Report your thoughts, and finish your answer with the following template: | |
| FINAL ANSWER: [YOUR FINAL ANSWER]. | |
| YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separared list of numbers and/or strings. | |
| If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. | |
| If you are asked for a string, don't use articles, neither abbreviations (eg. for cities), and write the digits in plain text unless specified otherwise. | |
| If you are asked for a comma separated list, apply the above rules depending of whether the element to put in the list is a number or a string. | |
| You have access to the following tools: | |
| {tools} | |
| Here are the tools you can use: {tool_names} | |
| If Task ID is included in the question, remember to call the relevant read tools [ie. read_file, excel_read, csv_read, mp3_listen, image_caption] | |
| Note: python_tool is called when the question mentions the term "Python" or any math calculation. | |
| Follow this format in your response: | |
| THOUGHT: [Describe your reasoning here] | |
| ACTION: [Specify the action/tool to use and any relevant input] | |
| OBSERVATIOn: [Result of the action/tool, provided by the system] | |
| FINAL ANSWER: [Provide your final response to the user] | |
| User Input: {input} | |
| {agent_scratchpad} | |
| """ | |
| self.tools = [duckduck_websearch, serper_websearch, visit_webpage, wiki_search, text_splitter, youtube_transcript, read_file, excel_read, csv_read, mp3_listen, image_caption, run_python] | |
| # self.model_with_tools = self.model.bind_tools(self.tools) | |
| # self.sys_msg = SystemMessage(content=self.sys_prompt) | |
| # self.prompt = ChatPromptTemplate.from_messages([ | |
| # ("system", self.sys_prompt), | |
| # ("human", "{input}") | |
| # ]) | |
| self.prompt = PromptTemplate( | |
| input_variables=["input", "tools", "tool_names", "agent_scratchpad"], | |
| template=self.sys_prompt | |
| ) | |
| # self.agent = initialize_agent( | |
| # tools=self.tools, | |
| # llm=self.model, | |
| # agent="zero-shot-react-description", # ReAct agent type | |
| # verbose=True, | |
| # system_prompt=self.prompt, | |
| # handle_parsing_errors="Check your output and make sure it conforms, use the Action/Action Input syntax" | |
| # ) | |
| self.agent = create_react_agent( | |
| llm=self.model, | |
| tools=self.tools, | |
| prompt=self.prompt | |
| ) | |
| self.agent_exe = AgentExecutor(agent=self.agent, tools=self.tools, verbose=True, | |
| handle_parsing_errors="Check your output and make sure it conforms, use the Action/Action Input syntax") | |
| # self.graph = self.__graph_compile__() | |
| print("BasicAgent initialized.") | |
| def __call__(self, task: dict) -> str: | |
| task_id, question, file_name = task["task_id"], task["question"], task["file_name"] | |
| print(f"Agent received question (first 50 chars): {question[:50]}...") | |
| if file_name == "" or file_name is None: | |
| question = question | |
| else: | |
| question = f"{question} with TASK-ID: {task_id}" | |
| # fixed_answer = self.agent.run(f'{question} with TASK-ID: {task_id}') | |
| # fixed_answer = "This is a default answer." | |
| # fixed_answer = self.agent.run(question) | |
| fixed_answer = self.agent_exe.invoke({"input": question}) | |
| # human_message = [HumanMessage(content=question)] | |
| # messages = self.graph.invoke({"messages": human_message}) | |
| # fixed_answer = messages['messages'][-1].content | |
| print(f"Agent returning fixed answer: {fixed_answer}") | |
| time.sleep(60) | |
| return fixed_answer | |
| def __graph_compile__(self): | |
| def assistant(state: MessagesState): | |
| """Assistant Node""" | |
| return {"message": [self.model_with_tools.invoke(state["messages"])]} | |
| builder = StateGraph(MessagesState) | |
| builder.add_node("assistant", assistant) | |
| builder.add_node("tools", ToolNode(self.tools)) | |
| builder.add_edge(START, "assistant") | |
| builder.add_conditional_edges( | |
| "assistant", | |
| # If the latest message (result) from assistant is a tool call -> tools_condition routes to tools | |
| # If the latest message (result) from assistant is a not a tool call -> tools_condition routes to END | |
| tools_condition, | |
| ) | |
| builder.add_edge("tools", "assistant") | |
| # Compile graph | |
| return builder.compile() | |