Commit 2f9e3a2
Parent(s): f4d3755

test first question

Files changed:
- agents/search_agent.py +9 -13
- app.py +5 -1
- graphs/evaluation.py +109 -0
- graphs/question_map.py +11 -0
- graphs/search.py +0 -51
- models/models.py +2 -2
- tools/search.py +5 -4
agents/search_agent.py
CHANGED
@@ -1,4 +1,4 @@
-from graphs.search import build_workflow
+from graphs.evaluation import build_workflow
 from langchain_core.messages import HumanMessage, SystemMessage
 from langfuse.callback import CallbackHandler
 from dotenv import load_dotenv
@@ -11,21 +11,17 @@ class SearchAgent:
     def __call__(self, question: str) -> str:
         print(f"Agent received question (first 50 chars): {question[:50]}...")
         workflow = build_workflow()
-        messages = [SystemMessage("""You are a general AI assistant. I will ask you a question. Report your thoughts, and finish with only the answer. \n
-        YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings.
-        If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise.
-        If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise.
-        If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.""")]
-        messages = messages + [HumanMessage(content=question)]
-        messages = workflow.invoke({
-            "messages": messages
-        }, config={"callbacks": [langfuse_handler]})
+
+        messages = [HumanMessage(content=question)]
+
+        state = workflow.invoke({
+            "messages": messages,
+        }, config={"callbacks": [langfuse_handler]})
+        return state["answer"]
 
-
+if __name__ == "__main__":
     question = "How many studio albums were published by Mercedes Sosa between 2000 and 2009 (included)? You can use the latest 2022 version of english wikipedia."
     agent = SearchAgent()
     submit_answer = agent(question)
 
-print(submit_answer)
+    print(submit_answer)
app.py
CHANGED
@@ -71,7 +71,11 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
             print(f"Skipping item with missing task_id or question: {item}")
             continue
         try:
-            submitted_answer = agent(question_text)
+            submitted_answer = ""
+            if question_text == "":
+                submitted_answer = agent(question_text)
+            else:
+                submitted_answer = "In progress"
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         except Exception as e:
graphs/evaluation.py
ADDED
@@ -0,0 +1,109 @@
+from models.models import groq_model, anthropic_model
+from tools.search import arxiv_search, taivily_search, serper_search
+from langgraph.graph import StateGraph, START, END, MessagesState
+from langchain_core.messages import HumanMessage, SystemMessage
+from typing import List, TypedDict
+from langgraph.prebuilt import ToolNode
+
+
+tools = [
+    taivily_search,
+    serper_search,
+]
+
+class EvaluationState(TypedDict):
+    messages: List
+    tasks: str
+    current_task: str
+    question: str
+    answer: str
+    external_information: str
+    has_enough_information: bool
+
+bound_model_llama = groq_model.bind_tools(tools)
+bound_model_antrhropic = anthropic_model.bind_tools(tools)
+
+def call_node(state: EvaluationState):
+    question = state["messages"][-1].content
+    state["question"] = question
+    response = bound_model_llama.invoke(state["messages"])
+
+    state["messages"].append(response)
+    return state
+
+tool_node = ToolNode(tools)
+
+
+def parse_response(state: EvaluationState):
+    """
+    Parse the response from the model and return the final answer
+    """
+    prompt = f"""I will ask you a question. Report your thoughts, and finish with only YOUR FINAL ANSWER.
+    YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings.
+    If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise.
+    If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise.
+    If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
+    ---question---
+    {state["question"]}
+    ---relevant information---
+    {state["external_information"]}
+    ---answer---
+    """
+
+
+    response = groq_model.invoke(prompt)
+    state["messages"].append(response)
+    state["answer"] = response.content
+    return state
+
+def map_answer(state: EvaluationState):
+    """
+    Map the answer to the final answer
+    """
+    answer = anthropic_model.invoke("Map the answer, I want only the number, string or list. ANSWER:" + state["answer"])
+    print(answer.content)
+    return {
+        "answer": answer.content
+    }
+
+def map_tool_answer(state: EvaluationState):
+    """
+    Map the tool answer to the final answer
+    """
+    last_message = state["messages"][-1]
+    state["external_information"] = last_message.content
+
+    return state
+
+
+def build_workflow():
+    """
+    Build search workflow
+    """
+    workflow = StateGraph(EvaluationState)
+    workflow.add_node("agent", call_node)
+    workflow.add_node("action", tool_node)
+    workflow.add_node("map_tool_answer", map_tool_answer)
+    workflow.add_node("parse_response", parse_response)
+    workflow.add_node("map_answer", map_answer)
+    """ workflow.add_node("action", tool_node)
+    workflow.add_node("answer", parse_response) """
+
+    workflow.add_edge(START, "agent")
+    workflow.add_edge("agent", "action")
+    workflow.add_edge("action", "map_tool_answer")
+    workflow.add_edge("map_tool_answer", "parse_response")
+    workflow.add_edge("parse_response", "map_answer")
+    workflow.add_edge("map_answer", END)
+
+    return workflow.compile()
+
+""" if __name__ == "__main__":
+    question = "How many studio albums were published by Mercedes Sosa between 2000 and 2009 (included)? You can use the latest 2022 version of english wikipedia."
+    # Build the graph
+    graph = build_workflow()
+    # Run the graph
+    messages = [HumanMessage(content=question)]
+    messages = graph.invoke({"messages": messages})
+    for m in messages["messages"]:
+        m.pretty_print() """
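A minimal way to exercise the new evaluation graph on its own, outside SearchAgent. This is a sketch, not part of the commit: it assumes the Groq, Anthropic, Tavily and Serper API keys are loaded via .env (the exact variable names depend on the local setup), and that the model actually emits a tool call, since the agent -> action edge is unconditional.

from dotenv import load_dotenv
from langchain_core.messages import HumanMessage
from graphs.evaluation import build_workflow

load_dotenv()  # API keys for Groq, Anthropic, Tavily and Serper

graph = build_workflow()
# The graph fills state["answer"] in the map_answer node; SearchAgent returns that value.
state = graph.invoke({"messages": [HumanMessage(content="What is the capital of France?")]})
print(state["answer"])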
graphs/question_map.py
ADDED
@@ -0,0 +1,11 @@
+from langchain_core.messages import HumanMessage, SystemMessage
+from models.models import groq_model
+
+def question_map(state: HumanMessage):
+    """
+    This funtion replace the initial question for a one with a detail expected answer.
+    """
+    question = """/ \n Question:""" + state["content"]
+
+
+
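question_map arrives in this commit as a stub: it builds a prompt string but never calls the model or returns anything. Purely as an illustration of where it seems to be heading, a hypothetical completion might look like the following; the prompt wording, the use of groq_model and the HumanMessage return type are all assumptions, not part of the commit.

from langchain_core.messages import HumanMessage
from models.models import groq_model

def question_map(state: HumanMessage):
    """Replace the initial question with one that spells out the expected answer format."""
    # Hypothetical prompt; the committed stub only concatenates the question text.
    prompt = "Rewrite the following question so the expected answer format is explicit.\nQuestion: " + state.content
    rewritten = groq_model.invoke(prompt)
    return HumanMessage(content=rewritten.content)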
graphs/search.py
DELETED
@@ -1,51 +0,0 @@
-from models.models import groq_model, anthropic_model
-from tools.search import arxiv_search, web_search, google_search
-from langgraph.graph import StateGraph, START, END, MessagesState
-from langgraph.prebuilt import ToolNode
-from langchain_core.messages import HumanMessage
-
-tools = [
-    arxiv_search,
-    web_search,
-    google_search,
-]
-
-tool_node = ToolNode(tools)
-#bound_model = groq_model.bind_tools(tools)
-bound_model = anthropic_model.bind_tools(tools)
-# Define the function that calls the model
-def call_model(state: MessagesState):
-    response = bound_model.invoke(state["messages"])
-    # We return a list, because this will get added to the existing list
-    return {"messages": response}
-
-def should_continue(state: MessagesState):
-    last_message = state["messages"][-1]
-
-    if not last_message.tool_calls:
-        return END
-
-    return "action"
-
-def build_workflow():
-    """
-    Build search workflow
-    """
-    workflow = StateGraph(MessagesState)
-    workflow.add_node("agent", call_model)
-    workflow.add_node("action", tool_node)
-
-    workflow.add_edge(START, "agent")
-    workflow.add_conditional_edges("agent", should_continue)
-    workflow.add_edge("action", "agent")
-    return workflow.compile()
-
-""" if __name__ == "__main__":
-    question = "How many studio albums were published by Mercedes Sosa between 2000 and 2009 (included)? You can use the latest 2022 version of english wikipedia."
-    # Build the graph
-    graph = build_workflow()
-    # Run the graph
-    messages = [HumanMessage(content=question)]
-    messages = graph.invoke({"messages": messages})
-    for m in messages["messages"]:
-        m.pretty_print() """
models/models.py
CHANGED
@@ -5,11 +5,11 @@ from dotenv import load_dotenv
 load_dotenv()
 
 anthropic_model = ChatAnthropic(
-    model="claude-3-
+    model="claude-3-5-haiku-latest",
     temperature=0
 )
 
 groq_model = ChatGroq(
-    model="
+    model="qwen-qwq-32b",
     temperature=0
 )
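A quick sanity check for the swapped-in models, as a sketch only: it assumes ANTHROPIC_API_KEY and GROQ_API_KEY are present in the environment, which models.py already loads via load_dotenv() at import time.

from models.models import anthropic_model, groq_model

# Both calls should return a short AIMessage if the keys and model names are valid.
print(anthropic_model.invoke("Reply with the single word: ok").content)
print(groq_model.invoke("Reply with the single word: ok").content)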
tools/search.py
CHANGED
@@ -26,10 +26,11 @@ def wikipedia_search(query: str) -> str:
     return {"wiki_results": formatted_search_docs}
 
 @tool
-def web_search(query: str) -> str:
-    """
+def taivily_search(query: str) -> str:
+    """Tavily is a search engine optimized for LLMs, aimed at efficient, quick and persistent search results. Tavily take care of all the burden of searching, scraping, filtering and extracting the most relevant information from online sources.
     Args:
         query: The search query."""
+
     search_docs = TavilySearchResults(max_results=1).invoke(input=query)
 
     formatted_search_docs = "\n\n---\n\n".join(
@@ -58,12 +59,12 @@ def arxiv_search(query: str) -> str:
     return {"arxiv_results": formatted_search_docs}
 
 @tool
-def google_search(query: str) -> str:
+def serper_search(query: str) -> str:
     """
     Search Google for a query and return maximum 2 result.
     Args: query: The search query.
     """
-    search_docs = GoogleSerperAPIWrapper()
+    search_docs = GoogleSerperAPIWrapper(k=2)
     result = search_docs.run(query)
 
     return {"google_results": result}
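The renamed tools can be smoke-tested directly, since @tool-decorated functions become invokable LangChain tool objects. A sketch under the assumption that the Tavily and Serper keys are available in .env; the query strings are only examples.

from dotenv import load_dotenv
from tools.search import taivily_search, serper_search

load_dotenv()  # TAVILY_API_KEY and SERPER_API_KEY

# BaseTool.invoke() runs the tool with a single string argument.
print(taivily_search.invoke("Mercedes Sosa studio albums 2000 to 2009"))
print(serper_search.invoke("Mercedes Sosa discography"))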