File size: 10,694 Bytes
2a3616b
 
 
b6088cd
 
 
2a3616b
 
b6088cd
 
 
 
2a3616b
 
b6088cd
2a3616b
 
 
 
b6088cd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2a3616b
b6088cd
 
 
 
 
 
 
 
 
2a3616b
b6088cd
 
 
2a3616b
b6088cd
 
 
2a3616b
b6088cd
 
2a3616b
b6088cd
 
 
 
2a3616b
b6088cd
 
 
2a3616b
b6088cd
 
 
 
2a3616b
b6088cd
 
 
2a3616b
b6088cd
 
 
 
 
 
2a3616b
b6088cd
 
2a3616b
b6088cd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2a3616b
 
 
b6088cd
2a3616b
b6088cd
 
 
 
2a3616b
 
 
b6088cd
 
 
2a3616b
b6088cd
 
 
 
 
 
 
 
 
 
2a3616b
b6088cd
2a3616b
b6088cd
 
2a3616b
 
 
b6088cd
 
 
 
 
2a3616b
b6088cd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2a3616b
b6088cd
 
2a3616b
b6088cd
 
2a3616b
b6088cd
 
 
 
 
 
 
 
 
 
2a3616b
b6088cd
 
 
 
 
 
2a3616b
b6088cd
 
2a3616b
b6088cd
 
 
2a3616b
b6088cd
2a3616b
b6088cd
2a3616b
 
 
b6088cd
 
 
 
 
 
 
 
 
 
 
 
2a3616b
b6088cd
 
 
 
 
 
2a3616b
b6088cd
 
 
2a3616b
b6088cd
2a3616b
b6088cd
2a3616b
b6088cd
 
 
2a3616b
b6088cd
 
 
2a3616b
b6088cd
2a3616b
b6088cd
 
 
 
 
2a3616b
b6088cd
 
2a3616b
b6088cd
 
2a3616b
b6088cd
2a3616b
b6088cd
 
2a3616b
b6088cd
2a3616b
b6088cd
 
2a3616b
b6088cd
 
2a3616b
b6088cd
 
2a3616b
b6088cd
 
 
2a3616b
b6088cd
2a3616b
 
 
b6088cd
 
 
2a3616b
b6088cd
 
 
 
 
2a3616b
b6088cd
2a3616b
b6088cd
2a3616b
b6088cd
2a3616b
b6088cd
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
from collections.abc import Sequence
from typing import Annotated, Literal, TypedDict

from langchain.chat_models import init_chat_model

# Import tools
from langchain_community.tools import DuckDuckGoSearchRun, WikipediaQueryRun
from langchain_community.tools.arxiv import ArxivQueryRun
from langchain_community.tools.pubmed.tool import PubmedQueryRun
from langchain_community.tools.semanticscholar.tool import SemanticScholarQueryRun
from langchain_community.tools.wikidata.tool import WikidataQueryRun
from langchain_community.utilities import WikipediaAPIWrapper
from langchain_core.messages import BaseMessage, HumanMessage, SystemMessage, ToolMessage
from langchain_core.runnables import RunnableConfig
from langchain_core.tools import Tool
from langchain_experimental.utilities import PythonREPL
from langgraph.graph import END, StateGraph
from langgraph.graph.message import add_messages
from pydantic import BaseModel, Field

# Set up tools
python_repl = PythonREPL()
repl_tool = Tool(
    name="python_repl",
    description="A Python shell. Use this to execute python commands. Input should be a valid python command. If you want to see the output of a value, you should print it out with `print(...)`.",
    func=python_repl.run,
)

# Initialize all tools
tools = [
    DuckDuckGoSearchRun(),
    PubmedQueryRun(),
    SemanticScholarQueryRun(),
    ArxivQueryRun(),
    WikidataQueryRun(),
    WikipediaQueryRun(api_wrapper=WikipediaAPIWrapper()),
    repl_tool,
]

# Initialize Gemini model
model = init_chat_model("gemini-2.0-flash", model_provider="google_genai")
model_with_tools = model.bind_tools(tools)

# Create tools lookup
tools_by_name = {tool.name: tool for tool in tools}


# Pydantic models for structured output
class ToolSufficiencyResponse(BaseModel):
    """Response for tool sufficiency check"""

    sufficient: bool = Field(description="Whether the available tools are sufficient to answer the question")
    reasoning: str = Field(description="Brief reasoning for the decision")


class FinalAnswer(BaseModel):
    """Final answer structure"""

    answer: str = Field(description="The comprehensive answer to the user's question")
    confidence: Literal["high", "medium", "low"] = Field(description="Confidence level in the answer")
    sources_used: list[str] = Field(description="List of tools/sources that were used to generate the answer")


# Define graph state
class AgentState(TypedDict):
    """The state of the agent."""

    messages: Annotated[Sequence[BaseMessage], add_messages]
    llm_call_count: int
    max_llm_calls: int


# Node functions
def check_tool_sufficiency(state: AgentState, config: RunnableConfig):
    """Check if available tools are sufficient to answer the question"""

    # Get the user's question
    user_message = None
    for msg in state["messages"]:
        if msg.type == "human":
            user_message = msg.content
            break

    # Create system prompt for sufficiency check
    available_tools_desc = "\n".join([f"- {tool.name}: {tool.description}" for tool in tools])

    system_prompt = f"""You are an AI assistant that needs to determine if the available tools are sufficient to answer a user's question.

Available tools:
{available_tools_desc}

Your task is to analyze the user's question and determine if these tools provide sufficient capability to answer it comprehensively.

Consider:
- Can the question be answered with web search, academic papers, or computational tools?
- Does the question require real-time data, personal information, or capabilities not available through these tools?
- Can you break down the question into parts that these tools can handle?

Be generous in your assessment - if there's a reasonable path to answer the question using these tools, respond with sufficient=True."""

    # Use structured output for sufficiency check
    structured_model = model.with_structured_output(ToolSufficiencyResponse)

    messages = [SystemMessage(content=system_prompt), HumanMessage(content=f"Question to analyze: {user_message}")]

    response = structured_model.invoke(messages, config)

    # Add response to messages for context
    response_message = SystemMessage(
        content=f"Tool sufficiency check: {'Sufficient' if response.sufficient else 'Insufficient'}. Reasoning: {response.reasoning}"
    )

    return {"messages": [response_message], "tool_sufficiency": response.sufficient}


def call_model(state: AgentState, config: RunnableConfig):
    """Call the model (ReAct agent LLM node)"""

    system_prompt = SystemMessage(
        content="""You are a helpful AI assistant with access to various tools. Use the tools available to you to answer the user's question comprehensively.

Think step by step:
1. Analyze what information you need
2. Use appropriate tools to gather that information
3. Synthesize the information to provide a complete answer

Be thorough but efficient with your tool usage."""
    )

    response = model_with_tools.invoke([system_prompt] + state["messages"], config)

    # Increment LLM call count
    new_count = state.get("llm_call_count", 0) + 1

    return {"messages": [response], "llm_call_count": new_count}


def tool_node(state: AgentState):
    """Execute tools based on the last message's tool calls"""
    outputs = []
    last_message = state["messages"][-1]

    for tool_call in last_message.tool_calls:
        try:
            tool_result = tools_by_name[tool_call["name"]].invoke(tool_call["args"])
            outputs.append(
                ToolMessage(
                    content=str(tool_result),
                    name=tool_call["name"],
                    tool_call_id=tool_call["id"],
                )
            )
        except Exception as e:
            outputs.append(
                ToolMessage(
                    content=f"Error executing tool {tool_call['name']}: {str(e)}",
                    name=tool_call["name"],
                    tool_call_id=tool_call["id"],
                )
            )

    return {"messages": outputs}


def final_answer_node(state: AgentState, config: RunnableConfig):
    """Generate final structured answer based on conversation history"""

    system_prompt = SystemMessage(
        content="""You are tasked with providing a final, comprehensive answer based on the conversation history and tool usage.

Analyze all the information gathered from the tools and provide:
1. A clear, comprehensive answer to the original question
2. Your confidence level in this answer
3. The sources/tools that were used

Be honest about limitations and indicate your confidence level appropriately."""
    )

    # Get the original user question
    user_question = None
    for msg in state["messages"]:
        if msg.type == "human":
            user_question = msg.content
            break

    # Create structured output model
    structured_model = model.with_structured_output(FinalAnswer)

    messages = [
        system_prompt,
        HumanMessage(content=f"Original question: {user_question}"),
        SystemMessage(content="Based on the following conversation history, provide your final answer:"),
    ] + state["messages"]

    response = structured_model.invoke(messages, config)

    return {"messages": [SystemMessage(content=f"Final Answer: {response.answer}")], "final_answer": response}


# Edge functions
def should_continue_sufficiency(state: AgentState):
    """Decide whether tools are sufficient"""
    # Check if we have a tool sufficiency result
    for msg in reversed(state["messages"]):
        if "Tool sufficiency check: Sufficient" in msg.content:
            return "sufficient"
        elif "Tool sufficiency check: Insufficient" in msg.content:
            return "insufficient"
    return "insufficient"  # Default to insufficient if unclear


def should_continue_react(state: AgentState):
    """Decide whether to continue with ReAct loop or move to final answer"""
    messages = state["messages"]
    last_message = messages[-1]
    llm_call_count = state.get("llm_call_count", 0)
    max_calls = state.get("max_llm_calls", 4)

    # If we've reached the maximum number of LLM calls, force stop
    if llm_call_count >= max_calls:
        return "final_answer"

    # If there are no tool calls, we're done with ReAct loop
    if not hasattr(last_message, "tool_calls") or not last_message.tool_calls:
        return "final_answer"

    # Otherwise continue with tools
    return "continue"


# Build the graph
def create_react_agent_graph():
    """Create and return the compiled ReAct agent graph"""

    workflow = StateGraph(AgentState)

    # Add nodes
    workflow.add_node("check_sufficiency", check_tool_sufficiency)
    workflow.add_node("agent", call_model)
    workflow.add_node("tools", tool_node)
    workflow.add_node("final_answer", final_answer_node)

    # Set entry point
    workflow.set_entry_point("check_sufficiency")

    # Add conditional edge from sufficiency check
    workflow.add_conditional_edges(
        "check_sufficiency", should_continue_sufficiency, {"sufficient": "agent", "insufficient": END}
    )

    # Add conditional edge from agent
    workflow.add_conditional_edges(
        "agent", should_continue_react, {"continue": "tools", "final_answer": "final_answer"}
    )

    # Add edge from tools back to agent
    workflow.add_edge("tools", "agent")

    # Add edge from final_answer to END
    workflow.add_edge("final_answer", END)

    return workflow.compile()


# Helper function for running the agent
def run_agent(question: str, max_llm_calls: int = 4):
    """Run the ReAct agent with a question"""

    graph = create_react_agent_graph()

    initial_state = {"messages": [HumanMessage(content=question)], "llm_call_count": 0, "max_llm_calls": max_llm_calls}

    # Stream the execution
    print(f"Question: {question}")
    print("=" * 50)

    for step in graph.stream(initial_state):
        for node, output in step.items():
            print(f"\n--- {node.upper()} ---")
            if "messages" in output and output["messages"]:
                for msg in output["messages"]:
                    if hasattr(msg, "content"):
                        print(f"{msg.__class__.__name__}: {msg.content}")
                    elif hasattr(msg, "tool_calls") and msg.tool_calls:
                        print(f"Tool calls: {[tc['name'] for tc in msg.tool_calls]}")

            if "final_answer" in output:
                print("\nFINAL STRUCTURED ANSWER:")
                print(f"Answer: {output['final_answer'].answer}")
                print(f"Confidence: {output['final_answer'].confidence}")
                print(f"Sources: {output['final_answer'].sources_used}")