"""
LangGraph workflow implementation for the RAG Q&A Agent.
Defines the agent graph with plan, retrieve, answer, and reflect nodes.
"""
| from typing import TypedDict, Annotated, Dict, Any, List | |
| from langgraph.graph import StateGraph, END | |
| from rag_pipeline import RAGPipeline | |
| from llm_utils import LLMHandler | |
| from reflection import ReflectionEvaluator | |
| import operator | |
# Define the agent state
class AgentState(TypedDict):
    """State passed between nodes in the agent workflow."""
    # Original user question being processed.
    query: str
    # Raw planner-LLM response (reasoning + retrieval decision text).
    plan: str
    # Whether the plan node decided to run the retrieve node.
    needs_retrieval: bool
    # Concatenated context text returned by the RAG pipeline.
    retrieved_context: str
    # Raw chunk records from retrieval; each has at least a 'content' key.
    retrieved_chunks: List[Dict[str, Any]]
    # Latest answer produced by the answer node.
    answer: str
    # Evaluation result from the reflection evaluator
    # (expected keys include 'recommendation' and 'reasoning' — confirm in reflection.py).
    reflection: Dict[str, Any]
    # Answer accepted as the final output of the workflow.
    final_response: str
    # Number of regeneration attempts performed so far.
    iteration: int
class RAGAgent:
    """LangGraph-based RAG Q&A Agent with reflection.

    Workflow: plan -> (retrieve ->) answer -> reflect, where reflect may
    loop back to answer for up to ``max_iterations`` regeneration attempts.

    NOTE: all state mutations happen inside graph *nodes*. Conditional-edge
    functions (``should_retrieve``, ``should_regenerate``) are pure readers,
    because LangGraph does not persist state changes made in edge callbacks.
    """

    def __init__(
        self,
        rag_pipeline: RAGPipeline,
        llm_handler: LLMHandler,
        reflection_evaluator: ReflectionEvaluator,
        max_iterations: int = 2
    ):
        """
        Initialize the RAG agent.

        Args:
            rag_pipeline: RAG pipeline for retrieval
            llm_handler: LLM handler for generation
            reflection_evaluator: Reflection evaluator
            max_iterations: Maximum reflection iterations
        """
        self.rag_pipeline = rag_pipeline
        self.llm_handler = llm_handler
        self.reflection_evaluator = reflection_evaluator
        self.max_iterations = max_iterations
        # Build the graph once; the compiled graph is reusable across queries.
        self.graph = self._build_graph()
        print("✓ RAG Agent workflow initialized")

    def _build_graph(self):
        """Build and compile the LangGraph workflow.

        Returns:
            The compiled graph, ready for ``.invoke``.
        """
        workflow = StateGraph(AgentState)

        # Nodes
        workflow.add_node("plan", self.plan_node)
        workflow.add_node("retrieve", self.retrieve_node)
        workflow.add_node("answer", self.answer_node)
        workflow.add_node("reflect", self.reflect_node)

        # Entry point
        workflow.set_entry_point("plan")

        # Plan -> Retrieve or Answer, depending on the planner's decision.
        workflow.add_conditional_edges(
            "plan",
            self.should_retrieve,
            {
                True: "retrieve",
                False: "answer"
            }
        )

        # Retrieve -> Answer
        workflow.add_edge("retrieve", "answer")

        # Answer -> Reflect
        workflow.add_edge("answer", "reflect")

        # Reflect -> End or Answer (for regeneration). The routing decision
        # is computed inside reflect_node and stored in the reflection dict.
        workflow.add_conditional_edges(
            "reflect",
            self.should_regenerate,
            {
                "accept": END,
                "regenerate": "answer",
                "end": END
            }
        )

        return workflow.compile()

    @staticmethod
    def _parse_needs_retrieval(plan_response: str) -> bool:
        """Parse the NEEDS_RETRIEVAL flag out of the planner's response.

        Args:
            plan_response: Raw LLM planning response.

        Returns:
            True when the planner answered YES, or when the marker is
            missing/malformed (retrieving is the safer default).
        """
        upper = plan_response.upper()
        marker = "NEEDS_RETRIEVAL:"
        if marker not in upper:
            return True
        # Only inspect the remainder of the marker's own line; split("\n")[0]
        # is safe even when nothing follows the marker.
        first_line = upper.split(marker, 1)[1].split("\n")[0]
        return "YES" in first_line

    def plan_node(self, state: AgentState) -> AgentState:
        """
        Planning node: Analyze query and decide if retrieval is needed.

        Args:
            state: Current agent state

        Returns:
            Updated state with plan, needs_retrieval, and iteration reset
        """
        print("\n" + "="*60)
        print("📋 NODE: PLAN")
        print("="*60 + "\n")
        query = state["query"]
        print(f"Query: {query}\n")

        # Use LLM to analyze query and create a plan
        planning_prompt = f"""Analyze the following user query and determine if it requires retrieving information from a knowledge base.
User Query: "{query}"
Consider:
1. Is this a factual question that would benefit from specific documentation or knowledge?
2. Is this a general question that can be answered without specific context?
3. Does this query ask about specific concepts, technologies, or topics?
Respond in the following format:
NEEDS_RETRIEVAL: [YES/NO]
REASONING: [Brief explanation]
PLAN: [How you will approach answering this query]"""
        system_message = "You are a query planning agent. Analyze queries and determine the best approach to answer them."

        plan_response = self.llm_handler.generate(
            planning_prompt,
            system_message
        )

        needs_retrieval = self._parse_needs_retrieval(plan_response)

        print(f"Plan Response:\n{plan_response}\n")
        print(f"Needs Retrieval: {needs_retrieval}")

        state["plan"] = plan_response
        state["needs_retrieval"] = needs_retrieval
        state["iteration"] = 0
        print("\n" + "="*60 + "\n")
        return state

    def should_retrieve(self, state: AgentState) -> bool:
        """Conditional edge: Determine if retrieval is needed (pure read)."""
        return state["needs_retrieval"]

    def retrieve_node(self, state: AgentState) -> AgentState:
        """
        Retrieval node: Retrieve relevant context from vector store.

        Args:
            state: Current agent state

        Returns:
            Updated state with retrieved context and chunks
        """
        print("\n" + "="*60)
        print("🔍 NODE: RETRIEVE")
        print("="*60 + "\n")
        query = state["query"]

        context, chunks = self.rag_pipeline.retrieve_context(query, top_k=3)
        print(f"Retrieved {len(chunks)} relevant chunks\n")

        # Display a short preview of each retrieved chunk.
        for i, chunk in enumerate(chunks):
            preview = chunk['content'][:150] + "..." if len(chunk['content']) > 150 else chunk['content']
            print(f"Chunk {i+1} Preview: {preview}\n")

        state["retrieved_context"] = context
        state["retrieved_chunks"] = chunks
        print("="*60 + "\n")
        return state

    def answer_node(self, state: AgentState) -> AgentState:
        """
        Answer generation node: Generate answer using LLM.

        Uses retrieved context when available; on a regeneration pass the
        reflection feedback is folded into the prompt.

        Args:
            state: Current agent state

        Returns:
            Updated state with generated answer
        """
        print("\n" + "="*60)
        print("💬 NODE: ANSWER")
        print("="*60 + "\n")
        query = state["query"]
        iteration = state.get("iteration", 0)
        if iteration > 0:
            print(f"[Regeneration attempt {iteration}]\n")

        if state.get("retrieved_context"):
            context = state["retrieved_context"]
            if iteration > 0 and state.get("reflection"):
                # Regeneration: include the evaluator's critique. .get guards
                # against a reflection result missing the 'reasoning' key.
                feedback = state["reflection"].get("reasoning", "")
                answer = self._generate_answer_with_feedback(query, context, feedback)
            else:
                answer = self.llm_handler.generate_with_context(
                    query,
                    context,
                    system_message="You are a helpful AI assistant. Answer questions accurately based on the provided context."
                )
        else:
            # No retrieved context: answer directly.
            answer = self.llm_handler.generate(
                query,
                system_message="You are a helpful AI assistant. Answer questions concisely and accurately."
            )

        print(f"Generated Answer:\n{answer}\n")
        state["answer"] = answer
        print("="*60 + "\n")
        return state

    def _generate_answer_with_feedback(
        self,
        query: str,
        context: str,
        feedback: str
    ) -> str:
        """
        Generate answer incorporating feedback from reflection.

        Args:
            query: User query
            context: Retrieved context
            feedback: Feedback from reflection

        Returns:
            Regenerated answer
        """
        prompt = f"""The previous answer was not satisfactory. Here's the feedback:
{feedback}
Now, please generate a better answer to the following question using the context provided.
Context:
{context}
Question: {query}
Provide a comprehensive, accurate, and relevant answer that addresses the feedback."""
        system_message = "You are a helpful AI assistant. Learn from feedback and provide improved answers."
        return self.llm_handler.generate(prompt, system_message)

    def reflect_node(self, state: AgentState) -> AgentState:
        """
        Reflection node: Evaluate answer quality and decide the next step.

        The routing decision ('accept' / 'regenerate' / 'end') is computed
        HERE and stored in the reflection dict, because state mutations in
        conditional-edge callbacks are not persisted by LangGraph. The
        iteration counter is also bumped here when regenerating.

        Args:
            state: Current agent state

        Returns:
            Updated state with reflection results (and final_response when done)
        """
        print("\n" + "="*60)
        print("🤔 NODE: REFLECT")
        print("="*60 + "\n")
        query = state["query"]
        answer = state["answer"]
        context = state.get("retrieved_context", "")
        chunks = state.get("retrieved_chunks", [])

        reflection_result = self.reflection_evaluator.evaluate(
            query,
            answer,
            context,
            chunks
        )

        iteration = state.get("iteration", 0)
        recommendation = reflection_result.get("recommendation", "ACCEPT")

        if recommendation == "ACCEPT":
            decision = "accept"
        elif recommendation == "REJECT" and iteration < self.max_iterations:
            decision = "regenerate"
        else:
            # Rejected at the iteration cap, or partial relevance: stop here.
            decision = "end"

        reflection_result["decision"] = decision
        state["reflection"] = reflection_result

        if decision == "regenerate":
            state["iteration"] = iteration + 1
            print(f"\n⚠️ Answer rejected. Regenerating (iteration {state['iteration']})...\n")
        else:
            state["final_response"] = answer

        return state

    def should_regenerate(self, state: AgentState) -> str:
        """
        Conditional edge: Route based on the decision made in reflect_node.

        Pure read — no state mutation (edge callbacks cannot persist changes).

        Args:
            state: Current agent state

        Returns:
            'accept', 'regenerate', or 'end'
        """
        return state["reflection"].get("decision", "end")

    def query(self, question: str) -> Dict[str, Any]:
        """
        Process a query through the agent workflow.

        Args:
            question: User question

        Returns:
            Complete agent response with all state information
        """
        print("\n" + "="*70)
        print(" "*20 + "🤖 RAG Q&A AGENT 🤖")
        print("="*70 + "\n")
        print(f"User Query: {question}")
        print("="*70)

        # Initialize state
        initial_state = AgentState(
            query=question,
            plan="",
            needs_retrieval=True,
            retrieved_context="",
            retrieved_chunks=[],
            answer="",
            reflection={},
            final_response="",
            iteration=0
        )

        # Run the graph
        final_state = self.graph.invoke(initial_state)

        # Print final result; fall back to the last answer if the graph
        # somehow ended without setting final_response.
        print("\n" + "="*70)
        print("✅ FINAL RESPONSE")
        print("="*70 + "\n")
        print(final_state.get("final_response") or final_state.get("answer", ""))
        print("\n" + "="*70 + "\n")

        return final_state
def create_rag_agent(
    rag_pipeline: RAGPipeline,
    llm_handler: LLMHandler,
    reflection_evaluator: ReflectionEvaluator,
    max_iterations: int = 2
) -> RAGAgent:
    """Factory helper: build a ready-to-use RAG agent.

    Simply forwards its arguments to ``RAGAgent.__init__``.

    Args:
        rag_pipeline: RAG pipeline used for context retrieval.
        llm_handler: LLM handler used for generation.
        reflection_evaluator: Evaluator that scores generated answers.
        max_iterations: Cap on reflection/regeneration passes.

    Returns:
        A constructed ``RAGAgent`` instance.
    """
    agent = RAGAgent(
        rag_pipeline=rag_pipeline,
        llm_handler=llm_handler,
        reflection_evaluator=reflection_evaluator,
        max_iterations=max_iterations,
    )
    return agent