Spaces:

yhzhang3
/

alpha

Sleeping

App Files Files Community

alpha / managers /workflow /workflow_engine.py

yhzhang3

first commit

f580ad3 3 months ago

raw

history blame contribute delete

12.4 kB

	"""
	Workflow Engine Manager for CodeAct Agent.
	Manages the LangGraph workflow execution.
	"""

	import re
	import json
	import datetime
	from typing import Dict, Tuple, List, Any
	from pathlib import Path
	from rich.progress import Progress, SpinnerColumn, TextColumn
	from rich.rule import Rule
	from langchain_core.messages import AIMessage, HumanMessage, BaseMessage
	from langgraph.graph import StateGraph, START, END
	from core.types import AgentState, AgentConfig
	from .plan_manager import PlanManager


	class WorkflowEngine:
	"""Manages the LangGraph workflow execution."""

	def __init__(self, model, config: AgentConfig, console_display, state_manager):
	self.model = model
	self.config = config
	self.console = console_display
	self.state_manager = state_manager
	self.plan_manager = PlanManager()
	self.graph = None
	self.trace_logs = [] # Store all trace logs
	self.message_history = [] # Store all messages

	def setup_workflow(self, generate_func, execute_func, should_continue_func):
	"""Setup the LangGraph workflow with provided functions."""
	workflow = StateGraph(AgentState)

	workflow.add_node("generate", generate_func)
	workflow.add_node("execute", execute_func)

	workflow.add_edge(START, "generate")
	workflow.add_edge("execute", "generate")

	workflow.add_conditional_edges("generate", should_continue_func, {
	"end": END,
	"execute": "execute"
	})

	self.graph = workflow.compile()

	def run_workflow(self, initial_state: Dict) -> Tuple:
	"""Execute the workflow and handle display.

	Returns:
	tuple: (result_content, final_state)
	"""
	# Clear previous traces for new run
	self.trace_logs = []
	self.message_history = []

	# Track if final solution has been provided
	final_solution_provided = False
	previous_plan = None
	displayed_reasoning = set()

	# Stream the workflow execution with monitoring
	self.console.console.print(Rule(title="Execution Steps", style="yellow"))

	with Progress(
	SpinnerColumn(),
	TextColumn("[progress.description]{task.description}"),
	console=self.console.console,
	transient=True
	) as progress:
	task = progress.add_task("Executing agent...", total=None)

	final_state = None
	for s in self.graph.stream(initial_state, stream_mode="values"):
	step_count = s.get("step_count", 0)
	current_plan = s.get("current_plan")
	final_state = s

	progress.update(task, description=f"Step {step_count}")

	message = s["messages"][-1]

	# Serialize and store the message
	serialized_msg = self._serialize_message(message)
	self.message_history.append(serialized_msg)

	# Process different types of messages
	if isinstance(message, AIMessage):
	self._process_ai_message(
	message, step_count, current_plan, previous_plan,
	displayed_reasoning, final_solution_provided
	)
	if current_plan != previous_plan:
	previous_plan = current_plan

	elif "<observation>" in message.content:
	self._process_observation_message(message, step_count)

	result_content = final_state["messages"][-1].content if final_state else ""
	return result_content, final_state

	def _process_ai_message(self, message, step_count, current_plan, previous_plan,
	displayed_reasoning, final_solution_provided):
	"""Process AI message and display appropriate panels."""
	full_content = message.content

	# 1. REASONING: Extract and display agent's thinking
	thinking_content = self._extract_thinking_content(full_content)
	if thinking_content and len(thinking_content) > 20:
	content_hash = hash(thinking_content.strip())
	if content_hash not in displayed_reasoning:
	self.console.print_reasoning(thinking_content, step_count)
	displayed_reasoning.add(content_hash)
	# Add trace entry for reasoning
	self._add_trace_entry("reasoning", step_count, thinking_content)

	# 2. PLAN: Show plan only when it has changed
	if (current_plan and current_plan != previous_plan and
	self.config.verbose and not final_solution_provided):
	self.console.print_plan(current_plan)
	# Add trace entry for plan
	self._add_trace_entry("plan", step_count, current_plan)

	# 3. ACTION & CODE: Handle different action types
	if "<execute>" in full_content and "</execute>" in full_content:
	execute_match = re.search(r"<execute>(.*?)</execute>", full_content, re.DOTALL)
	if execute_match:
	code = execute_match.group(1).strip()
	self.console.print_code_execution(code, step_count)
	# Add trace entry for code execution
	self._add_trace_entry("code_execution", step_count, code)

	elif "<solution>" in full_content and "</solution>" in full_content:
	solution_match = re.search(r"<solution>(.*?)</solution>", full_content, re.DOTALL)
	if solution_match:
	# Update plan to mark all remaining steps as completed
	if current_plan:
	updated_plan = self.plan_manager.update_plan_for_solution(current_plan)
	if updated_plan != current_plan:
	self.console.print_plan(updated_plan)

	solution = solution_match.group(1).strip()
	self.console.print_solution(solution, step_count)
	final_solution_provided = True
	# Add trace entry for solution
	self._add_trace_entry("solution", step_count, solution)

	elif "<error>" in full_content:
	error_match = re.search(r"<error>(.*?)</error>", full_content, re.DOTALL)
	if error_match:
	error_content = error_match.group(1).strip()
	self.console.print_error(error_content, step_count)
	# Add trace entry for error
	self._add_trace_entry("error", step_count, error_content)

	def _process_observation_message(self, message, step_count):
	"""Process observation message and display results."""
	obs_match = re.search(r"<observation>(.*?)</observation>", message.content, re.DOTALL)
	if obs_match:
	observation = obs_match.group(1).strip()
	formatted_output = self._truncate_to_20_rows(observation)
	self.console.print_execution_result(formatted_output, step_count)
	# Add trace entry for observation
	self._add_trace_entry("observation", step_count, observation)

	def _extract_thinking_content(self, content: str) -> str:
	"""Extract thinking content from the message, removing tags and plan information."""
	# Remove specific tags but keep observation content for separate handling
	content = re.sub(r'</?(execute\|solution\|error)>', '', content)

	# Remove plan content (numbered lists with checkboxes)
	plan_pattern = r'\d+\.\s\[[^\]]\]\s[^\n]+(?:\n\d+\.\s\[[^\]]\]\s[^\n]+)*'
	content = re.sub(plan_pattern, '', content).strip()

	# Remove observation blocks entirely
	content = re.sub(r'<observation>.*?</observation>', '', content, flags=re.DOTALL)

	# Clean up extra whitespace and empty lines
	lines = [line.strip() for line in content.split('\n') if line.strip()]
	return '\n'.join(lines)

	def _truncate_to_20_rows(self, text: str) -> str:
	"""Truncate any text output to show only the first 20 rows."""
	lines = text.split('\n')

	if len(lines) > 20:
	truncated = '\n'.join(lines[:20])
	total_lines = len(lines)
	truncated += f"\n\n⚠️ Output truncated to 20 rows. Full output contains {total_lines} rows."
	return truncated

	return text

	def _add_trace_entry(self, step_type: str, step_count: int, content: Any, metadata: Dict = None):
	"""Add an entry to the trace log."""
	entry = {
	"timestamp": datetime.datetime.now().isoformat(),
	"step_count": step_count,
	"step_type": step_type,
	"content": content,
	"metadata": metadata or {}
	}
	self.trace_logs.append(entry)

	def _serialize_message(self, message: BaseMessage) -> Dict:
	"""Serialize a message for saving."""
	if isinstance(message, HumanMessage):
	msg_type = "human"
	elif isinstance(message, AIMessage):
	msg_type = "ai"
	else:
	msg_type = "system"

	return {
	"type": msg_type,
	"content": message.content,
	"timestamp": datetime.datetime.now().isoformat()
	}

	def save_trace_to_file(self, filepath: str = None) -> str:
	"""Save the complete trace log to a JSON file."""
	if filepath is None:
	timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
	filepath = f"agent_trace_{timestamp}.json"

	trace_data = {
	"execution_time": datetime.datetime.now().isoformat(),
	"config": {
	"max_steps": self.config.max_steps,
	"timeout_seconds": self.config.timeout_seconds,
	"verbose": self.config.verbose
	},
	"messages": self.message_history,
	"trace_logs": self.trace_logs
	}

	with open(filepath, 'w', encoding='utf-8') as f:
	json.dump(trace_data, f, indent=2, ensure_ascii=False)

	return filepath

	def generate_summary(self) -> Dict:
	"""Generate a summary of the agent execution."""
	summary = {
	"total_steps": len(self.trace_logs),
	"message_count": len(self.message_history),
	"execution_flow": [],
	"code_executions": [],
	"observations": [],
	"errors": [],
	"final_solution": None
	}

	for entry in self.trace_logs:
	step_info = {
	"step": entry["step_count"],
	"type": entry["step_type"],
	"timestamp": entry["timestamp"]
	}

	if entry["step_type"] == "reasoning":
	summary["execution_flow"].append({
	**step_info,
	"reasoning": entry["content"][:200] + "..." if len(entry["content"]) > 200 else entry["content"]
	})
	elif entry["step_type"] == "code_execution":
	summary["code_executions"].append({
	**step_info,
	"code": entry["content"]
	})
	elif entry["step_type"] == "observation":
	summary["observations"].append({
	**step_info,
	"output": entry["content"][:500] + "..." if len(entry["content"]) > 500 else entry["content"]
	})
	elif entry["step_type"] == "error":
	summary["errors"].append({
	**step_info,
	"error": entry["content"]
	})
	elif entry["step_type"] == "solution":
	summary["final_solution"] = {
	**step_info,
	"solution": entry["content"]
	}

	return summary

	def save_summary_to_file(self, filepath: str = None) -> str:
	"""Save the execution summary to a JSON file."""
	if filepath is None:
	timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
	filepath = f"agent_summary_{timestamp}.json"

	summary = self.generate_summary()
	summary["timestamp"] = datetime.datetime.now().isoformat()

	with open(filepath, 'w', encoding='utf-8') as f:
	json.dump(summary, f, indent=2, ensure_ascii=False)

	return filepath