Spaces:

Blablablab
/

codebook

Paused

App Files Files Community

codebook / potato /coding_agent_runner.py

davidjurgens

Deploy: Potato — Codebook Annotation

aceb1b2 verified 2 days ago

Raw

History Blame Contribute Delete

15.5 kB

	"""
	Coding Agent Runner

	Manages the lifecycle of a coding agent session. Mirrors AgentRunner
	but adapted for terminal-based coding agents (no Playwright).

	State machine: IDLE → RUNNING → PAUSED → COMPLETED → ERROR
	Communication: SSE listener pattern (same as AgentRunner)
	"""

	import json
	import logging
	import os
	import threading
	import time
	import uuid
	from dataclasses import dataclass, field
	from enum import Enum
	from typing import Any, Callable, Dict, List, Optional

	from .coding_agent_backend import (
	CodingAgentBackend,
	CodingAgentEvent,
	CodingAgentEventType,
	create_backend,
	)
	from .coding_agent_branch import BranchManager
	from .coding_agent_checkpoint import CheckpointManager
	from .coding_agent_sandbox import SandboxManager

	logger = logging.getLogger(__name__)


	class CodingAgentState(str, Enum):
	IDLE = "idle"
	RUNNING = "running"
	PAUSED = "paused"
	COMPLETED = "completed"
	ERROR = "error"


	@dataclass
	class CodingAgentConfig:
	"""Configuration for a coding agent session."""
	backend_type: str = "ollama_tool_use"
	ai_config: Dict[str, Any] = field(default_factory=dict)
	working_dir: str = "."
	max_turns: int = 50
	system_prompt: str = ""
	sandbox_mode: str = "worktree"

	@classmethod
	def from_config(cls, config: dict) -> "CodingAgentConfig":
	"""Create from YAML config dict."""
	live_config = config.get("live_coding_agent", {})
	return cls(
	backend_type=live_config.get("backend_type", "ollama_tool_use"),
	ai_config=live_config.get("ai_config", {}),
	working_dir=live_config.get("working_dir", "."),
	max_turns=live_config.get("max_turns", 50),
	system_prompt=live_config.get("system_prompt", ""),
	sandbox_mode=live_config.get("sandbox_mode", "worktree"),
	)


	class CodingAgentRunner:
	"""Manages a coding agent session with SSE event broadcasting."""

	def __init__(self, session_id: str, config: CodingAgentConfig,
	trace_dir: str = ""):
	self.session_id = session_id
	self.config = config
	self.trace_dir = trace_dir

	self._state = CodingAgentState.IDLE
	self._state_lock = threading.Lock()
	self._listeners: List[Callable] = []
	self._listener_lock = threading.Lock()

	self._backend: Optional[CodingAgentBackend] = None
	self._sandbox: Optional[SandboxManager] = None
	self._checkpoint_mgr: Optional[CheckpointManager] = None
	self._branch_mgr: Optional[BranchManager] = None
	self._structured_turns: List[Dict] = []
	self._task_description = ""
	self._started_at = 0.0
	self._event_thread: Optional[threading.Thread] = None

	@property
	def state(self) -> CodingAgentState:
	with self._state_lock:
	return self._state

	def _set_state(self, new_state: CodingAgentState):
	with self._state_lock:
	old = self._state
	self._state = new_state
	self._emit_event("state_change", {"old_state": old.value, "new_state": new_state.value})

	# --- Listener/SSE pattern (mirrors AgentRunner) ---

	def add_listener(self, callback: Callable) -> None:
	with self._listener_lock:
	self._listeners.append(callback)

	def remove_listener(self, callback: Callable) -> None:
	with self._listener_lock:
	self._listeners = [l for l in self._listeners if l is not callback]

	def _emit_event(self, event_type: str, data: dict):
	with self._listener_lock:
	for listener in self._listeners:
	try:
	listener(event_type, data)
	except Exception:
	pass

	# --- Control methods ---

	def start(self, task_description: str) -> None:
	"""Start the coding agent session."""
	if self.state != CodingAgentState.IDLE:
	raise RuntimeError(f"Cannot start in state {self.state}")

	self._task_description = task_description
	self._started_at = time.time()
	self._structured_turns = []

	# Create sandbox
	self._sandbox = SandboxManager(
	mode=self.config.sandbox_mode,
	base_dir=os.path.abspath(self.config.working_dir),
	)
	working_dir = self._sandbox.create(self.session_id)

	# Initialize checkpoint and branch managers
	self._checkpoint_mgr = CheckpointManager(working_dir, self.session_id)
	self._checkpoint_mgr.init()
	self._branch_mgr = BranchManager(self.session_id, working_dir)

	# Create backend
	backend_config = {
	"ai_config": self.config.ai_config,
	"max_turns": self.config.max_turns,
	}
	self._backend = create_backend(self.config.backend_type, backend_config)

	# Start the backend
	self._backend.start(task_description, working_dir, self.config.system_prompt)
	self._set_state(CodingAgentState.RUNNING)

	# Start event consumer thread
	self._event_thread = threading.Thread(target=self._consume_events, daemon=True)
	self._event_thread.start()

	self._emit_event("started", {
	"session_id": self.session_id,
	"task": task_description,
	"backend": self.config.backend_type,
	})

	def pause(self) -> None:
	if self._backend:
	self._backend.pause()
	self._set_state(CodingAgentState.PAUSED)

	def resume(self) -> None:
	if self._backend:
	self._backend.resume()
	self._set_state(CodingAgentState.RUNNING)

	def inject_instruction(self, instruction: str) -> None:
	if self._backend:
	self._backend.inject_instruction(instruction)
	self._emit_event("instruction_received", {"instruction": instruction})

	def stop(self) -> None:
	if self._backend:
	self._backend.stop()
	self._set_state(CodingAgentState.COMPLETED)
	self._save_trace()

	# --- Event consumption ---

	def _consume_events(self):
	"""Consume events from the backend and broadcast via SSE."""
	if not self._backend:
	return

	current_turn: Optional[Dict] = None

	try:
	for event in self._backend.get_events():
	et = event.event_type
	data = event.data

	if et == CodingAgentEventType.THINKING:
	self._emit_event("thinking", data)

	elif et == CodingAgentEventType.TOOL_CALL_START:
	self._emit_event("tool_call_start", data)

	elif et == CodingAgentEventType.TOOL_CALL_END:
	self._emit_event("tool_call", data)

	# Create checkpoint for file-modifying tools
	tool_name = data.get("tool", "")
	if tool_name.lower() in ("edit", "write", "bash", "create", "replace"):
	turn_idx = data.get("turn_index", len(self._structured_turns))
	if self._checkpoint_mgr:
	cp_id = self._checkpoint_mgr.create_checkpoint(
	turn_idx, tool_name,
	f"{tool_name} at step {turn_idx}",
	)
	if cp_id:
	self._emit_event("checkpoint", {
	"step_index": turn_idx,
	"checkpoint_id": cp_id,
	"tool": tool_name,
	})

	elif et == CodingAgentEventType.TURN_END:
	# Accumulate into structured_turns
	turn = {
	"role": "assistant",
	"content": data.get("content", ""),
	"tool_calls": data.get("tool_calls", []),
	}
	self._structured_turns.append(turn)
	self._emit_event("turn_end", {
	"turn_index": data.get("turn_index", len(self._structured_turns) - 1),
	**turn,
	})

	elif et == CodingAgentEventType.ERROR:
	self._set_state(CodingAgentState.ERROR)
	self._emit_event("error", data)

	elif et == CodingAgentEventType.COMPLETE:
	self._set_state(CodingAgentState.COMPLETED)
	self._emit_event("complete", {
	"total_turns": len(self._structured_turns),
	})
	self._save_trace()

	except Exception as e:
	logger.exception("Error consuming backend events")
	self._set_state(CodingAgentState.ERROR)
	self._emit_event("error", {"message": str(e)})

	# --- Checkpoint + Rollback ---

	def rollback_to_step(self, step_index: int) -> bool:
	"""Rollback files and conversation to the given step.

	Pauses the agent, restores files, truncates history.
	Returns True on success.
	"""
	if self._backend:
	self._backend.pause()
	self._set_state(CodingAgentState.PAUSED)

	# Rollback files
	if self._checkpoint_mgr:
	if not self._checkpoint_mgr.rollback_to(step_index):
	return False

	# Truncate structured turns
	self._structured_turns = self._structured_turns[:step_index + 1]

	# Truncate backend conversation history
	if self._backend:
	self._backend.truncate_history(step_index + 1)

	self._emit_event("rollback", {
	"step_index": step_index,
	"remaining_turns": len(self._structured_turns),
	})
	return True

	def get_checkpoints(self) -> List[dict]:
	"""Return list of checkpoint metadata."""
	if self._checkpoint_mgr:
	return self._checkpoint_mgr.list_checkpoints()
	return []

	def replay_from_step(self, step_index: int,
	instructions: Optional[str] = None,
	edited_actions: Optional[List[Dict]] = None) -> Optional[str]:
	"""Create a new branch from step_index and resume the agent.

	Args:
	step_index: Step to branch from
	instructions: Optional new instructions to inject
	edited_actions: Optional modified tool calls to execute first

	Returns:
	The new branch_id, or None on failure.
	"""
	# Pause current execution
	if self._backend:
	self._backend.pause()
	self._set_state(CodingAgentState.PAUSED)

	# Create a new branch
	if not self._branch_mgr:
	return None

	active_id = self._branch_mgr.active_branch_id
	try:
	branch = self._branch_mgr.create_branch(
	active_id, step_index,
	instructions=instructions,
	edited_actions=edited_actions,
	)
	except Exception as e:
	logger.error(f"Failed to create branch: {e}")
	return None

	# Rollback files to the branch point
	if self._checkpoint_mgr:
	self._checkpoint_mgr.rollback_to(step_index)

	# Truncate structured turns and backend history
	self._structured_turns = list(branch.turns)
	if self._backend:
	self._backend.truncate_history(step_index + 1)

	# Execute edited actions if provided
	if edited_actions:
	from .coding_agent_backend import execute_tool
	working_dir = self._sandbox.working_dir if self._sandbox else self.config.working_dir
	for action in edited_actions:
	tool_name = action.get("tool", "")
	tool_input = action.get("input", {})
	output = execute_tool(tool_name, tool_input, working_dir)
	action["output"] = output

	# Inject instructions if provided
	if instructions and self._backend:
	self._backend.inject_instruction(instructions)

	# Resume the agent
	if self._backend:
	self._backend.resume()
	self._set_state(CodingAgentState.RUNNING)

	self._emit_event("branch_created", {
	"branch_id": branch.branch_id,
	"parent_branch": active_id,
	"branch_point": step_index,
	"instructions": instructions,
	})

	return branch.branch_id

	def get_branches(self) -> List[dict]:
	"""List all branches."""
	if self._branch_mgr:
	return self._branch_mgr.list_branches()
	return []

	def switch_branch(self, branch_id: str) -> bool:
	"""Switch to a different branch."""
	if not self._branch_mgr:
	return False
	if self._branch_mgr.switch_branch(branch_id):
	branch = self._branch_mgr.get_branch(branch_id)
	if branch:
	self._structured_turns = list(branch.turns)
	return True
	return False

	def get_diff_since_step(self, step_index: int) -> str:
	"""Get diff from a step to current state."""
	if self._checkpoint_mgr:
	return self._checkpoint_mgr.get_diff_since(step_index)
	return ""

	# --- Trace export ---

	def get_trace(self) -> Dict[str, Any]:
	"""Get the full trace in CodingTraceDisplay format."""
	trace = {
	"session_id": self.session_id,
	"task_description": self._task_description,
	"structured_turns": list(self._structured_turns),
	"backend": self.config.backend_type,
	"model": self.config.ai_config.get("model", ""),
	"started_at": self._started_at,
	"sandbox_mode": self.config.sandbox_mode,
	}
	# Include branches if any were created
	if self._branch_mgr and len(self._branch_mgr.list_branches()) > 1:
	trace["branches"] = self._branch_mgr.save_all()
	# Include checkpoints
	if self._checkpoint_mgr:
	trace["checkpoints"] = self._checkpoint_mgr.list_checkpoints()
	return trace

	def get_structured_turns(self) -> List[Dict]:
	return list(self._structured_turns)

	def get_state_summary(self) -> Dict[str, Any]:
	return {
	"session_id": self.session_id,
	"state": self.state.value,
	"task": self._task_description,
	"turns": len(self._structured_turns),
	"backend": self.config.backend_type,
	}

	def _save_trace(self):
	"""Save trace to disk."""
	if not self.trace_dir:
	return

	os.makedirs(self.trace_dir, exist_ok=True)
	trace_path = os.path.join(self.trace_dir, "trace.json")
	try:
	with open(trace_path, "w", encoding="utf-8") as f:
	json.dump(self.get_trace(), f, indent=2, ensure_ascii=False)
	logger.info(f"Saved coding agent trace to {trace_path}")
	except Exception as e:
	logger.error(f"Failed to save trace: {e}")

	# --- Cleanup ---

	def cleanup(self):
	"""Clean up resources."""
	if self._backend:
	try:
	self._backend.stop()
	except Exception:
	pass
	if self._sandbox:
	try:
	self._sandbox.cleanup()
	except Exception:
	pass