Spaces:

ZENLLC
/

Orchestrator

Sleeping

App Files Files Community

Orchestrator / core /sim.py

ZENLLC

Create sim.py

9c9380f verified 24 days ago

raw

history blame contribute delete

30.9 kB

	import math
	import random
	from dataclasses import dataclass, field, asdict
	from typing import Dict, List, Tuple, Optional, Any

	import numpy as np
	from PIL import Image

	from .config import SimConfig, DEFAULT_MODEL_RATES
	from .events import EventStore
	from .pricing import cost_from_tokens
	from .ledger import Ledger
	from .tasks import TaskSystem, Task

	# -----------------------------
	# Arena settings (same vibe)
	# -----------------------------
	# Arena size in tiles (columns, rows).
	GRID_W, GRID_H = 29, 19
	# Edge length of one tile in the SVG map, in pixels.
	TILE = 24
	# Height in pixels of the HUD banner drawn above the tile grid.
	HUD_H = 64
	# Overall SVG canvas size: the grid plus the HUD strip on top.
	SVG_W = GRID_W * TILE
	SVG_H = GRID_H * TILE + HUD_H

	# Pixel size of the first-person image produced by raycast_pov.
	VIEW_W, VIEW_H = 560, 315
	# Field of view in degrees, shared by the raycaster and within_fov.
	FOV_DEG = 74
	# Maximum distance (in tiles) a ray is marched before giving up.
	MAX_DEPTH = 22

	# Unit steps and heading angles, both indexed by an agent's `ori` (0..3).
	DIRS = [(1, 0), (0, 1), (-1, 0), (0, -1)]
	ORI_DEG = [0, 90, 180, 270]

	# Tile codes stored in the grid.
	EMPTY = 0
	WALL = 1
	WORK = 2 # "work nodes" (tickets/customers)
	RISK = 3 # hazards/risks
	INCIDENT = 4 # urgent incident hotspots
	GATE = 5

	# Colours for the SVG map: background, grid lines, then one per tile code.
	COL_BG = "#0b1020"
	COL_GRIDLINE = "#121a3b"
	COL_WALL = "#cdd2e6"
	COL_EMPTY = "#19214a"
	COL_WORK = "#9ab0ff"
	COL_RISK = "#ff3b3b"
	COL_INC = "#ffd17a"
	COL_GATE = "#7ad9ff"

	# Per-agent colour, keyed by agent name; used by both renderers.
	AGENT_COLORS = {
	"Planner": "#7ad9ff",
	"Worker1": "#6dffb0",
	"Worker2": "#ffd17a",
	"Reviewer": "#ff7ad9",
	"Ops": "#ff6d6d",
	}

	def clamp(v, lo, hi):
	    """Return ``v`` limited to the range ``[lo, hi]``.

	    The lower bound is tested first, so ``lo`` is returned whenever
	    ``v < lo`` even if the bounds are passed in inverted order.
	    """
	    if v < lo:
	        return lo
	    if v > hi:
	        return hi
	    return v

	def in_bounds(x: int, y: int) -> bool:
	    """Tell whether tile ``(x, y)`` lies inside the ``GRID_W`` x ``GRID_H`` arena."""
	    column_ok = 0 <= x < GRID_W
	    row_ok = 0 <= y < GRID_H
	    return column_ok and row_ok

	def manhattan(a: Tuple[int, int], b: Tuple[int, int]) -> int:
	    """Return the taxicab (L1) distance between points ``a`` and ``b``."""
	    horizontal = a[0] - b[0]
	    vertical = a[1] - b[1]
	    return abs(horizontal) + abs(vertical)

	def rng(seed: int) -> random.Random:
	    """Create an independent ``random.Random`` seeded with the low 32 bits of ``seed``."""
	    return random.Random(seed & 0xFFFFFFFF)

	def base_border_grid() -> List[List[int]]:
	    """Build a fresh ``GRID_H`` x ``GRID_W`` grid of EMPTY tiles ringed by WALL tiles.

	    The grid is indexed ``grid[y][x]``; each row is a distinct list.
	    """
	    last_row = GRID_H - 1
	    last_col = GRID_W - 1
	    return [
	        [
	            WALL if (row in (0, last_row) or col in (0, last_col)) else EMPTY
	            for col in range(GRID_W)
	        ]
	        for row in range(GRID_H)
	    ]

	def carve_office(seed: int) -> List[List[int]]:
	    """Generate the office layout for ``seed``.

	    Starting from a walled border, the passes run in this order: scatter
	    inner walls, punch corridors back to EMPTY, turn some walls into gates,
	    then turn some empty tiles into work nodes and risk nodes. The result
	    is fully determined by ``seed``.
	    """
	    dice = rng(seed)
	    layout = base_border_grid()

	    def random_cell(margin: int) -> Tuple[int, int]:
	        # Column is always drawn before row so the random stream is
	        # consumed in a fixed order.
	        col = dice.randint(margin, GRID_W - 1 - margin)
	        row = dice.randint(margin, GRID_H - 1 - margin)
	        return col, row

	    # Inner walls (rooms): 70 attempts, each placed with probability 0.70.
	    for _ in range(70):
	        col, row = random_cell(2)
	        if dice.random() < 0.70:
	            layout[row][col] = WALL

	    # Corridors: unconditionally clear 120 random interior cells.
	    for _ in range(120):
	        col, row = random_cell(1)
	        layout[row][col] = EMPTY

	    # (attempts, margin, tile that must be present, tile written instead)
	    conversions = (
	        (6, 3, WALL, GATE),     # gates (secure doors)
	        (16, 2, EMPTY, WORK),   # work nodes
	        (10, 2, EMPTY, RISK),   # risk nodes
	    )
	    for attempts, margin, required, replacement in conversions:
	        for _ in range(attempts):
	            col, row = random_cell(margin)
	            if layout[row][col] == required:
	                layout[row][col] = replacement

	    return layout

	def is_blocking(tile: int) -> bool:
	    """Tell whether ``tile`` stops movement; only WALL tiles do."""
	    if tile == WALL:
	        return True
	    return False

	def neighbors4(x: int, y: int) -> List[Tuple[int, int]]:
	    """List the four axis-aligned neighbours of ``(x, y)``.

	    Order is +x, +y, -x, -y. No bounds checking is done here.
	    """
	    offsets = ((1, 0), (0, 1), (-1, 0), (0, -1))
	    return [(x + step_x, y + step_y) for step_x, step_y in offsets]

	def bfs_next_step(grid: List[List[int]], start: Tuple[int, int], goal: Tuple[int, int]) -> Optional[Tuple[int, int]]:
	    """Return the first tile to step onto along a shortest path to ``goal``.

	    A breadth-first search runs over 4-connected tiles, skipping
	    out-of-bounds cells and tiles for which ``is_blocking`` is true.

	    Args:
	        grid: Tile grid indexed ``grid[y][x]``.
	        start: Current ``(x, y)`` position.
	        goal: Target ``(x, y)`` position.

	    Returns:
	        The ``(x, y)`` tile adjacent to ``start`` on a shortest path, or
	        ``None`` when ``start == goal`` or the goal cannot be reached.
	    """
	    # Local import: a deque gives O(1) pops from the front of the queue,
	    # where list.pop(0) shifts every remaining element.
	    from collections import deque

	    if start == goal:
	        return None

	    sx, sy = start
	    gx, gy = goal
	    target = (gx, gy)

	    frontier = deque([(sx, sy)])
	    # Maps each discovered cell to the cell it was reached from.
	    prev = {start: None}
	    while frontier:
	        cell = frontier.popleft()
	        if cell == target:
	            break
	        for nxt in neighbors4(cell[0], cell[1]):
	            if not in_bounds(nxt[0], nxt[1]):
	                continue
	            if is_blocking(grid[nxt[1]][nxt[0]]):
	                continue
	            if nxt not in prev:
	                prev[nxt] = cell
	                frontier.append(nxt)

	    if target not in prev:
	        return None

	    # Walk back from the goal until the cell whose predecessor is the start.
	    cur = target
	    while prev[cur] != start and prev[cur] is not None:
	        cur = prev[cur]
	    return cur

	def face_towards(ori: int, ax: int, ay: int, tx: int, ty: int) -> int:
	    """Pick the orientation index (0..3) that points from ``(ax, ay)`` to ``(tx, ty)``.

	    The horizontal axis wins only when its offset is strictly larger; ties
	    (including a zero offset) resolve to the vertical axis. ``ori`` is
	    accepted for signature compatibility but is not consulted.
	    """
	    delta_x = tx - ax
	    delta_y = ty - ay
	    if abs(delta_x) > abs(delta_y):
	        if delta_x > 0:
	            return 0
	        return 2
	    if delta_y > 0:
	        return 1
	    return 3

	# -----------------------------
	# Agents + World
	# -----------------------------
	@dataclass
	class Agent:
	    """Mutable state of one simulated agent in the arena."""

	    name: str
	    role: str
	    team: str
	    # Grid position (tile coordinates) and heading; `ori` indexes DIRS / ORI_DEG.
	    x: int
	    y: int
	    ori: int = 0
	    # svg_render draws the agent with the "dead" style when hp <= 0.
	    hp: int = 7

	    model_key: str = "balanced" # economy|balanced|premium
	    mode: str = "auto" # auto|manual (manual hooks kept)
	    brain: str = "biz" # biz|random

	    # Id of the task the agent is currently holding, if any.
	    current_task_id: Optional[str] = None
	    focus: str = "throughput" # throughput|quality|cost

	@dataclass
	class World:
	    """Complete simulation state that is advanced one step at a time by ``tick``."""

	    seed: int
	    # Current tick counter; incremented at the end of each tick.
	    step: int
	    # Tile grid indexed grid[y][x].
	    grid: List[List[int]]

	    run_id: str
	    config: SimConfig

	    # Agents keyed by name.
	    agents: Dict[str, Agent]
	    tasks: TaskSystem
	    ledger: Ledger
	    events: EventStore

	    # Set by tick when the spend guardrail stops the run.
	    done: bool = False
	    outcome: str = "running"

	    # Outage flag and the number of ticks left before it clears.
	    outage_active: bool = False
	    outage_timer_ticks: int = 0

	    # Rendering options: crosshair overlay, automatic POV selection,
	    # the agent whose POV is rendered, and the agent marked as controlled.
	    overlay: bool = True
	    auto_camera: bool = True
	    pov: str = "Planner"
	    controlled: str = "Planner"

	    # UI-friendly rolling log (not authoritative)
	    ui_events: List[str] = field(default_factory=list)

	def init_world(seed: int, run_id: str, config: SimConfig) -> World:
	    """Create a new world for ``run_id``: layout, five agents and the starting backlog.

	    One TASK_CREATED event is emitted per seeded task, followed by a single
	    RUN_STARTED event.
	    """
	    dice = rng(seed)
	    office = carve_office(seed)

	    # Four agents start near the corners and Ops starts in the middle.
	    far_col = GRID_W - 3
	    far_row = GRID_H - 3
	    roster = [
	        Agent("Planner", role="Planner", team="Ops", x=2, y=2, ori=0, model_key="premium", focus="quality"),
	        Agent("Worker1", role="Worker", team="Ops", x=far_col, y=2, ori=2, model_key="balanced", focus="throughput"),
	        Agent("Worker2", role="Worker", team="Ops", x=2, y=far_row, ori=0, model_key="balanced", focus="throughput"),
	        Agent("Reviewer", role="Reviewer", team="Ops", x=far_col, y=far_row, ori=2, model_key="premium", focus="quality"),
	        Agent("Ops", role="Ops", team="Ops", x=GRID_W // 2, y=GRID_H // 2, ori=1, model_key="economy", focus="cost"),
	    ]
	    agents = {member.name: member for member in roster}

	    tasks = TaskSystem(seed=seed)
	    ledger = Ledger()
	    store = EventStore(run_id=run_id)

	    world = World(
	        seed=seed,
	        step=0,
	        grid=office,
	        run_id=run_id,
	        config=config,
	        agents=agents,
	        tasks=tasks,
	        ledger=ledger,
	        events=store,
	        pov="Planner",
	        controlled="Planner",
	        overlay=True,
	        auto_camera=True,
	        ui_events=[f"Initialized run_id={run_id} seed={seed}"],
	    )

	    # Initial backlog. Attributes are drawn in a fixed order (type, priority,
	    # SLA, effort, value) so a seed always yields the same tasks.
	    task_types = ["SUPPORT_TICKET", "SALES_OPS", "HR_ONBOARD", "SEC_REVIEW"]
	    priorities = ["P1", "P2", "P3"]
	    for number in range(1, config.initial_tasks + 1):
	        task_type = dice.choice(task_types)
	        priority = dice.choice(priorities)
	        # a few days to a couple weeks depending on minutes_per_tick
	        sla_ticks = dice.randint(72, 360)
	        effort = dice.randint(45, 220)
	        value = float(dice.randint(50, 500))
	        created = tasks.create_task(
	            t_sim=world.step,
	            title=f"Backlog item #{number}",
	            task_type=task_type,
	            priority=priority,
	            sla_ticks=sla_ticks,
	            est_effort_min=effort,
	            value_usd=value,
	        )
	        store.emit(
	            world.step,
	            "TASK_CREATED",
	            payload={"task": created.task_id, "title": created.title, "type": created.task_type, "priority": created.priority},
	            state_obj_for_hash={"tasks": tasks.as_dict()},
	        )

	    store.emit(
	        world.step,
	        "RUN_STARTED",
	        payload={"minutes_per_tick": config.minutes_per_tick, "budget_soft": config.budget_usd_soft, "budget_hard": config.budget_usd_hard},
	    )
	    return world

	# -----------------------------
	# Business logic: simulated LLM call + tool calls
	# -----------------------------
	def simulate_llm_work(w: World, agent: Agent, task: Task) -> Dict[str, Any]:
	    """Simulate one LLM call (plus tool calls) made by ``agent`` on ``task``.

	    No real model is called; token counts, latency and cost are derived
	    from the configuration, the agent's focus and model tier, and whether
	    an outage is active.

	    Returns:
	        A dict with keys ``latency_ms``, ``tokens``, ``cost``,
	        ``tool_calls`` and ``rework_mult``.
	    """
	    cfg = w.config

	    # An outage stretches latency by a fixed factor.
	    outage_mult = 1.8 if w.outage_active else 1.0

	    # focus -> (prompt scale, completion scale, rework multiplier).
	    # Any other focus value is treated as "throughput".
	    focus_profiles = {
	        "quality": (1.15, 1.25, 0.55),
	        "cost": (0.75, 0.70, 1.25),
	    }
	    prompt_scale, completion_scale, rework_mult = focus_profiles.get(agent.focus, (0.95, 0.95, 1.00))
	    prompt = int(cfg.est_prompt_tokens_per_task * prompt_scale)
	    completion = int(cfg.est_completion_tokens_per_task * completion_scale)

	    # model tier -> (base latency in ms, rework multiplier).
	    # Any other model key is treated as "premium".
	    tier_profiles = {
	        "economy": (1400, 1.15),
	        "balanced": (1900, 0.95),
	    }
	    base_latency, tier_rework = tier_profiles.get(agent.model_key, (2600, 0.80))
	    latency_ms = int(base_latency * outage_mult)
	    rework_mult *= tier_rework

	    # Once a task has at least one recorded attempt, 60% of the prompt
	    # counts as cached.
	    cached = int(prompt * 0.60) if task.attempts >= 1 else 0

	    tokens = {
	        "prompt_tokens": prompt,
	        "completion_tokens": completion,
	        "cached_prompt_tokens": cached,
	        "reasoning_tokens": int(cfg.est_reasoning_tokens_per_task),
	    }

	    # Pricing: unknown model keys fall back to the "balanced" rate.
	    rate = DEFAULT_MODEL_RATES.get(agent.model_key, DEFAULT_MODEL_RATES["balanced"])
	    cost = cost_from_tokens(rate, tokens)

	    # Tool calls (light simulation): two for these task types, one otherwise.
	    tool_calls = 2 if task.task_type in ("SEC_REVIEW", "SUPPORT_TICKET") else 1

	    return {
	        "latency_ms": latency_ms,
	        "tokens": tokens,
	        "cost": cost,
	        "tool_calls": tool_calls,
	        "rework_mult": rework_mult,
	    }

	def place_incident_tile(w: World, r: random.Random):
	    """Turn one random EMPTY interior tile into an INCIDENT tile.

	    Up to 60 random cells are tried. On the first EMPTY one the grid is
	    updated, a UI log line is appended and an INCIDENT_SPAWNED event is
	    emitted. If none is found the world is left unchanged.
	    """
	    for _attempt in range(60):
	        col = r.randint(2, GRID_W - 3)
	        row = r.randint(2, GRID_H - 3)
	        if w.grid[row][col] != EMPTY:
	            continue
	        w.grid[row][col] = INCIDENT
	        w.ui_events.append(f"t={w.step}: INCIDENT tile spawned at ({col},{row})")
	        w.events.emit(
	            w.step,
	            "INCIDENT_SPAWNED",
	            payload={"x": col, "y": row},
	            state_obj_for_hash={"grid": "incident"},
	        )
	        return

	def sprinkle_new_work_nodes(w: World, r: random.Random, count: int = 2):
	    """Make ``count`` attempts to turn a random interior tile into a WORK node.

	    An attempt that lands on a non-EMPTY tile is simply skipped, so fewer
	    than ``count`` nodes may be added.
	    """
	    for _attempt in range(count):
	        col = r.randint(2, GRID_W - 3)
	        row = r.randint(2, GRID_H - 3)
	        cells = w.grid[row]
	        if cells[col] == EMPTY:
	            cells[col] = WORK

	def daily_injections(w: World):
	    """Inject new tasks and random events on the first tick of each simulated day.

	    Does nothing unless ``w.step`` is a multiple of the number of ticks per
	    day. Otherwise it creates the configured number of new tasks (some may
	    be urgent incidents), possibly starts an outage, and adds a couple of
	    work nodes to the map.
	    """
	    cfg = w.config

	    ticks_per_day = max(1, int((24 * 60) / cfg.minutes_per_tick))
	    if w.step % ticks_per_day != 0:
	        return

	    # The generator depends only on the world seed and the current step.
	    dice = rng(w.seed + w.step * 997)
	    routine_types = ["SUPPORT_TICKET", "SALES_OPS", "HR_ONBOARD", "SEC_REVIEW"]
	    routine_priorities = ["P1", "P2", "P3"]

	    # New tasks
	    for index in range(cfg.new_tasks_per_day):
	        urgent = dice.random() < cfg.incident_probability_per_day
	        if urgent:
	            spec = dict(
	                title="URGENT Incident: Service Degradation",
	                task_type="INCIDENT",
	                priority="P0",
	                sla_ticks=dice.randint(6, 24),
	                est_effort_min=dice.randint(90, 300),
	                value_usd=float(dice.randint(200, 2500)),
	            )
	        else:
	            spec = dict(
	                title=f"New inbound work #{w.step}-{index+1}",
	                task_type=dice.choice(routine_types),
	                priority=dice.choice(routine_priorities),
	                sla_ticks=dice.randint(72, 360),
	                est_effort_min=dice.randint(45, 220),
	                value_usd=float(dice.randint(50, 500)),
	            )
	        created = w.tasks.create_task(t_sim=w.step, **spec, urgent=urgent)
	        w.events.emit(
	            w.step,
	            "TASK_CREATED",
	            payload={"task": created.task_id, "title": created.title, "type": created.task_type, "priority": created.priority},
	            state_obj_for_hash={"task": asdict(created)},
	        )

	        if urgent:
	            place_incident_tile(w, dice)

	    # Outage event: the probability roll is only made when no outage is running.
	    if not w.outage_active:
	        if dice.random() < cfg.outage_probability_per_day:
	            w.outage_active = True
	            w.outage_timer_ticks = dice.randint(ticks_per_day // 2, ticks_per_day * 2)
	            w.ui_events.append(f"t={w.step}: OUTAGE started ({w.outage_timer_ticks} ticks)")
	            w.events.emit(w.step, "OUTAGE_STARTED", payload={"duration_ticks": w.outage_timer_ticks})

	    # Add some new work nodes for visuals
	    sprinkle_new_work_nodes(w, dice, count=2)

	# -----------------------------
	# Agent policy: Planner -> Workers -> Reviewer
	# -----------------------------
	def agent_pick_target_tile(w: World, agent: Agent) -> Tuple[int, int]:
	    """Choose the tile ``agent`` should walk toward.

	    The Planner is drawn to WORK and INCIDENT tiles, Workers to WORK tiles,
	    and Ops to RISK and INCIDENT tiles. The nearest matching interior tile
	    by Manhattan distance wins, with ties going to the first one in
	    row-major scan order. If nothing matches, the agent's own position is
	    returned.
	    """
	    wanted = set()
	    if agent.name == "Planner":
	        wanted.update((WORK, INCIDENT))
	    if agent.role == "Worker":
	        wanted.add(WORK)
	    if agent.name == "Ops":
	        wanted.update((RISK, INCIDENT))

	    here = (agent.x, agent.y)
	    candidates = [
	        (col, row)
	        for row in range(1, GRID_H - 1)
	        for col in range(1, GRID_W - 1)
	        if w.grid[row][col] in wanted
	    ]
	    if not candidates:
	        return here
	    # min() keeps the first of several equally near tiles.
	    return min(candidates, key=lambda cell: manhattan(here, cell))

	def move_agent_step(w: World, agent: Agent, tx: int, ty: int):
	    """Advance ``agent`` one tile along a shortest path toward ``(tx, ty)``.

	    The agent turns to face the tile it steps onto. Nothing happens when
	    the path search yields no step.
	    """
	    step = bfs_next_step(w.grid, (agent.x, agent.y), (tx, ty))
	    if step is not None:
	        step_x, step_y = step
	        agent.ori = face_towards(agent.ori, agent.x, agent.y, step_x, step_y)
	        agent.x, agent.y = step_x, step_y

	def maybe_start_task(w: World, agent: Agent):
	    """Assign the next available task to ``agent`` if it is free to take one.

	    An agent that already holds a task, and the agent named "Reviewer",
	    never start tasks here. Otherwise the task returned by the task
	    system's ``pick_next_task`` is marked IN_PROGRESS, its attempt counter
	    is bumped, and a TASK_STARTED event is emitted.
	    """
	    # The Reviewer only reviews finished work, and busy agents keep their task.
	    if agent.current_task_id or agent.name == "Reviewer":
	        return

	    picked = w.tasks.pick_next_task(w.step)
	    if not picked:
	        return

	    picked.status = "IN_PROGRESS"
	    picked.owner = agent.name
	    picked.started_t = w.step
	    picked.attempts += 1
	    agent.current_task_id = picked.task_id

	    w.ui_events.append(f"t={w.step}: {agent.name} started {picked.task_id} ({picked.priority}) {picked.title}")
	    w.events.emit(
	        w.step,
	        "TASK_STARTED",
	        agent_id=agent.name,
	        role=agent.role,
	        model_key=agent.model_key,
	        payload={"task": picked.task_id, "priority": picked.priority, "type": picked.task_type, "attempt": picked.attempts},
	        state_obj_for_hash={"task": asdict(picked)},
	    )

	def maybe_complete_task(w: World, agent: Agent):
	    """Run the agent's current task to an outcome if it stands on a working tile.

	    When the agent holds a task and occupies a WORK, INCIDENT or RISK tile,
	    one simulated LLM call is charged to the ledger and logged. The task
	    then becomes BLOCKED (awaiting review), REWORK or DONE, the agent is
	    freed, and the tile is consumed (WORK -> EMPTY, INCIDENT -> RISK).

	    Args:
	        w: World to mutate (tasks, ledger, events, grid, UI log).
	        agent: Agent whose current task is processed.
	    """
	    # Local import: crc32 gives a name hash that is stable across processes.
	    import zlib

	    if not agent.current_task_id:
	        return
	    tid = agent.current_task_id
	    t = w.tasks.tasks.get(tid)
	    if not t:
	        # The task no longer exists; drop the stale reference.
	        agent.current_task_id = None
	        return

	    # Work only happens on a WORK/INCIDENT/RISK tile (narrative hook)
	    tile = w.grid[agent.y][agent.x]
	    if tile not in (WORK, INCIDENT, RISK):
	        return

	    # Simulate an LLM call + tools (or replace with real calls later)
	    llm = simulate_llm_work(w, agent, t)
	    w.ledger.mark_llm_call()
	    w.ledger.add_latency(llm["latency_ms"])
	    w.ledger.add_tokens(llm["tokens"])
	    w.ledger.add_cost(llm["cost"]["usd"], agent_id=agent.name, model_key=agent.model_key)

	    for _ in range(int(llm["tool_calls"])):
	        w.ledger.mark_tool_call()

	    w.events.emit(
	        w.step,
	        "LLM_CALL",
	        agent_id=agent.name,
	        role=agent.role,
	        model_key=agent.model_key,
	        payload={"task": t.task_id, "task_type": t.task_type, "attempt": t.attempts, "focus": agent.focus, "outage": w.outage_active},
	        latency_ms=llm["latency_ms"],
	        tokens=llm["tokens"],
	        cost=llm["cost"],
	        state_obj_for_hash={"ledger": {"spend": w.ledger.spend_usd, "calls": w.ledger.llm_calls}},
	    )

	    # Rework probability: base * complexity-ish * outage * focus multiplier
	    cfg = w.config
	    base = cfg.rework_probability_base
	    complexity = 1.0 + min(2.0, (t.est_effort_min / 180.0))
	    outage_mult = 1.35 if w.outage_active else 1.0
	    p_rework = clamp(base * complexity * outage_mult * llm["rework_mult"], 0.01, 0.65)

	    # Higher-risk tasks are handed to the Reviewer instead of being
	    # resolved here.
	    needs_review = (t.task_type in ("SEC_REVIEW", "INCIDENT")) or (t.priority in ("P0", "P1"))

	    # Budget enforcement
	    w.ledger.check_budget(cfg.budget_usd_soft, cfg.budget_usd_hard)
	    if w.ledger.spend_usd >= cfg.budget_usd_hard:
	        # Budget hard stop: complete with degraded quality (rework likely)
	        p_rework = min(0.85, p_rework * 1.65)
	        w.events.emit(w.step, "BUDGET_HARD_STOP", payload={"spend_usd": w.ledger.spend_usd})

	    # Decide status. The built-in hash() of a str is salted per process, so
	    # it would make seeded runs irreproducible; crc32 of the name is stable.
	    name_hash = zlib.crc32(agent.name.encode("utf-8")) & 0xFFFFFFFF
	    r = rng(w.seed ^ (w.step * 1315423911) ^ name_hash)
	    rework = r.random() < p_rework

	    if needs_review:
	        # Mark as awaiting review (Reviewer can "confirm" next)
	        t.status = "BLOCKED"
	        t.notes["awaiting_review"] = True
	        w.ui_events.append(f"t={w.step}: {t.task_id} awaiting review")
	        w.events.emit(w.step, "TASK_BLOCKED", agent_id=agent.name, payload={"task": t.task_id, "reason": "awaiting_review"})
	    elif rework:
	        t.status = "REWORK"
	        w.ui_events.append(f"t={w.step}: {t.task_id} needs REWORK")
	        w.events.emit(w.step, "TASK_REWORK", agent_id=agent.name, payload={"task": t.task_id, "p_rework": p_rework})
	    else:
	        t.status = "DONE"
	        t.completed_t = w.step
	        w.ui_events.append(f"t={w.step}: {t.task_id} DONE ✅")
	        w.events.emit(w.step, "TASK_COMPLETED", agent_id=agent.name, payload={"task": t.task_id, "value_usd": t.value_usd})

	    # The agent is free again whatever the outcome.
	    agent.current_task_id = None

	    # Clear tile to show "work node consumed"
	    if tile == WORK:
	        w.grid[agent.y][agent.x] = EMPTY
	    elif tile == INCIDENT:
	        w.grid[agent.y][agent.x] = RISK

	def reviewer_pass(w: World, reviewer: Agent):
	    """Let the reviewer finalize one task that is blocked awaiting review.

	    Candidates are tasks with status BLOCKED and the ``awaiting_review``
	    note set. P0 tasks go first, then the earliest ``sla_due_t``. One
	    reduced-size simulated LLM call is charged to the ledger, after which
	    the task becomes REWORK or DONE.

	    Args:
	        w: World to mutate (tasks, ledger, events, UI log).
	        reviewer: Agent performing the review. It does not need to move.
	    """
	    blocked = [t for t in w.tasks.tasks.values() if t.status == "BLOCKED" and t.notes.get("awaiting_review")]
	    if not blocked:
	        return
	    blocked.sort(key=lambda t: (t.priority != "P0", t.sla_due_t))
	    t = blocked[0]

	    # Reviewer "reviews" without moving dependence (simple)
	    llm = simulate_llm_work(w, reviewer, t)
	    # A review is a smaller call than the original work: shrink tokens and latency.
	    llm["tokens"]["prompt_tokens"] = int(llm["tokens"]["prompt_tokens"] * 0.65)
	    llm["tokens"]["completion_tokens"] = int(llm["tokens"]["completion_tokens"] * 0.55)
	    llm["latency_ms"] = int(llm["latency_ms"] * 0.9)
	    # Re-price the call: the cost from simulate_llm_work was computed on the
	    # unscaled token counts and would not match the tokens recorded below.
	    rate = DEFAULT_MODEL_RATES.get(reviewer.model_key, DEFAULT_MODEL_RATES["balanced"])
	    llm["cost"] = cost_from_tokens(rate, llm["tokens"])

	    w.ledger.mark_llm_call()
	    w.ledger.add_latency(llm["latency_ms"])
	    w.ledger.add_tokens(llm["tokens"])
	    w.ledger.add_cost(llm["cost"]["usd"], agent_id=reviewer.name, model_key=reviewer.model_key)

	    w.events.emit(
	        w.step,
	        "REVIEW_PASS",
	        agent_id=reviewer.name,
	        role=reviewer.role,
	        model_key=reviewer.model_key,
	        payload={"task": t.task_id, "task_type": t.task_type},
	        latency_ms=llm["latency_ms"],
	        tokens=llm["tokens"],
	        cost=llm["cost"],
	    )

	    # Determine whether task goes to rework or done (review reduces rework heavily)
	    cfg = w.config
	    base = cfg.rework_probability_base * 0.55
	    complexity = 1.0 + min(2.0, (t.est_effort_min / 180.0))
	    outage_mult = 1.25 if w.outage_active else 1.0
	    p_rework = clamp(base * complexity * outage_mult, 0.01, 0.45)

	    r = rng(w.seed ^ (w.step * 2654435761) ^ 0xA5A5A5A5)
	    rework = r.random() < p_rework

	    # Either way the task is no longer waiting for review.
	    t.notes["awaiting_review"] = False
	    if rework:
	        t.status = "REWORK"
	        w.ui_events.append(f"t={w.step}: REVIEW → {t.task_id} REWORK")
	        w.events.emit(w.step, "TASK_REWORK", agent_id=reviewer.name, payload={"task": t.task_id, "p_rework": p_rework})
	    else:
	        t.status = "DONE"
	        t.completed_t = w.step
	        w.ui_events.append(f"t={w.step}: REVIEW → {t.task_id} DONE ✅")
	        w.events.emit(w.step, "TASK_COMPLETED", agent_id=reviewer.name, payload={"task": t.task_id, "value_usd": t.value_usd})

	# -----------------------------
	# Tick
	# -----------------------------
	def tick(w: World):
	    """Advance the simulation by one step.

	    In order: daily injections, outage countdown, movement and work for
	    every agent except the Reviewer, the reviewer pass, automatic camera
	    selection, budget alert events, the spend guardrail, and finally the
	    step counter and UI-log pruning. Does nothing once ``w.done`` is set.
	    """
	    if w.done:
	        return

	    # Daily injections
	    daily_injections(w)

	    # Outage timer
	    if w.outage_active:
	        w.outage_timer_ticks -= 1
	        if w.outage_timer_ticks <= 0:
	            w.outage_active = False
	            w.ui_events.append(f"t={w.step}: OUTAGE ended")
	            w.events.emit(w.step, "OUTAGE_ENDED", payload={})

	    # Agents move + start/complete work; the Reviewer is handled separately.
	    for name, member in w.agents.items():
	        if name == "Reviewer":
	            continue
	        goal_x, goal_y = agent_pick_target_tile(w, member)
	        move_agent_step(w, member, goal_x, goal_y)
	        maybe_start_task(w, member)
	        maybe_complete_task(w, member)

	    # Reviewer pass
	    reviewer_pass(w, w.agents["Reviewer"])

	    # Camera cuts: follow whoever holds a task or is nearest an incident.
	    if w.auto_camera:
	        incident_cells = [
	            (col, row)
	            for row in range(GRID_H)
	            for col in range(GRID_W)
	            if w.grid[row][col] == INCIDENT
	        ]

	        def interest(name: str) -> float:
	            member = w.agents[name]
	            score = 0.0
	            if member.current_task_id:
	                score += 3.0
	            if incident_cells:
	                nearest = min(manhattan((member.x, member.y), cell) for cell in incident_cells)
	                score += max(0, 12 - nearest) * 0.25
	            score += (1.2 if name == "Planner" else 0.0)
	            return score

	        # max() keeps the first of several equally interesting agents.
	        w.pov = max(w.agents, key=interest)

	    # Budget alert events
	    recent_alerts = w.ledger.alerts[-2:]
	    for message in recent_alerts:
	        if "EXCEEDED" in message:
	            w.events.emit(w.step, "BUDGET_ALERT", payload={"message": message, "spend_usd": w.ledger.spend_usd})

	    # Stop conditions (user can run "years"—don’t auto-stop unless you want)
	    # The run only stops once spend reaches 1.5x the hard budget.
	    guardrail = w.config.budget_usd_hard * 1.5
	    if w.ledger.spend_usd >= guardrail:
	        w.done = True
	        w.outcome = "stopped_budget"
	        w.events.emit(w.step, "RUN_STOPPED", payload={"reason": "spend_guardrail", "spend_usd": w.ledger.spend_usd})
	        w.ui_events.append(f"t={w.step}: RUN STOPPED (spend guardrail)")

	    w.step += 1

	    # prune UI log
	    if len(w.ui_events) > 220:
	        w.ui_events = w.ui_events[-220:]

	# -----------------------------
	# POV renderer (lightweight raycast, adapted)
	# -----------------------------
	# Three-component uint8 colours used by raycast_pov.
	# SKY is the initial fill for the whole image.
	SKY = np.array([12, 14, 26], dtype=np.uint8)
	# End points of the floor gradient drawn over the lower half of the view.
	FLOOR1 = np.array([24, 28, 54], dtype=np.uint8)
	FLOOR2 = np.array([10, 12, 22], dtype=np.uint8)
	# Two wall shades; raycast_pov picks one from its `side` flag.
	WALL1 = np.array([205, 210, 232], dtype=np.uint8)
	WALL2 = np.array([160, 168, 195], dtype=np.uint8)
	# Colours for the non-wall tiles that also stop a ray.
	GATEC = np.array([120, 220, 255], dtype=np.uint8)
	WORKC = np.array([154, 176, 255], dtype=np.uint8)
	INCC = np.array([255, 209, 122], dtype=np.uint8)
	RISKC = np.array([255, 59, 59], dtype=np.uint8)

	def within_fov(ax: int, ay: int, ori: int, tx: int, ty: int, fov_deg: float = FOV_DEG) -> bool:
	    """Tell whether ``(tx, ty)`` falls inside the view cone of an observer at ``(ax, ay)``.

	    The cone is centred on ``ORI_DEG[ori]`` and spans ``fov_deg`` degrees
	    in total. The observer's own tile always counts as visible.
	    """
	    delta_x, delta_y = tx - ax, ty - ay
	    if (delta_x, delta_y) == (0, 0):
	        return True
	    bearing = math.degrees(math.atan2(delta_y, delta_x)) % 360
	    heading = ORI_DEG[ori]
	    # Signed angular offset normalised into [-180, 180).
	    offset = (bearing - heading + 540) % 360 - 180
	    half_cone = fov_deg / 2
	    return abs(offset) <= half_cone

	def bresenham_los(grid: List[List[int]], x0: int, y0: int, x1: int, y1: int) -> bool:
	    """Check line of sight from ``(x0, y0)`` to ``(x1, y1)`` along a Bresenham line.

	    Returns ``False`` as soon as an intermediate cell is a WALL. The two
	    end points themselves are never tested.
	    """
	    span_x = abs(x1 - x0)
	    span_y = abs(y1 - y0)
	    step_x = 1 if x0 < x1 else -1
	    step_y = 1 if y0 < y1 else -1
	    error = span_x - span_y

	    origin = (x0, y0)
	    target = (x1, y1)
	    cur_x, cur_y = x0, y0
	    while True:
	        here = (cur_x, cur_y)
	        if here not in (origin, target) and grid[cur_y][cur_x] == WALL:
	            return False
	        if here == target:
	            return True
	        doubled = 2 * error
	        if doubled > -span_y:
	            error -= span_y
	            cur_x += step_x
	        if doubled < span_x:
	            error += span_x
	            cur_y += step_y

	def raycast_pov(w: World, who: str) -> np.ndarray:
	    """Render a first-person view for the agent named ``who``.

	    Returns a ``(VIEW_H, VIEW_W, 3)`` uint8 image: sky and floor gradient,
	    one ray-marched column per pixel column, rectangles for other visible
	    agents, and an optional crosshair when ``w.overlay`` is set.
	    """
	    a = w.agents[who]
	    img = np.zeros((VIEW_H, VIEW_W, 3), dtype=np.uint8)
	    img[:, :] = SKY
	    # Lower half: blend linearly from FLOOR1 at the horizon toward FLOOR2.
	    for y in range(VIEW_H // 2, VIEW_H):
	        t = (y - VIEW_H // 2) / max(1, (VIEW_H // 2))
	        col = (1 - t) * FLOOR1 + t * FLOOR2
	        img[y, :] = col.astype(np.uint8)

	    ray_cols = VIEW_W
	    half = math.radians(FOV_DEG / 2)
	    base = math.radians(ORI_DEG[a.ori])

	    for rx in range(ray_cols):
	        # cam runs from -1 (left edge) to +1 (right edge) across the view.
	        cam = (2 * rx / (ray_cols - 1)) - 1
	        ang = base + cam * half
	        sin_a = math.sin(ang)
	        cos_a = math.cos(ang)

	        # Rays start at the centre of the agent's tile.
	        ox, oy = a.x + 0.5, a.y + 0.5
	        depth = 0.0
	        hit = None
	        side = 0
	        hit_tile = None

	        # March the ray in fixed 0.06-tile increments until it hits a
	        # non-EMPTY tile, leaves the grid, or reaches MAX_DEPTH.
	        while depth < MAX_DEPTH:
	            depth += 0.06
	            tx = int(ox + cos_a * depth)
	            ty = int(oy + sin_a * depth)
	            if not in_bounds(tx, ty):
	                break
	            tile = w.grid[ty][tx]
	            if tile in (WALL, GATE, WORK, INCIDENT, RISK):
	                hit = "tile"
	                hit_tile = tile
	                # Shading flag derived from the ray direction, not from
	                # which face of the tile was struck.
	                side = 1 if abs(cos_a) > abs(sin_a) else 0
	                break

	        if hit is None:
	            continue

	        # Scale the ray length by the cosine of its offset from the view
	        # direction before computing the column height.
	        depth *= math.cos(ang - base)
	        depth = max(depth, 0.001)
	        h = int((VIEW_H * 0.92) / depth)
	        y0 = max(0, VIEW_H // 2 - h // 2)
	        y1 = min(VIEW_H - 1, VIEW_H // 2 + h // 2)

	        if hit_tile == GATE:
	            col = GATEC.copy()
	        elif hit_tile == WORK:
	            col = WORKC.copy()
	        elif hit_tile == INCIDENT:
	            col = INCC.copy()
	        elif hit_tile == RISK:
	            col = RISKC.copy()
	        else:
	            col = (WALL1.copy() if side == 0 else WALL2.copy())

	        # Darken with distance, never below 28% brightness.
	        dim = max(0.28, 1.0 - depth / MAX_DEPTH)
	        col = (col * dim).astype(np.uint8)
	        img[y0:y1, rx:rx + 1] = col

	    # agent sprites
	    # Drawn after the walls as flat rectangles, for agents that are inside
	    # the view cone and have a clear Bresenham line of sight.
	    for nm, other in w.agents.items():
	        if nm == who:
	            continue
	        if not within_fov(a.x, a.y, a.ori, other.x, other.y):
	            continue
	        if not bresenham_los(w.grid, a.x, a.y, other.x, other.y):
	            continue

	        dx = other.x - a.x
	        dy = other.y - a.y
	        ang = math.degrees(math.atan2(dy, dx)) % 360
	        facing = ORI_DEG[a.ori]
	        diff = (ang - facing + 540) % 360 - 180
	        # Map the angular offset linearly onto a screen column.
	        sx = int((diff / (FOV_DEG / 2)) * (VIEW_W / 2) + (VIEW_W / 2))
	        dist = math.sqrt(dx * dx + dy * dy)
	        size = int((VIEW_H * 0.55) / max(dist, 1.0))
	        size = clamp(size, 10, 110)

	        ymid = VIEW_H // 2
	        x0 = clamp(sx - size // 4, 0, VIEW_W - 1)
	        x1 = clamp(sx + size // 4, 0, VIEW_W - 1)
	        y0 = clamp(ymid - size // 2, 0, VIEW_H - 1)
	        y1 = clamp(ymid + size // 2, 0, VIEW_H - 1)

	        # Convert the agent's "#rrggbb" colour into a uint8 triple.
	        hexcol = AGENT_COLORS.get(nm, "#ffd17a").lstrip("#")
	        rgb = np.array([int(hexcol[i:i+2], 16) for i in (0, 2, 4)], dtype=np.uint8)
	        img[y0:y1, x0:x1] = rgb

	    if w.overlay:
	        # Crosshair: a horizontal and a vertical bar through the view centre.
	        cx, cy = VIEW_W // 2, VIEW_H // 2
	        img[cy - 1:cy + 2, cx - 16:cx + 16] = np.array([110, 210, 255], dtype=np.uint8)
	        img[cy - 16:cy + 16, cx - 1:cx + 2] = np.array([110, 210, 255], dtype=np.uint8)
	    return img

	# -----------------------------
	# SVG renderer
	# -----------------------------
	def tile_color(tile: int) -> str:
	    """Look up the SVG fill colour for a tile code; unknown codes use the EMPTY colour."""
	    palette = {
	        EMPTY: COL_EMPTY,
	        WALL: COL_WALL,
	        WORK: COL_WORK,
	        RISK: COL_RISK,
	        INCIDENT: COL_INC,
	        GATE: COL_GATE,
	    }
	    if tile in palette:
	        return palette[tile]
	    return COL_EMPTY

	def svg_render(w: World) -> str:
	    """Render the arena as an HTML snippet containing inline CSS and an SVG.

	    The output has a HUD banner (simulated day, tick, outage flag, spend
	    and call counters, overdue count), one rectangle per grid tile, grid
	    lines, and one group per agent with a heading marker and a
	    name/task badge.

	    Args:
	        w: World to draw.

	    Returns:
	        The markup as a single string.
	    """
	    # HUD headline: business clock
	    cfg = w.config
	    minutes = w.step * cfg.minutes_per_tick
	    days = minutes / (24 * 60)
	    headline = f"ZEN Orchestrator Sandbox • day={days:.2f} • tick={w.step} • outage={w.outage_active}"
	    detail = f"spend=${w.ledger.spend_usd:.4f} • llm_calls={w.ledger.llm_calls} • tool_calls={w.ledger.tool_calls} • overdue={len(w.tasks.overdue_tasks(w.step))}"

	    css = f"""
	    <style>
	    .root {{
	      background: {COL_BG};
	      border-radius: 18px;
	      overflow: hidden;
	      box-shadow: 0 18px 40px rgba(0,0,0,0.45);
	    }}
	    .hud {{
	      font-family: ui-sans-serif, system-ui, -apple-system, Segoe UI, Roboto, Arial;
	      fill: rgba(235,240,255,0.92);
	    }}
	    .hudSmall {{ fill: rgba(235,240,255,0.72); }}
	    .tile {{ shape-rendering: crispEdges; }}
	    .gridline {{ stroke: {COL_GRIDLINE}; stroke-width: 1; opacity: 0.45; }}
	    .agent {{
	      transition: transform 220ms cubic-bezier(.2,.8,.2,1);
	      filter: drop-shadow(0px 8px 10px rgba(0,0,0,0.45));
	    }}
	    .pulse {{
	      animation: pulse 1.2s ease-in-out infinite;
	      opacity: 0.22;
	    }}
	    @keyframes pulse {{
	      0% {{ transform: scale(1.0); opacity: 0.14; }}
	      50% {{ transform: scale(1.15); opacity: 0.26; }}
	      100% {{ transform: scale(1.0); opacity: 0.14; }}
	    }}
	    .badge {{
	      fill: rgba(15,23,51,0.72);
	      stroke: rgba(170,195,255,0.16);
	      stroke-width: 1;
	    }}
	    .dead {{ opacity: 0.22; filter: none; }}
	    .banner {{ fill: rgba(255,255,255,0.08); }}
	    </style>
	    """

	    svg = [f"""
	    <div class="root">
	    {css}
	    <svg width="{SVG_W}" height="{SVG_H}" viewBox="0 0 {SVG_W} {SVG_H}">
	    <rect x="0" y="0" width="{SVG_W}" height="{SVG_H}" fill="{COL_BG}"/>
	    <rect class="banner" x="0" y="0" width="{SVG_W}" height="{HUD_H}" rx="0" ry="0"/>
	    <text class="hud" x="18" y="28" font-size="16" font-weight="700">{headline}</text>
	    <text class="hud hudSmall" x="18" y="50" font-size="12">{detail}</text>
	    """]

	    # Tiles, offset downward by the HUD strip.
	    for y in range(GRID_H):
	        for x in range(GRID_W):
	            t = w.grid[y][x]
	            c = tile_color(t)
	            px = x * TILE
	            py = HUD_H + y * TILE
	            svg.append(f'<rect class="tile" x="{px}" y="{py}" width="{TILE}" height="{TILE}" fill="{c}"/>')

	    # Grid lines.
	    for x in range(GRID_W + 1):
	        px = x * TILE
	        svg.append(f'<line class="gridline" x1="{px}" y1="{HUD_H}" x2="{px}" y2="{SVG_H}"/>')
	    for y in range(GRID_H + 1):
	        py = HUD_H + y * TILE
	        svg.append(f'<line class="gridline" x1="0" y1="{py}" x2="{SVG_W}" y2="{py}"/>')

	    # Agents: each group is translated to its tile, so the coordinates
	    # inside the group are relative to the tile's top-left corner.
	    for nm, a in w.agents.items():
	        px = a.x * TILE
	        py = HUD_H + a.y * TILE
	        col = AGENT_COLORS.get(nm, "#ffd17a")
	        dead_cls = " dead" if a.hp <= 0 else ""
	        svg.append(f"""
	        <g class="agent{dead_cls}" style="transform: translate({px}px, {py}px);">
	        <circle class="pulse" cx="{TILE/2}" cy="{TILE/2}" r="{TILE*0.46}" fill="{col}"></circle>
	        <circle cx="{TILE/2}" cy="{TILE/2}" r="{TILE*0.34}" fill="{col}" opacity="0.98"></circle>
	        """)
	        # Heading marker: a short line from the tile centre along the
	        # agent's facing direction.
	        dx, dy = DIRS[a.ori]
	        x2 = TILE/2 + dx * (TILE * 0.32)
	        y2 = TILE/2 + dy * (TILE * 0.32)
	        svg.append(f'<line x1="{TILE/2}" y1="{TILE/2}" x2="{x2}" y2="{y2}" stroke="rgba(10,10,14,0.85)" stroke-width="4" stroke-linecap="round"/>')

	        # Name/task badge; its width grows with the name but is at least 64.
	        badge_w = max(64, 10 * len(nm) * 0.62)
	        svg.append(f'<rect class="badge" x="{TILE/2 - badge_w/2}" y="{TILE*0.05}" rx="10" width="{badge_w}" height="16"/>')
	        task = a.current_task_id or "-"
	        svg.append(f'<text x="{TILE/2}" y="{TILE*0.05 + 12}" text-anchor="middle" font-size="10" fill="rgba(235,240,255,0.92)" font-family="ui-sans-serif, system-ui">{nm}:{task}</text>')

	        # Extra dot marking the controlled agent.
	        if nm == w.controlled:
	            svg.append(f'<circle cx="{TILE*0.88}" cy="{TILE*0.18}" r="6" fill="rgba(110,180,255,0.95)"/>')
	        svg.append("</g>")

	    svg.append("</svg></div>")
	    return "".join(svg)