Spaces:

qpluslab
/

openra-rl

Paused

github-actions[bot]

Sync from GitHub ac82c3e

02f4a63 2 months ago

34.3 kB

	#!/usr/bin/env python3
	"""Scripted Red Alert bot that plays a full game via the OpenEnv client API.

	Exercises ALL Sprint 4+5 observation fields and action types:
	- Observations: spatial_map, visible_enemy_buildings, unit facing/stance/speed/
	attack_range/experience/passengers, building cell coords/can_produce/power/
	rally/repair/sell_value
	- Actions: all 20 types including GUARD, SET_STANCE, ENTER_TRANSPORT, UNLOAD,
	SET_RALLY_POINT, REPAIR, SELL, POWER_DOWN, SET_PRIMARY

	Usage:
	docker run -p 8000:8000 openra-rl
	python examples/scripted_bot.py --verbose
	"""

	import argparse
	import asyncio
	import base64
	import sys
	from typing import List, Optional, Tuple

	from openra_env.client import OpenRAEnv
	from openra_env.models import (
	ActionType,
	BuildingInfoModel,
	CommandModel,
	OpenRAAction,
	OpenRAObservation,
	UnitInfoModel,
	)

	# Unit stance values; these mirror the C# AutoTarget.UnitStance enum.
	(
	    STANCE_HOLD_FIRE,
	    STANCE_RETURN_FIRE,
	    STANCE_DEFEND,
	    STANCE_ATTACK_ANYTHING,
	) = range(4)

	# Display names for the stance values, keyed by the constants above.
	STANCE_NAMES = {
	    STANCE_HOLD_FIRE: "HoldFire",
	    STANCE_RETURN_FIRE: "ReturnFire",
	    STANCE_DEFEND: "Defend",
	    STANCE_ATTACK_ANYTHING: "AttackAnything",
	}


	class ScriptedBot:
	    """State-machine bot with a Red Alert build order exercising all actions.

	    ``decide`` is called once per step and runs every handler in a fixed
	    priority order. ``self.phase`` only gates MCV deployment, continuous
	    vehicle production and combat; placement, rally, power, set-primary,
	    repair, stance, guard, transport and sell handling run on every tick.

	    Phases:
	        deploy_mcv - Deploy MCV
	        build_base - Build power/barracks/refinery/war factory, set rally points
	        train_army - Train infantry + APC, guard CY, load transport
	        attack     - Attack-move toward enemy buildings, unload APC,
	                     keep producing vehicles
	    """

	    # Build order uses both faction names — bot picks whichever is available
	    BARRACKS_TYPES = {"tent", "barr"}  # Allied / Soviet
	    WAR_FACTORY_TYPES = {"weap"}
	    BUILD_PRIORITY = [
	        "powr",  # Power Plant ($300) — shared
	        "barracks",  # Placeholder: tent (Allied) or barr (Soviet)
	        "proc",  # Ore Refinery ($2000) — needed before war factory
	        "weap",  # War Factory ($2000) — shared
	        "powr",  # Second Power Plant
	    ]

	    INFANTRY_TRAIN_TARGET = 6
	    GUARD_COUNT = 2  # infantry to guard CY
	    TRANSPORT_TYPE = "apc"
	    COMBAT_UNIT_TYPES = {"e1", "e2", "e3", "e4", "1tnk", "2tnk", "3tnk", "arty", "jeep", "apc"}
	    INFANTRY_TYPES = {"e1", "e2", "e3", "e4"}
	    VEHICLE_TYPES = {"1tnk", "2tnk", "3tnk", "arty", "jeep"}

	    # Enemy building types attacked first (covers both barracks variants)
	    ENEMY_PRODUCTION_TYPES = {"fact", "tent", "barr", "weap", "hpad", "afld"}
	    # Buildings switched off first when power is negative (production stays on)
	    POWER_DOWN_PRIORITY = ["dome", "spen", "syrd", "hpad", "afld", "fix"]
	    REPAIR_HP_THRESHOLD = 0.7  # repair buildings below this hp fraction
	    SELL_HP_THRESHOLD = 0.2  # sell non-CY buildings below this hp fraction

	    def __init__(self, verbose: bool = False):
	        """Create a bot in the ``deploy_mcv`` phase.

	        Args:
	            verbose: When true, ``_log`` prints every decision.
	        """
	        self.phase = "deploy_mcv"
	        self.build_index = 0  # next BUILD_PRIORITY entry to queue
	        self.placement_count = 0  # placement attempts so far; picks the next offset
	        self.deploy_issued = False
	        self.verbose = verbose
	        self._guards_assigned: set[int] = set()  # actor IDs guarding CY
	        self._stances_set: set[int] = set()  # actor IDs with stance already set
	        self._rally_set: set[int] = set()  # building actor IDs with rally point set
	        self._apc_trained = False
	        self._apc_loaded = False
	        self._repair_issued: set[int] = set()  # building actor IDs being repaired
	        self._sold: set[int] = set()  # building actor IDs sold
	        self._powered_down: set[int] = set()  # building actor IDs powered down
	        self._primary_set: set[int] = set()  # building actor IDs set as primary

	    def decide(self, obs: OpenRAObservation) -> OpenRAAction:
	        """Given current observation, return commands for this tick.

	        Handlers run in priority order and their commands are concatenated;
	        a single NO_OP command is sent when no handler produced anything.
	        """
	        commands: List[CommandModel] = []

	        self._update_phase(obs)

	        # Priority 1: Place completed buildings
	        commands.extend(self._handle_placement(obs))

	        # Priority 2: Deploy MCV
	        if self.phase == "deploy_mcv":
	            cmd = self._handle_deploy(obs)
	            if cmd:
	                commands.append(cmd)

	        # Priority 3: Set rally points on production buildings
	        commands.extend(self._handle_rally_points(obs))

	        # Priority 4: Power management (power down buildings if power negative)
	        commands.extend(self._handle_power_management(obs))

	        # Priority 5: Set primary production buildings
	        commands.extend(self._handle_set_primary(obs))

	        # Priority 6: Repair damaged buildings
	        commands.extend(self._handle_repairs(obs))

	        # Priority 7: Queue production (buildings + units)
	        commands.extend(self._handle_production(obs))

	        # Priority 8: Set stances on new units
	        commands.extend(self._handle_stances(obs))

	        # Priority 9: Assign guards to CY
	        commands.extend(self._handle_guards(obs))

	        # Priority 10: Load infantry into APC
	        commands.extend(self._handle_transport(obs))

	        # Priority 11: Combat — attack + unload
	        commands.extend(self._handle_combat(obs))

	        # Priority 12: Sell heavily damaged buildings
	        commands.extend(self._handle_sell(obs))

	        if not commands:
	            commands.append(CommandModel(action=ActionType.NO_OP))

	        return OpenRAAction(commands=commands)

	    # ── Phase transitions ──────────────────────────────────────────

	    def _update_phase(self, obs: OpenRAObservation):
	        """Advance ``self.phase`` by at most one step per call.

	        deploy_mcv → build_base once a construction yard ("fact") exists;
	        build_base → train_army once the build order is exhausted;
	        train_army → attack once enough non-guard combat units exist.
	        ``attack`` is terminal.
	        """
	        if self.phase == "deploy_mcv":
	            if any(b.type == "fact" for b in obs.buildings):
	                self.phase = "build_base"
	                self._log("Phase → build_base")
	        elif self.phase == "build_base":
	            if self.build_index >= len(self.BUILD_PRIORITY):
	                self.phase = "train_army"
	                self._log("Phase → train_army")
	        elif self.phase == "train_army":
	            ready = sum(
	                1
	                for u in obs.units
	                if u.type in self.COMBAT_UNIT_TYPES
	                and u.actor_id not in self._guards_assigned
	            )
	            if ready >= self.INFANTRY_TRAIN_TARGET:
	                self.phase = "attack"
	                self._log(f"Phase → attack ({ready} combat units ready)")

	    # ── Deploy MCV ─────────────────────────────────────────────────

	    def _handle_deploy(self, obs: OpenRAObservation) -> Optional[CommandModel]:
	        """Return a DEPLOY command for the first MCV, at most once per game."""
	        if self.deploy_issued:
	            return None
	        mcv = next((u for u in obs.units if u.type == "mcv"), None)
	        if mcv:
	            self.deploy_issued = True
	            self._log(f"Deploying MCV (actor {mcv.actor_id}, facing={mcv.facing})")
	            return CommandModel(action=ActionType.DEPLOY, actor_id=mcv.actor_id)
	        return None

	    # ── Building placement ─────────────────────────────────────────

	    def _handle_placement(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Place every finished item in the Building queue near the CY.

	        Each attempt uses the next offset from ``_placement_offset``; the
	        attempt counter advances whether or not the placement succeeds, so a
	        rejected cell is followed by a different one on the next tick.
	        """
	        commands = []
	        cy = self._find_building(obs, "fact")
	        if not cy:
	            return commands

	        for prod in obs.production:
	            if prod.queue_type == "Building" and prod.progress >= 0.99:
	                x, y = self._placement_offset(cy)
	                self._log(f"Placing {prod.item} at cell ({x}, {y}) [attempt {self.placement_count}]")
	                commands.append(CommandModel(
	                    action=ActionType.PLACE_BUILDING,
	                    item_type=prod.item,
	                    target_x=x,
	                    target_y=y,
	                ))
	                self.placement_count += 1
	        return commands

	    def _placement_offset(self, cy: BuildingInfoModel) -> Tuple[int, int]:
	        """Calculate placement position relative to CY using cell coords.

	        Cycles through a fixed list of offsets indexed by
	        ``self.placement_count``.
	        """
	        # Use pos_x // 1024 as CenterPosition maps to cell more reliably
	        cx = cy.pos_x // 1024
	        cy_y = cy.pos_y // 1024
	        # Many offsets to maximize chance of finding valid terrain
	        offsets = [
	            (3, 0), (-3, 0), (0, 3), (0, -3),
	            (3, 3), (-3, 3), (3, -3), (-3, -3),
	            (6, 0), (-6, 0), (0, 6), (0, -6),
	            (2, 0), (-2, 0), (0, 2), (0, -2),
	            (4, 0), (-4, 0), (0, 4), (0, -4),
	        ]
	        dx, dy = offsets[self.placement_count % len(offsets)]
	        return cx + dx, cy_y + dy

	    # ── Rally points (Sprint 4 action) ─────────────────────────────

	    def _handle_rally_points(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Point each barracks / war factory rally at the CY, once per building."""
	        commands = []
	        cy = self._find_building(obs, "fact")
	        if not cy:
	            return commands

	        # Both barracks variants count, not just the Allied "tent".
	        rally_types = self.BARRACKS_TYPES | self.WAR_FACTORY_TYPES
	        # Fall back to the world position when the cell coordinate is not positive.
	        rally_x = cy.cell_x if cy.cell_x > 0 else cy.pos_x // 1024
	        rally_y = cy.cell_y if cy.cell_y > 0 else cy.pos_y // 1024

	        for b in obs.buildings:
	            if b.type in rally_types and b.actor_id not in self._rally_set:
	                self._log(f"Setting rally on {b.type} (actor {b.actor_id}) → ({rally_x}, {rally_y})")
	                commands.append(CommandModel(
	                    action=ActionType.SET_RALLY_POINT,
	                    actor_id=b.actor_id,
	                    target_x=rally_x,
	                    target_y=rally_y,
	                ))
	                self._rally_set.add(b.actor_id)
	        return commands

	    # ── Power management (Sprint 5 action) ─────────────────────────

	    def _handle_power_management(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Power down non-essential buildings when power balance is negative.

	        At most one building is powered down per tick, chosen in
	        ``POWER_DOWN_PRIORITY`` order.
	        """
	        commands = []
	        power_balance = obs.economy.power_provided - obs.economy.power_drained
	        if power_balance >= 0:
	            return commands

	        for btype in self.POWER_DOWN_PRIORITY:
	            for b in obs.buildings:
	                if b.type == btype and b.is_powered and b.actor_id not in self._powered_down:
	                    commands.append(CommandModel(action=ActionType.POWER_DOWN, actor_id=b.actor_id))
	                    self._powered_down.add(b.actor_id)
	                    self._log(f"Powering down {b.type} (actor {b.actor_id}) — power balance: {power_balance}")
	                    return commands  # one at a time
	        return commands

	    # ── Set primary building (Sprint 5 action) ───────────────────

	    def _handle_set_primary(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Set primary on newest production building of each type.

	        "Newest" is the building with the highest actor ID; nothing is done
	        while fewer than two buildings of a kind exist.
	        """
	        commands = []
	        for btype_set in (self.BARRACKS_TYPES, self.WAR_FACTORY_TYPES):
	            buildings_of_type = [b for b in obs.buildings if b.type in btype_set]
	            if len(buildings_of_type) < 2:
	                continue
	            newest = max(buildings_of_type, key=lambda b: b.actor_id)
	            if newest.actor_id not in self._primary_set:
	                commands.append(CommandModel(action=ActionType.SET_PRIMARY, actor_id=newest.actor_id))
	                self._primary_set.add(newest.actor_id)
	                self._log(f"Setting primary: {newest.type} (actor {newest.actor_id})")
	        return commands

	    # ── Repair damaged buildings (Sprint 4 observation + existing action) ──

	    def _handle_repairs(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Issue REPAIR once per damaged building while cash is at least $500.

	        Buildings that ``_handle_sell`` would sell on this tick (non-CY below
	        ``SELL_HP_THRESHOLD``) or that were already sold are skipped, so a
	        building never receives REPAIR and SELL together.
	        """
	        commands = []
	        if obs.economy.cash < 500:
	            return commands

	        for b in obs.buildings:
	            if b.hp_percent >= self.REPAIR_HP_THRESHOLD or b.is_repairing:
	                continue
	            if b.actor_id in self._repair_issued or b.actor_id in self._sold:
	                continue
	            if b.type != "fact" and b.hp_percent < self.SELL_HP_THRESHOLD:
	                continue  # about to be sold instead
	            self._log(f"Repairing {b.type} (actor {b.actor_id}, hp={b.hp_percent:.0%})")
	            commands.append(CommandModel(
	                action=ActionType.REPAIR,
	                actor_id=b.actor_id,
	            ))
	            self._repair_issued.add(b.actor_id)
	        return commands

	    # ── Production ─────────────────────────────────────────────────

	    def _handle_production(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Queue the next building, infantry and vehicle as the queues allow.

	        At most one command per queue kind (Building, Infantry, Vehicle) is
	        produced per tick.
	        """
	        commands = []

	        # Building construction — treat any Building queue item as "in progress"
	        # (includes completed-but-unplaced buildings that block the queue)
	        building_in_queue = any(p.queue_type == "Building" for p in obs.production)
	        if not building_in_queue and self.build_index < len(self.BUILD_PRIORITY):
	            item_type = self._resolve_build_item(obs, self.BUILD_PRIORITY[self.build_index])
	            # item_type is None when the placeholder can't be resolved yet: wait.
	            if item_type is not None:
	                if self._has_building_type(obs, item_type, self.build_index):
	                    self.build_index += 1
	                elif self._can_produce_item(obs, item_type):
	                    self._log(f"Building {item_type} (#{self.build_index + 1}/{len(self.BUILD_PRIORITY)})")
	                    commands.append(CommandModel(action=ActionType.BUILD, item_type=item_type))
	                    self.build_index += 1

	        # Infantry training
	        has_barracks = any(b.type in self.BARRACKS_TYPES for b in obs.buildings)
	        infantry_training = any(
	            p.queue_type == "Infantry" and p.progress < 0.99
	            for p in obs.production
	        )
	        infantry = [u for u in obs.units if u.type in self.INFANTRY_TYPES]
	        total_target = self.INFANTRY_TRAIN_TARGET + self.GUARD_COUNT

	        if has_barracks and not infantry_training and len(infantry) < total_target:
	            if self._can_produce_item(obs, "e1") and obs.economy.cash >= 100:
	                self._log(f"Training e1 ({len(infantry)}/{total_target})")
	                commands.append(CommandModel(action=ActionType.TRAIN, item_type="e1"))

	        # Vehicles from the war factory: the one-off APC takes precedence over
	        # continuous tank production so only one vehicle is queued per tick.
	        has_weap = any(b.type in self.WAR_FACTORY_TYPES for b in obs.buildings)
	        vehicle_training = any(
	            p.queue_type == "Vehicle" and p.progress < 0.99
	            for p in obs.production
	        )
	        if has_weap and not vehicle_training and obs.economy.cash >= 800:
	            if not self._apc_trained and self._can_produce_item(obs, self.TRANSPORT_TYPE):
	                self._log("Training APC for transport ops")
	                commands.append(CommandModel(action=ActionType.TRAIN, item_type=self.TRANSPORT_TYPE))
	                self._apc_trained = True
	            elif self.phase == "attack" and self._can_produce_item(obs, "1tnk"):
	                # Build light tanks if available
	                self._log("Training 1tnk (continuous production)")
	                commands.append(CommandModel(action=ActionType.TRAIN, item_type="1tnk"))

	        return commands

	    def _can_produce_item(self, obs: OpenRAObservation, item_type: str) -> bool:
	        """Check if item is buildable using per-building can_produce (Sprint 4).

	        True when the item is in the global ``available_production`` list or
	        in any own building's ``can_produce`` list.
	        """
	        if item_type in obs.available_production:
	            return True
	        return any(item_type in b.can_produce for b in obs.buildings)

	    # ── Stances (Sprint 4 action) ──────────────────────────────────

	    def _handle_stances(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Set the desired stance on combat units not yet processed.

	        Guards get Defend, everyone else AttackAnything. The stance value is
	        passed in the command's ``target_x`` field.
	        """
	        commands = []
	        for u in obs.units:
	            if u.actor_id in self._stances_set:
	                continue
	            if u.type not in self.COMBAT_UNIT_TYPES:
	                continue

	            # Guards get Defend stance, attackers get AttackAnything
	            if u.actor_id in self._guards_assigned:
	                desired = STANCE_DEFEND
	            else:
	                desired = STANCE_ATTACK_ANYTHING

	            if u.stance != desired:
	                self._log(
	                    f"Setting {u.type} (actor {u.actor_id}) stance: "
	                    f"{STANCE_NAMES.get(u.stance, '?')} → {STANCE_NAMES[desired]}"
	                )
	                commands.append(CommandModel(
	                    action=ActionType.SET_STANCE,
	                    actor_id=u.actor_id,
	                    target_x=desired,
	                ))
	            self._stances_set.add(u.actor_id)
	        return commands

	    # ── Guard CY (Sprint 4 action) ────────────────────────────────

	    def _handle_guards(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Order idle infantry to guard the CY until GUARD_COUNT are assigned."""
	        commands = []
	        if len(self._guards_assigned) >= self.GUARD_COUNT:
	            return commands

	        cy = self._find_building(obs, "fact")
	        if not cy:
	            return commands

	        # Find idle infantry not yet guarding
	        for u in obs.units:
	            if len(self._guards_assigned) >= self.GUARD_COUNT:
	                break
	            if (u.type in self.INFANTRY_TYPES
	                    and u.is_idle
	                    and u.actor_id not in self._guards_assigned):
	                self._log(
	                    f"Assigning {u.type} (actor {u.actor_id}, "
	                    f"range={u.attack_range}) to guard CY"
	                )
	                commands.append(CommandModel(
	                    action=ActionType.GUARD,
	                    actor_id=u.actor_id,
	                    target_actor_id=cy.actor_id,
	                ))
	                self._guards_assigned.add(u.actor_id)
	                # Stances are handled before guards each tick, so this unit
	                # was already marked as done with the attacker stance. Forget
	                # it so the next tick re-evaluates it and applies Defend.
	                self._stances_set.discard(u.actor_id)
	        return commands

	    # ── Transport: load/unload (Sprint 4 actions) ─────────────────

	    def _handle_transport(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Load up to four idle non-guard infantry into an empty APC, once."""
	        commands = []
	        if self._apc_loaded:
	            return commands

	        apc = next(
	            (u for u in obs.units
	             if u.type == self.TRANSPORT_TYPE and u.passenger_count == 0),
	            None,
	        )
	        if not apc:
	            return commands

	        # Load idle infantry (not guards) into the APC
	        loaded = 0
	        for u in obs.units:
	            if loaded >= 4:  # APC capacity
	                break
	            if (u.type in self.INFANTRY_TYPES
	                    and u.is_idle
	                    and u.actor_id not in self._guards_assigned):
	                self._log(
	                    f"Loading {u.type} (actor {u.actor_id}, "
	                    f"speed={u.speed}) into APC {apc.actor_id}"
	                )
	                commands.append(CommandModel(
	                    action=ActionType.ENTER_TRANSPORT,
	                    actor_id=u.actor_id,
	                    target_actor_id=apc.actor_id,
	                ))
	                loaded += 1

	        if loaded > 0:
	            self._apc_loaded = True
	        return commands

	    # ── Combat ─────────────────────────────────────────────────────

	    def _handle_combat(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """In the attack phase, unload APCs and attack-move idle fighters.

	        Fighters are only sent out when at least two of them are idle.
	        """
	        commands = []
	        if self.phase != "attack":
	            return commands

	        # Unload APC near enemy
	        commands.extend(self._handle_unload(obs))

	        # Attack-move idle fighters toward enemy
	        idle_fighters = [
	            u for u in obs.units
	            if (u.type in self.COMBAT_UNIT_TYPES
	                and u.is_idle
	                and u.actor_id not in self._guards_assigned)
	        ]
	        if len(idle_fighters) < 2:
	            return commands

	        target_x, target_y = self._find_attack_target(obs)
	        commands.extend(
	            CommandModel(
	                action=ActionType.ATTACK_MOVE,
	                actor_id=unit.actor_id,
	                target_x=target_x,
	                target_y=target_y,
	            )
	            for unit in idle_fighters
	        )
	        self._log(
	            f"Attacking with {len(idle_fighters)} units "
	            f"toward ({target_x}, {target_y})"
	        )
	        return commands

	    @staticmethod
	    def _cells_apart(a, b) -> int:
	        """Return the Manhattan distance in cells between two actors."""
	        return abs(a.cell_x - b.cell_x) + abs(a.cell_y - b.cell_y)

	    def _handle_unload(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Unload each loaded APC that is within 15 cells of an enemy.

	        Enemy units are checked before enemy buildings, and a single UNLOAD
	        is issued per APC per tick even when both are in range.
	        """
	        commands = []
	        for u in obs.units:
	            if u.type != self.TRANSPORT_TYPE or u.passenger_count <= 0:
	                continue

	            # Check if any enemy is within ~15 cells
	            if any(self._cells_apart(u, enemy) < 15 for enemy in obs.visible_enemies):
	                self._log(
	                    f"Unloading APC (actor {u.actor_id}, "
	                    f"{u.passenger_count} passengers) near enemy"
	                )
	            else:
	                # Also unload near enemy buildings
	                eb = next(
	                    (b for b in obs.visible_enemy_buildings
	                     if self._cells_apart(u, b) < 15),
	                    None,
	                )
	                if eb is None:
	                    continue
	                self._log(
	                    f"Unloading APC near enemy building {eb.type} "
	                    f"(hp={eb.hp_percent:.0%})"
	                )
	            commands.append(CommandModel(
	                action=ActionType.UNLOAD,
	                actor_id=u.actor_id,
	            ))
	        return commands

	    def _find_attack_target(self, obs: OpenRAObservation) -> Tuple[int, int]:
	        """Prioritize enemy buildings > enemy units > map center.

	        Returns:
	            Target cell ``(x, y)``; ``(64, 64)`` when the map width is not
	            positive and nothing is visible.
	        """
	        # Priority 1: visible enemy buildings (Sprint 4 field)
	        if obs.visible_enemy_buildings:
	            # Prefer production buildings
	            target = next(
	                (b for b in obs.visible_enemy_buildings
	                 if b.type in self.ENEMY_PRODUCTION_TYPES),
	                obs.visible_enemy_buildings[0],
	            )
	            return target.cell_x, target.cell_y

	        # Priority 2: visible enemy units
	        if obs.visible_enemies:
	            enemy = obs.visible_enemies[0]
	            return enemy.cell_x, enemy.cell_y

	        # Fallback: map center
	        if obs.map_info.width > 0:
	            return obs.map_info.width // 2, obs.map_info.height // 2
	        return 64, 64

	    # ── Sell heavily damaged buildings ─────────────────────────────

	    def _handle_sell(self, obs: OpenRAObservation) -> List[CommandModel]:
	        """Sell each non-CY building below ``SELL_HP_THRESHOLD``, once."""
	        commands = []
	        for b in obs.buildings:
	            if (b.hp_percent < self.SELL_HP_THRESHOLD
	                    and b.type != "fact"  # never sell CY
	                    and b.actor_id not in self._sold):
	                self._log(
	                    f"Selling {b.type} (actor {b.actor_id}, hp={b.hp_percent:.0%}, "
	                    f"refund=${b.sell_value})"
	                )
	                commands.append(CommandModel(
	                    action=ActionType.SELL,
	                    actor_id=b.actor_id,
	                ))
	                self._sold.add(b.actor_id)
	        return commands

	    # ── Helpers ────────────────────────────────────────────────────

	    def _resolve_build_item(self, obs: OpenRAObservation, placeholder: str) -> Optional[str]:
	        """Resolve faction-agnostic build item to actual producible type.

	        Returns:
	            The producible barracks type for the "barracks" placeholder
	            (``None`` if neither is producible yet); any other name unchanged.
	        """
	        if placeholder != "barracks":
	            return placeholder
	        # Sorted so the choice does not depend on set iteration order.
	        for btype in sorted(self.BARRACKS_TYPES):
	            if self._can_produce_item(obs, btype):
	                return btype
	        return None

	    def _has_building_type(self, obs: OpenRAObservation, item_type: str, build_index: int) -> bool:
	        """Check if we already have enough of this building type.

	        "Enough" is the number of times ``item_type`` appears in
	        ``BUILD_PRIORITY`` up to and including ``build_index``, where the
	        "barracks" placeholder counts as either barracks type.
	        """
	        already_built = sum(1 for b in obs.buildings if b.type == item_type)
	        is_barracks = item_type in self.BARRACKS_TYPES
	        target_count = sum(
	            1
	            for entry in self.BUILD_PRIORITY[:build_index + 1]
	            if entry == item_type or (entry == "barracks" and is_barracks)
	        )
	        return already_built >= target_count

	    def _find_building(self, obs: OpenRAObservation, btype: str) -> Optional[BuildingInfoModel]:
	        """Return the first own building of type ``btype``, or ``None``."""
	        return next((b for b in obs.buildings if b.type == btype), None)

	    def _log(self, msg: str):
	        """Print ``msg`` with a bot prefix when verbose mode is on."""
	        if self.verbose:
	            print(f" [Bot] {msg}")


	# ── Status display ─────────────────────────────────────────────────


	def print_status(step: int, obs: OpenRAObservation, bot: ScriptedBot):
	    """Print a one-line status summary for ``step``.

	    The line shows the game tick, cash, power balance, own unit counts,
	    visible enemy counts, the distinct own building types (sorted, or
	    "none") and the bot's current phase, separated by " | ".

	    Args:
	        step: Step counter shown at the start of the line.
	        obs: Observation to summarise.
	        bot: Bot whose ``COMBAT_UNIT_TYPES`` and ``phase`` are reported.
	    """
	    combat_count = sum(1 for u in obs.units if u.type in bot.COMBAT_UNIT_TYPES)
	    buildings = ", ".join(sorted({b.type for b in obs.buildings})) or "none"
	    power_balance = obs.economy.power_provided - obs.economy.power_drained

	    # Count enemy intel
	    enemy_units = len(obs.visible_enemies)
	    enemy_buildings = len(obs.visible_enemy_buildings)

	    # Plain "|" separators: "\|" is not a valid Python escape sequence and
	    # would print a literal backslash before every separator.
	    print(
	        f"Step {step:4d} | Tick {obs.tick:5d} | "
	        f"${obs.economy.cash:5d} | Pwr:{power_balance:+d} | "
	        f"Units:{len(obs.units)} (combat:{combat_count}) | "
	        f"Enemy:{enemy_units}u/{enemy_buildings}b | "
	        f"Bldgs:[{buildings}] | {bot.phase}"
	    )


	def print_detailed_status(obs: OpenRAObservation):
	    """Dump the observation to stdout, one section at a time.

	    Sections, in order: spatial map, economy, production queue, available
	    production, own buildings, own units (first 10), visible enemy units
	    (first 5) and visible enemy buildings (first 5). The two enemy sections
	    are omitted when their lists are empty.
	    """

	    def suffix(notes):
	        # Render optional per-actor notes as " (a, b, ...)", or nothing at all.
	        return f" ({', '.join(notes)})" if notes else ""

	    print("\n── Detailed Observation ──")

	    # Spatial map: compare the decoded payload size with the size implied
	    # by the map dimensions.
	    if not (obs.spatial_channels > 0 and obs.spatial_map):
	        print(" Spatial: not populated")
	    else:
	        payload = base64.b64decode(obs.spatial_map)
	        width = obs.map_info.width
	        height = obs.map_info.height
	        # 4 bytes per cell per channel
	        expected = width * height * obs.spatial_channels * 4
	        print(
	            f" Spatial: {width}x{height} map, {obs.spatial_channels} channels, "
	            f"{len(payload)} bytes (expected {expected})"
	        )

	    # Economy
	    eco = obs.economy
	    surplus = eco.power_provided - eco.power_drained
	    print(
	        f" Economy: ${eco.cash} cash, {eco.ore} ore, "
	        f"power {eco.power_provided}/{eco.power_drained} "
	        f"({surplus:+d}), "
	        f"{eco.harvester_count} harvesters"
	    )

	    # Production queue
	    queue = obs.production
	    if queue:
	        print(f" Production queue ({len(queue)}):")
	        for entry in queue:
	            print(f" {entry.queue_type}: {entry.item} @ {entry.progress:.0%} (paused={entry.paused})")
	    available = obs.available_production
	    if not available:
	        print(" Available production: (none)")
	    else:
	        print(f" Available production: {', '.join(available[:15])}")

	    # Own buildings with Sprint 4 fields
	    print(f" Buildings ({len(obs.buildings)}):")
	    for bld in obs.buildings:
	        notes = []
	        if bld.power_amount != 0:
	            notes.append(f"pwr={bld.power_amount:+d}")
	        if bld.is_producing:
	            notes.append(f"producing={bld.producing_item}@{bld.production_progress:.0%}")
	        if bld.is_repairing:
	            notes.append("REPAIRING")
	        if bld.rally_x >= 0:
	            notes.append(f"rally=({bld.rally_x},{bld.rally_y})")
	        if bld.can_produce:
	            # Show at most five producible items, marking truncation.
	            shown = ",".join(bld.can_produce[:5])
	            more = "..." if len(bld.can_produce) > 5 else ""
	            notes.append(f"can_produce=[{shown}{more}]")
	        print(
	            f" {bld.type:6s} #{bld.actor_id:4d} "
	            f"cell=({bld.cell_x},{bld.cell_y}) "
	            f"hp={bld.hp_percent:.0%} "
	            f"sell=${bld.sell_value}{suffix(notes)}"
	        )

	    # Own units with Sprint 4 fields
	    unit_total = len(obs.units)
	    print(f" Units ({unit_total}):")
	    for unit in obs.units[:10]:  # cap at 10 for readability
	        stance_label = STANCE_NAMES.get(unit.stance, f"?{unit.stance}")
	        notes = []
	        if unit.experience_level > 0:
	            notes.append(f"vet={unit.experience_level}")
	        if unit.passenger_count >= 0:
	            notes.append(f"cargo={unit.passenger_count}")
	        activity = "IDLE" if unit.is_idle else unit.current_activity
	        print(
	            f" {unit.type:6s} #{unit.actor_id:4d} "
	            f"cell=({unit.cell_x},{unit.cell_y}) "
	            f"hp={unit.hp_percent:.0%} "
	            f"face={unit.facing:4d} spd={unit.speed:3d} "
	            f"rng={unit.attack_range:5d} "
	            f"stance={stance_label} "
	            f"{activity}{suffix(notes)}"
	        )
	    if unit_total > 10:
	        print(f" ... and {unit_total - 10} more")

	    # Visible enemies
	    foes = obs.visible_enemies
	    if foes:
	        print(f" Visible enemy units ({len(foes)}):")
	        for foe in foes[:5]:
	            print(
	                f" {foe.type:6s} #{foe.actor_id:4d} "
	                f"cell=({foe.cell_x},{foe.cell_y}) hp={foe.hp_percent:.0%} "
	                f"spd={foe.speed} rng={foe.attack_range}"
	            )

	    # Visible enemy buildings (Sprint 4 field)
	    foe_buildings = obs.visible_enemy_buildings
	    if foe_buildings:
	        print(f" Visible enemy buildings ({len(foe_buildings)}):")
	        for target in foe_buildings[:5]:
	            print(
	                f" {target.type:6s} #{target.actor_id:4d} "
	                f"cell=({target.cell_x},{target.cell_y}) hp={target.hp_percent:.0%} "
	                f"pwr={target.power_amount:+d}"
	            )


	# ── Main loop ──────────────────────────────────────────────────────


	async def run_bot(url: str, max_steps: int, verbose: bool):
	    """Connect to the OpenRA-RL server and play one full game.

	    Args:
	        url: Base URL handed to ``OpenRAEnv``.
	        max_steps: Upper bound on the number of environment steps.
	        verbose: Enables the bot's decision log and the detailed
	            observation dumps (initial, milestone steps, final).
	    """
	    print(f"Connecting to {url}...")
	    bot = ScriptedBot(verbose=verbose)
	    # Steps at which a full observation dump is printed in verbose mode.
	    dump_steps = (50, 200, 500, 1000)

	    async with OpenRAEnv(base_url=url, message_timeout_s=300.0) as env:
	        print("Resetting environment...")
	        result = await env.reset()
	        obs = result.observation
	        print(f"Game started! Map: {obs.map_info.map_name} ({obs.map_info.width}x{obs.map_info.height})")

	        # Print initial detailed status
	        if verbose:
	            print_detailed_status(obs)

	        print_status(0, obs, bot)

	        total_reward = 0.0
	        step = 0
	        while not result.done and step < max_steps:
	            result = await env.step(bot.decide(result.observation))
	            step += 1
	            # A missing (falsy) reward counts as zero.
	            total_reward += result.reward or 0.0
	            obs = result.observation

	            if step % 100 == 0:
	                print_status(step, obs, bot)

	            # Detailed dump at key milestones
	            if verbose and step in dump_steps:
	                print_detailed_status(obs)

	        # Final report
	        banner = "=" * 70
	        print()
	        print(banner)
	        obs = result.observation
	        if not obs.done:
	            print(f"Reached max steps ({max_steps}) at tick {obs.tick}")
	        else:
	            print(f"GAME OVER: {obs.result.upper()} after {step} steps (tick {obs.tick})")

	        economy = obs.economy
	        military = obs.military
	        print(f"Total reward: {total_reward:.3f}")
	        print(f"Final cash: ${economy.cash}")
	        print(f"Power balance: {economy.power_provided - economy.power_drained:+d}")
	        print(f"Units killed: {military.units_killed}")
	        print(f"Units lost: {military.units_lost}")
	        print(f"Buildings killed: {military.buildings_killed}")
	        print(f"Buildings lost: {military.buildings_lost}")
	        print(f"Army value: ${military.army_value}")
	        print(f"Own buildings: {len(obs.buildings)}")
	        print(f"Visible enemies: {len(obs.visible_enemies)} units, {len(obs.visible_enemy_buildings)} buildings")

	        # Spatial map stats
	        if not (obs.spatial_channels > 0 and obs.spatial_map):
	            print("Spatial map: not populated")
	        else:
	            payload = base64.b64decode(obs.spatial_map)
	            # The payload is counted in 4-byte values.
	            n_floats = len(payload) // 4
	            print(f"Spatial map: {n_floats} floats ({obs.spatial_channels} channels)")

	        # Show veteran units
	        veteran_labels = [
	            f"{u.type}#{u.actor_id}(lvl{u.experience_level})"
	            for u in obs.units
	            if u.experience_level > 0
	        ]
	        if veteran_labels:
	            print(f"Veterans: {', '.join(veteran_labels)}")

	        if verbose:
	            print_detailed_status(obs)

	        print(banner)


	def main():
	    """Parse the command line and run one game.

	    Exits with status 0 when interrupted by the user and status 1 when the
	    connection to the server is refused.
	    """
	    cli = argparse.ArgumentParser(description="Scripted Red Alert bot via OpenEnv")
	    cli.add_argument(
	        "--url",
	        default="http://localhost:8000",
	        help="OpenRA-RL server URL (default: http://localhost:8000)",
	    )
	    cli.add_argument(
	        "--max-steps",
	        type=int,
	        default=5000,
	        help="Maximum steps before stopping (default: 5000)",
	    )
	    cli.add_argument(
	        "--verbose",
	        action="store_true",
	        help="Print detailed bot decisions and observation dumps",
	    )
	    opts = cli.parse_args()

	    game = run_bot(opts.url, opts.max_steps, opts.verbose)
	    try:
	        asyncio.run(game)
	    except KeyboardInterrupt:
	        print("\nInterrupted by user")
	        sys.exit(0)
	    except ConnectionRefusedError:
	        print(f"\nCould not connect to {opts.url}")
	        print("Is the OpenRA-RL server running?")
	        print(" docker run -p 8000:8000 openra-rl")
	        sys.exit(1)


	# Run the command-line entry point only when executed as a script,
	# not when this module is imported.
	if __name__ == "__main__":
	    main()