Spaces:

qpluslab
/

OpenRA-Bench

Running

App Files Files Community

OpenRA-Bench / tools /gen_catalog.py

yxc20098

Research-grounded 200-level scenario catalog (12 categories) + integ

aa7cb95 about 2 months ago

Raw

History Blame Contribute Delete

11.3 kB

	#!/usr/bin/env python3
	"""Generate the research-grounded 200-level scenario catalog.

	Procedurally parameterized per the anti-memorization rule (Procgen /
	SMACv2): each pack in a category varies coords/thresholds/decoys, and
	each pack's 3 levels form a monotone difficulty ladder where the
	decision gets harder (less info, more decoys, tighter clock,
	committed budget, attrition cap) — never just bigger raw numbers.

	Win-conditions use ONLY predicates in win_conditions.py; all packs run
	on rush-hour-arena (the only Rust-loadable map until S10). Output: flat
	`cat-<code>-NN.yaml` files in packs/, auto-covered by the parametrized
	engine-run gate. See SCENARIO_CATALOG.md.

	Run: python tools/gen_catalog.py (writes packs, prints a summary)
	"""

	from __future__ import annotations

	import pathlib

	import yaml

	PACKS = pathlib.Path(__file__).resolve().parent.parent / "openra_bench" / "scenarios" / "packs"

	# Capability tag (taxonomy) -> schema capability literal.
	CAP = {"perception": "perception", "reasoning": "reasoning", "action": "action"}

	AG = {"agent": {"faction": "allies"}}
	EN = {"enemy": {"faction": "soviet"}}


	def jeep(n, x, y):
	return {"type": "jeep", "owner": "agent", "position": [x, y], "count": n}


	def squad(x, y):
	return [
	{"type": "2tnk", "owner": "agent", "position": [x, y], "count": 2},
	{"type": "e1", "owner": "agent", "position": [x + 1, y + 2], "count": 3},
	]


	def enemy(t, x, y, n=1):
	return {"type": t, "owner": "enemy", "position": [x, y], "count": n, "stance": 2}


	def econ_base(cash, tent=False):
	actors = [
	{"type": "fact", "owner": "agent", "position": [10, 18]},
	{"type": "powr", "owner": "agent", "position": [14, 18]},
	{"type": "jeep", "owner": "agent", "position": [8, 16]},
	enemy("e1", 114, 34),
	]
	if tent:
	actors.insert(2, {"type": "tent", "owner": "agent", "position": [12, 21]})
	return {
	"agent": AG["agent"], "enemy": EN["enemy"],
	"tools": ["build", "place_building", "move_units", "deploy", "stop"],
	"planning": True, "termination": {"max_ticks": 40000},
	"actors": actors,
	}, cash


	def scout_base():
	return {
	"agent": AG["agent"], "enemy": EN["enemy"],
	"tools": ["move_units", "attack_unit", "stop"],
	"planning": True, "termination": {"max_ticks": 30000},
	"actors": [jeep(2, 6, 6), {"type": "e1", "owner": "agent",
	"position": [7, 8], "count": 2}],
	}


	def combat_base(decoys=0):
	a = squad(8, 18) + [enemy("e1", 100, 20, 2), enemy("e3", 104, 24)]
	for d in range(decoys):
	a.append(enemy("e1", 40 + d * 8, 10, 1))
	return {
	"agent": AG["agent"], "enemy": EN["enemy"],
	"tools": ["move_units", "attack_unit", "attack_move", "stop"],
	"planning": True, "termination": {"max_ticks": 30000},
	"actors": a,
	}


	# Per category: (code, title, cap, robo, meaning, n_packs, base_fn, win_fn)
	# win_fn(p, lvl) -> dict ; lvl in 0(easy)/1(med)/2(hard); p = pack index.
	def L(*xs):
	return {"all_of": list(xs)}


	CATS = [
	("c1", "Frontier Scouting", "perception",
	"UAV/UGV frontier selection: choose which unknown region to commit a "
	"time-limited searcher to.",
	"Pathfinding is solved; deciding WHICH unexplored region to commit to "
	"under partial information and a deadline is the real search problem.",
	6, lambda p: scout_base(),
	lambda p, l: L({"explored_pct_gte": 38 + l * 9 + p},
	*([{"units_lost_lte": 0}] if l == 2 else []),
	{"within_ticks": 16000 - l * 3500 - p * 200})),
	("c2", "Threat Enumeration", "perception",
	"Scene state-estimation under fog and decoys before committing force.",
	"Estimating hidden adversary state from partial sightings before "
	"acting — perception under occlusion and distractors.",
	6, lambda p: combat_base(decoys=2),
	lambda p, l: L({"enemies_discovered_gte": 2 + l},
	{"units_lost_lte": 1 if l < 2 else 0},
	{"within_ticks": 14000 - l * 3000 - p * 150})),
	("c3", "Tech Critical Path", "reasoning",
	"Task-graph scheduling with prerequisites under a makespan.",
	"Precondition-ordered construction (B needs A) to hit a capability "
	"deadline — topological planning under a cost+time budget.",
	6, lambda p: econ_base(6000, tent=False),
	lambda p, l: L({"has_building": "tent"},
	{"building_total_gte": 4 + l},
	{"power_surplus_gte": 0},
	{"within_ticks": 22000 - l * 5000 - p * 300})),
	("c4", "Power-Budget Online", "reasoning",
	"Keeping an online resource (power) non-negative while expanding.",
	"Sequencing subsystem bring-up so a shared online resource never goes "
	"negative — constraint-respecting schedule.",
	5, lambda p: econ_base(5000, tent=False),
	lambda p, l: L({"power_surplus_gte": 0},
	{"building_total_gte": 4 + l},
	{"within_ticks": 20000 - l * 4500 - p * 250})),
	("c5", "Budget Allocation (spend)", "reasoning",
	"Indivisible-budget allocation: wide vs deep, splitting clears nothing.",
	"Allocating a finite budget across competing investments where a "
	"half-measure on both fails — resource-allocation under a hard cap.",
	6, lambda p: econ_base(2200 - p * 120, tent=True),
	lambda p, l: L({"building_count_gte": {"type": "powr", "n": 2}},
	{"building_total_gte": 5 + l},
	{"within_ticks": 20000 - l * 4500})),
	("c6", "Time-Boxed Capital Deploy", "reasoning",
	"Convert a budget into fielded force AND standing infra before a clock.",
	"Provisioning under an energy/money budget and a mission deadline — "
	"how much to commit and when.",
	6, lambda p: econ_base(2000 - p * 100, tent=True),
	lambda p, l: L({"own_units_gte": 4 + l},
	{"building_total_gte": 4 + l},
	*([{"units_lost_lte": 0}] if l == 2 else []),
	{"within_ticks": 16000 - l * 3500})),
	("c7", "Defensive-Direction Commit", "perception",
	"Place limited defenses toward the most likely approach under "
	"directional uncertainty.",
	"Committing scarce defensive assets to an inferred threat axis — "
	"spatial decision under directional ambiguity.",
	6, lambda p: econ_base(5000, tent=True),
	lambda p, l: L({"building_in_region": {"type": "pbox", "x": 40 + p * 5,
	"y": 20, "radius": 9 - l,
	"count": 2 + (l == 2)}},
	{"within_ticks": 24000 - l * 5000})),
	("c8", "Base-Placement & Staging", "perception",
	"Found a base in a designated region, then stage toward a threat axis.",
	"Choosing a base site that satisfies spatial constraints, then "
	"pre-positioning — facility-layout + staging.",
	5, lambda p: econ_base(4000, tent=False),
	lambda p, l: L({"building_in_region": {"type": "powr", "x": 30 + p * 4,
	"y": 18, "radius": 10 - l * 2,
	"count": 1}},
	{"building_total_gte": 3 + l},
	{"within_ticks": 22000 - l * 5000})),
	("c9", "Commit-vs-Retreat", "reasoning",
	"Engage vs hold under partial info with an attrition cap.",
	"The core risk call: commit force on visible info vs wait for more — "
	"decision under uncertainty with a loss budget.",
	6, lambda p: combat_base(decoys=1 + p % 3),
	lambda p, l: L({"units_killed_gte": 2 + l},
	{"units_lost_lte": 3 - l},
	{"within_ticks": 14000 - l * 3000})),
	("c10", "Force Coordination", "action",
	"Drive split groups to converge simultaneously and survive.",
	"Coordinated multi-robot rendezvous: steer separated teams to a "
	"common staging point on time.",
	6, lambda p: {
	"agent": AG["agent"], "enemy": EN["enemy"],
	"tools": ["move_units", "attack_unit", "stop"], "planning": True,
	"termination": {"max_ticks": 30000},
	"actors": [jeep(2, 6, 6), jeep(2, 6, 34),
	{"type": "e1", "owner": "enemy", "position": [110, 20],
	"count": 2, "stance": 2}],
	},
	lambda p, l: L({"all_units_in_region": {"x": 55 + p * 3, "y": 20,
	"radius": 7 - l}},
	{"units_lost_lte": 1 if l < 2 else 0},
	{"within_ticks": 13000 - l * 3000})),
	("c11", "Tempo / Timing Window", "reasoning",
	"Strike inside a window that opens late and closes — not earliest, "
	"not biggest.",
	"Acting only inside a valid time window (takt-time): too early or too "
	"late both fail.",
	5, lambda p: combat_base(decoys=1),
	lambda p, l: L({"after_ticks": 1500 + l * 800},
	{"units_killed_gte": 2 + l},
	{"within_ticks": 12000 - l * 2500})),
	("c12", "Error Recovery / Replan", "reasoning",
	"After a setback, rebuild/repair and re-establish capability under a "
	"hard clock.",
	"Detecting plan failure and repairing it under reduced means and a "
	"deadline — receding-horizon replanning.",
	5, lambda p: econ_base(3000, tent=True),
	lambda p, l: L({"has_building": "tent"},
	{"building_total_gte": 4 + l},
	{"after_ticks": 1200},
	{"within_ticks": 22000 - l * 5000})),
	]

	LEVELS = ("easy", "medium", "hard")


	def build():
	n_packs = n_levels = 0
	for code, title, cap, robo, meaning, npk, base_fn, win_fn in CATS:
	for p in range(npk):
	b = base_fn(p)
	base, cash = (b if isinstance(b, tuple) else (b, None))
	levels = {}
	for li, lv in enumerate(LEVELS):
	levels[lv] = {
	"description": f"{title}: {lv} — the decision is harder "
	f"(less info / tighter clock / committed choice).",
	"win_condition": win_fn(p, li),
	"max_turns": 45 + li * 8,
	}
	if li == 2:
	levels[lv]["fail_condition"] = {"units_lost_lte": -1}
	pack = {
	"meta": {
	"id": f"cat-{code}-{p:02d}",
	"title": f"{title} #{p + 1}",
	"capability": CAP[cap],
	"real_world_meaning": meaning,
	"robotics_analogue": robo,
	"author": "catalog-generator",
	},
	"base_map": "rush-hour-arena",
	"base": base,
	"levels": levels,
	}
	if cash is not None:
	pack["starting_cash"] = cash
	(PACKS / f"cat-{code}-{p:02d}.yaml").write_text(
	yaml.safe_dump(pack, sort_keys=False, default_flow_style=False)
	)
	n_packs += 1
	n_levels += 3
	print(f"generated {n_packs} packs / {n_levels} levels across {len(CATS)} categories")
	return n_packs, n_levels


	if __name__ == "__main__":
	build()