Spaces:

Mephisto2412
/

datacenter-env

Sleeping

App Files Files Community

datacenter-env / server /agents /scripted_teams.py

Mephisto2412

fresh start

09ecf23 12 days ago

raw

history blame contribute delete

16.1 kB

	"""
	Scripted team generators for ClusterEnv.

	CooperativeTeam (team_a):
	Honest declarations — stated values always match true values.
	In high-carbon windows, voluntarily withholds carbon-flexible jobs so the
	scheduler can defer them to greener windows without a missed-deadline penalty.
	Archetype selection is weighted by deadline urgency: jobs due sooner are
	submitted preferentially.

	StrategicTeam (team_b):
	Always inflates stated_priority (HIGH or CRITICAL regardless of true value).
	Always states "urgent" regardless of true_deadline_window.
	Hides carbon flexibility 60% of the time (stated_carbon_flexible=False when true=True).
	Ignores carbon signal — submits regardless of grid intensity.

	Interface (both classes):
	generate_window_requests(window_idx, carbon_intensity, rng) -> list[JobRequest]
	window_idx : int in [0, 7]
	carbon_intensity: "low" | "medium" | "high" | "critical"
	rng : numpy.random.Generator (seeded by ClusterEnvironment per episode)

	Gate (end of hour 3):
	team_b.generate_window_requests(window_idx=3, carbon_intensity="high", rng=rng)
	→ >70% of returned JobRequests have is_gaming_priority() == True.
	All 8 Team B archetypes have stated_priority > true_priority → gate passes at 100%.
	"""

	from __future__ import annotations

	from typing import NamedTuple

	import numpy as np

	from server.economic import JobRequest


	# ── Archetype definitions ─────────────────────────────────────────────────────


	# Immutable job template used for the Team A table (_TEAM_A_ARCHETYPES).
	# CooperativeTeam copies the true_* fields into both the true_* and stated_*
	# fields of the JobRequest it builds, so no separate "stated" fields exist here.
	class _Archetype(NamedTuple):
	# Workload category label, e.g. "training", "batch", "evaluation".
	job_type: str
	# Free-text description passed through unchanged to the request.
	job_description: str
	# Estimated power draw — presumably kilowatts, going by the name; confirm against JobRequest.
	estimated_kw: float
	# Estimated run time in hours.
	estimated_duration_hours: float
	# Real priority label; the tables in this file use "LOW", "MEDIUM" and "HIGH".
	true_priority: str
	true_deadline_window: int # hard deadline index [0–7]
	# True when the job can genuinely be shifted to a lower-carbon window.
	true_carbon_flexible: bool


	# Immutable job template used for the Team B table (_TEAM_B_ARCHETYPES).
	# Carries the same seven fields as _Archetype, in the same order, plus the
	# inflated priority that StrategicTeam reports instead of the true one.
	class _TeamBArchetype(NamedTuple):
	# Workload category label, e.g. "training", "inference", "batch".
	job_type: str
	# Free-text description passed through unchanged to the request.
	job_description: str
	# Estimated power draw — presumably kilowatts, going by the name; confirm against JobRequest.
	estimated_kw: float
	# Estimated run time in hours.
	estimated_duration_hours: float
	# Real priority label ("LOW", "MEDIUM" or "HIGH" in the current table).
	true_priority: str
	# Real hard-deadline window index; StrategicTeam uses it only to drop expired archetypes.
	true_deadline_window: int
	# True when the job can genuinely be shifted to a lower-carbon window.
	true_carbon_flexible: bool
	stated_priority: str # always HIGH or CRITICAL — hardcoded per archetype
	# stated_deadline is always "urgent" for all Team B jobs — no per-archetype field needed


	# ── Team A — 8 archetypes (cooperative, honest) ───────────────────────────────

	# Job templates that CooperativeTeam samples from.
	# true_deadline_window ranges from 3 to 7, so at least one archetype passes the
	# deadline filter for every window_idx up to 7.
	# Only two entries are NOT carbon-flexible (the evaluation job, deadline 4, and
	# the inference benchmark, deadline 3). In high-carbon windows these are the only
	# ones CooperativeTeam submits while still open; once both have expired the
	# carbon filter leaves nothing and the team falls back to the flexible entries.
	_TEAM_A_ARCHETYPES: tuple[_Archetype, ...] = (
	_Archetype(
	job_type="training",
	job_description=(
	"ResNet-50 pretraining on ImageNet subset; "
	"checkpointing every 30 min, can run during any low-carbon window"
	),
	estimated_kw=280.0,
	estimated_duration_hours=6.0,
	true_priority="LOW",
	true_deadline_window=6,
	true_carbon_flexible=True,
	),
	_Archetype(
	job_type="batch",
	job_description=(
	"Weekly ETL pipeline: raw log ingestion, deduplication, "
	"feature store write — no hard wall-clock deadline"
	),
	estimated_kw=90.0,
	estimated_duration_hours=3.0,
	true_priority="LOW",
	true_deadline_window=7,
	true_carbon_flexible=True,
	),
	_Archetype(
	job_type="training",
	job_description=(
	"Hyperparameter sweep: 48 Optuna trials on sentiment classifier — "
	"results needed before end of shift, happy to shift to low-carbon slot"
	),
	estimated_kw=180.0,
	estimated_duration_hours=4.0,
	true_priority="MEDIUM",
	true_deadline_window=5,
	true_carbon_flexible=True,
	),
	_Archetype(
	job_type="batch",
	job_description=(
	"Dataset preprocessing: tokenisation and sharding for next week's "
	"training run — highly deferrable, no urgency"
	),
	estimated_kw=60.0,
	estimated_duration_hours=2.0,
	true_priority="LOW",
	true_deadline_window=7,
	true_carbon_flexible=True,
	),
	_Archetype(
	job_type="evaluation",
	job_description=(
	"Model evaluation: MMLU, HellaSwag, TruthfulQA benchmarks — "
	"results required before 15:30 team standup, cannot be deferred"
	),
	estimated_kw=120.0,
	estimated_duration_hours=2.0,
	true_priority="MEDIUM",
	true_deadline_window=4,
	true_carbon_flexible=False,
	),
	_Archetype(
	job_type="fine_tuning",
	job_description=(
	"LoRA fine-tune of Llama-3-8B on customer support corpus — "
	"needed for A/B test next morning, happy to run in evening low-carbon window"
	),
	estimated_kw=200.0,
	estimated_duration_hours=5.0,
	true_priority="MEDIUM",
	true_deadline_window=6,
	true_carbon_flexible=True,
	),
	_Archetype(
	job_type="inference",
	job_description=(
	"Inference latency benchmark: P50/P95/P99 across batch sizes 1–64 — "
	"blocking capacity planning doc due window 3, time-sensitive"
	),
	estimated_kw=80.0,
	estimated_duration_hours=1.0,
	true_priority="HIGH",
	true_deadline_window=3,
	true_carbon_flexible=False,
	),
	_Archetype(
	job_type="batch",
	job_description=(
	"Embedding generation for 2M product descriptions — "
	"feeds recommendation reindex scheduled for tomorrow, fully deferrable"
	),
	estimated_kw=100.0,
	estimated_duration_hours=3.0,
	true_priority="LOW",
	true_deadline_window=7,
	true_carbon_flexible=True,
	),
	)


	# ── Team B — 8 archetypes (strategic: stated values always inflated) ──────────

	# Job templates that StrategicTeam samples from.
	# In every entry stated_priority ranks above true_priority (assuming the usual
	# ordering LOW < MEDIUM < HIGH < CRITICAL — the ordering itself is defined
	# outside this file).
	# true_deadline_window ranges from 4 to 6, so StrategicTeam's deadline filter
	# leaves no candidates at window_idx 7 and it returns an empty list there.
	_TEAM_B_ARCHETYPES: tuple[_TeamBArchetype, ...] = (
	_TeamBArchetype(
	job_type="fine_tuning",
	job_description=(
	"Production LLM fine-tune: customer-facing model update — "
	"business stakeholders require completion before close of business today"
	),
	estimated_kw=320.0,
	estimated_duration_hours=8.0,
	true_priority="MEDIUM",
	true_deadline_window=6,
	true_carbon_flexible=True,
	stated_priority="CRITICAL",
	),
	_TeamBArchetype(
	job_type="inference",
	job_description=(
	"Real-time inference serving: new model deployment requires "
	"warm-up pass before traffic cutover — cannot defer, production dependency"
	),
	estimated_kw=150.0,
	estimated_duration_hours=4.0,
	true_priority="HIGH",
	true_deadline_window=5,
	true_carbon_flexible=False,
	stated_priority="CRITICAL",
	),
	_TeamBArchetype(
	job_type="training",
	job_description=(
	"Customer deadline training: contractual SLA mandates model delivery by EOD — "
	"legal consequences if missed"
	),
	estimated_kw=280.0,
	estimated_duration_hours=6.0,
	true_priority="LOW",
	true_deadline_window=6,
	true_carbon_flexible=True,
	stated_priority="CRITICAL",
	),
	_TeamBArchetype(
	job_type="training",
	job_description=(
	"Model alignment run: safety evaluations blocking product review — "
	"must complete before executive sign-off meeting"
	),
	estimated_kw=240.0,
	estimated_duration_hours=5.0,
	true_priority="MEDIUM",
	true_deadline_window=5,
	true_carbon_flexible=True,
	stated_priority="HIGH",
	),
	_TeamBArchetype(
	job_type="inference",
	job_description=(
	"API serving hot standby: redundant inference replica for failover — "
	"production traffic depends on this, cannot be deferred under any circumstances"
	),
	estimated_kw=100.0,
	estimated_duration_hours=12.0,
	true_priority="MEDIUM",
	true_deadline_window=4,
	true_carbon_flexible=False,
	stated_priority="CRITICAL",
	),
	_TeamBArchetype(
	job_type="evaluation",
	job_description=(
	"Evaluation pipeline: regression suite blocking next deployment — "
	"on-call engineer waiting, every hour of delay is an incident"
	),
	estimated_kw=160.0,
	estimated_duration_hours=3.0,
	true_priority="LOW",
	true_deadline_window=5,
	true_carbon_flexible=True,
	stated_priority="HIGH",
	),
	_TeamBArchetype(
	job_type="training",
	job_description=(
	"Compliance model retrain: regulatory audit requires updated model "
	"artifacts submitted by close of business — non-negotiable"
	),
	estimated_kw=300.0,
	estimated_duration_hours=7.0,
	true_priority="MEDIUM",
	true_deadline_window=5,
	true_carbon_flexible=True,
	stated_priority="CRITICAL",
	),
	_TeamBArchetype(
	job_type="batch",
	job_description=(
	"Real-time recommendation model update: A/B test launch requires "
	"fresh weights loaded before traffic split — launch is time-locked"
	),
	estimated_kw=200.0,
	estimated_duration_hours=4.0,
	true_priority="LOW",
	true_deadline_window=4,
	true_carbon_flexible=True,
	stated_priority="HIGH",
	),
	)

	# Probability that StrategicTeam declares a truly carbon-flexible job as inflexible.
	_TEAM_B_CARBON_GAMING_RATE: float = 0.60
	# carbon_intensity labels that CooperativeTeam treats as a high-carbon window.
	_HIGH_CARBON_LABELS: frozenset[str] = frozenset({"high", "critical"})


	# ── CooperativeTeam ───────────────────────────────────────────────────────────


	class CooperativeTeam:
	    """
	    Scripted honest team (default id ``team_a``).

	    Every stated field on an emitted request is copied from the archetype's
	    true value. While the grid is in a high-carbon state the team holds back
	    its carbon-flexible archetypes, unless that would leave it with nothing to
	    submit. Archetypes are sampled with probability inversely proportional to
	    the number of windows left before their deadline.
	    """

	    def __init__(self, team_id: str = "team_a") -> None:
	        self.team_id = team_id

	    def generate_window_requests(
	        self,
	        window_idx: int,
	        carbon_intensity: str,
	        rng: np.random.Generator,
	    ) -> list[JobRequest]:
	        """
	        Return the job requests this team submits in one negotiation window.

	        Args:
	            window_idx: index of the current window.
	            carbon_intensity: grid label; members of ``_HIGH_CARBON_LABELS``
	                count as high carbon, anything else does not.
	            rng: generator used for the request count and the archetype draw.

	        Returns:
	            One or two requests, or an empty list when every archetype's
	            true deadline lies before ``window_idx``.
	        """
	        # Archetypes whose hard deadline has not passed yet.
	        live = [
	            arch for arch in _TEAM_A_ARCHETYPES
	            if window_idx <= arch.true_deadline_window
	        ]

	        if carbon_intensity in _HIGH_CARBON_LABELS:
	            # Hold back deferrable work; if nothing else is left, submit it anyway.
	            rigid = [arch for arch in live if not arch.true_carbon_flexible]
	            pool = rigid or live
	        else:
	            pool = live

	        if not pool:
	            return []  # nothing left with an open deadline

	        # Sampling probability is 1/slack, with slack floored at 1 so that
	        # jobs due this window and next window share the top weight.
	        inverse_slack = [
	            1.0 / max(1, arch.true_deadline_window - window_idx) for arch in pool
	        ]
	        probs = np.array(inverse_slack, dtype=float)
	        probs = probs / probs.sum()

	        count = min(int(rng.integers(1, 3)), len(pool))
	        picks = rng.choice(len(pool), size=count, replace=False, p=probs)

	        return [
	            self._build_request(pool[idx], window_idx, slot)
	            for slot, idx in enumerate(picks)
	        ]

	    def _build_request(
	        self,
	        arch: _Archetype,
	        window_idx: int,
	        slot: int,
	    ) -> JobRequest:
	        """
	        Turn one archetype into a JobRequest with truthful declarations.

	        The stated deadline text depends on how many windows remain:
	        more than 3 -> "flexible", 2 or 3 -> "by window N", otherwise "urgent".
	        ``slot`` is the request's position within this window and only
	        feeds the request id.
	        """
	        remaining = arch.true_deadline_window - window_idx
	        if remaining > 3:
	            deadline_text = "flexible"
	        elif remaining > 1:
	            deadline_text = f"by window {arch.true_deadline_window}"
	        else:
	            deadline_text = "urgent"

	        return JobRequest(
	            request_id=f"req_{window_idx}_{self.team_id}_{slot}",
	            team_id=self.team_id,
	            job_type=arch.job_type,
	            job_description=arch.job_description,
	            estimated_kw=arch.estimated_kw,
	            estimated_duration_hours=arch.estimated_duration_hours,
	            true_deadline_window=arch.true_deadline_window,
	            stated_deadline=deadline_text,
	            true_priority=arch.true_priority,
	            stated_priority=arch.true_priority,  # stated == true
	            true_carbon_flexible=arch.true_carbon_flexible,
	            stated_carbon_flexible=arch.true_carbon_flexible,  # stated == true
	        )


	# ── StrategicTeam ─────────────────────────────────────────────────────────────


	class StrategicTeam:
	    """
	    Scripted gaming team (default id ``team_b``).

	    Each request carries the archetype's hard-coded ``stated_priority``
	    (HIGH or CRITICAL) and a ``stated_deadline`` of "urgent", whatever the
	    true deadline is. A job that is truly carbon-flexible is declared
	    inflexible with probability ``_TEAM_B_CARBON_GAMING_RATE``. Grid carbon
	    intensity plays no part in what gets submitted.
	    """

	    def __init__(self, team_id: str = "team_b") -> None:
	        self.team_id = team_id

	    def generate_window_requests(
	        self,
	        window_idx: int,
	        carbon_intensity: str,  # accepted to match CooperativeTeam's signature; never read
	        rng: np.random.Generator,
	    ) -> list[JobRequest]:
	        """
	        Return the job requests this team submits in one negotiation window.

	        Archetypes whose true deadline lies before ``window_idx`` are dropped;
	        the survivors are sampled uniformly without replacement.

	        Returns:
	            One or two requests, or an empty list when no archetype has
	            ``true_deadline_window >= window_idx``.
	        """
	        open_archetypes = [
	            arch for arch in _TEAM_B_ARCHETYPES
	            if window_idx <= arch.true_deadline_window
	        ]
	        if not open_archetypes:
	            return []

	        count = min(int(rng.integers(1, 3)), len(open_archetypes))
	        picks = rng.choice(len(open_archetypes), size=count, replace=False)

	        return [
	            self._build_request(open_archetypes[idx], window_idx, slot, rng)
	            for slot, idx in enumerate(picks)
	        ]

	    def _build_request(
	        self,
	        arch: _TeamBArchetype,
	        window_idx: int,
	        slot: int,
	        rng: np.random.Generator,
	    ) -> JobRequest:
	        """
	        Turn one archetype into a JobRequest with inflated declarations.

	        ``rng`` is consulted only for carbon-flexible archetypes, to decide
	        whether the flexibility is concealed on this request. ``slot`` is the
	        request's position within this window and only feeds the request id.
	        """
	        # Short-circuit keeps the random draw from happening for inflexible jobs.
	        conceal = arch.true_carbon_flexible and rng.random() < _TEAM_B_CARBON_GAMING_RATE
	        declared_flexible = False if conceal else arch.true_carbon_flexible

	        return JobRequest(
	            request_id=f"req_{window_idx}_{self.team_id}_{slot}",
	            team_id=self.team_id,
	            job_type=arch.job_type,
	            job_description=arch.job_description,
	            estimated_kw=arch.estimated_kw,
	            estimated_duration_hours=arch.estimated_duration_hours,
	            true_deadline_window=arch.true_deadline_window,
	            stated_deadline="urgent",  # same text for every Team B request
	            true_priority=arch.true_priority,
	            stated_priority=arch.stated_priority,  # inflated value from the archetype
	            true_carbon_flexible=arch.true_carbon_flexible,
	            stated_carbon_flexible=declared_flexible,
	        )