Spaces:

soham27
/

AvigilanceEnv

Sleeping

App Files Files Community

AvigilanceEnv / app.py

soham27

Add real-source ingestion and expand hybrid corpus

c07553d about 2 months ago

raw

history blame contribute delete

62.7 kB

	import json
	from pathlib import Path
	from typing import Any

	import uvicorn
	from fastapi import FastAPI, HTTPException
	from fastapi.responses import HTMLResponse, JSONResponse, RedirectResponse

	from environment.avigilance_env import AvigilanceEnv
	from environment.models import AvigilanceAction


	FRONTEND_HTML = """
	<!DOCTYPE html>
	<html lang="en">
	<head>
	<meta charset="UTF-8">
	<meta name="viewport" content="width=device-width, initial-scale=1.0">
	<title>AvigilanceEnv Space Console</title>
	<link rel="preconnect" href="https://fonts.googleapis.com">
	<link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
	<link href="https://fonts.googleapis.com/css2?family=Sora:wght@400;500;600;700;800&family=IBM+Plex+Mono:wght@400;500&display=swap" rel="stylesheet">
	<style>
	:root {
	--bg: #f3ecdf;
	--panel: rgba(255, 250, 244, 0.76);
	--panel-strong: linear-gradient(145deg, #0f2e36 0%, #1f4e57 44%, #d26831 100%);
	--text: #12232c;
	--muted: #5c6b72;
	--accent: #d26831;
	--line: rgba(18, 35, 44, 0.12);
	--line-strong: rgba(255, 255, 255, 0.18);
	--shadow: 0 28px 70px rgba(20, 35, 41, 0.14);
	--shadow-soft: 0 16px 32px rgba(20, 35, 41, 0.08);
	--surface-dark: #0f2128;
	--surface-dark-2: #132a33;
	--success: #19816f;
	--warn: #b96e17;
	}

	* { box-sizing: border-box; }
	html { scroll-behavior: smooth; }

	body {
	margin: 0;
	font-family: "Sora", "Segoe UI Variable", sans-serif;
	color: var(--text);
	background:
	radial-gradient(circle at 10% 10%, rgba(210, 104, 49, 0.16), transparent 18%),
	radial-gradient(circle at 88% 12%, rgba(15, 140, 127, 0.14), transparent 20%),
	linear-gradient(180deg, #f8f2e8 0%, var(--bg) 100%);
	}

	code, pre, textarea, input, select {
	font-family: "IBM Plex Mono", monospace;
	}

	.page-shell {
	position: relative;
	width: min(1360px, calc(100vw - 32px));
	margin: 0 auto;
	padding: 24px 0 64px;
	}

	.page-noise {
	position: fixed;
	inset: 0;
	background-image:
	linear-gradient(rgba(255,255,255,0.03) 1px, transparent 1px),
	linear-gradient(90deg, rgba(255,255,255,0.03) 1px, transparent 1px);
	background-size: 24px 24px;
	pointer-events: none;
	opacity: 0.45;
	}

	.topbar,
	.hero,
	.ops-grid,
	.walkthrough-grid,
	.console-grid,
	.hero-signal-grid,
	.task-card-grid,
	.summary-strip {
	display: grid;
	gap: 20px;
	}

	.topbar {
	grid-template-columns: 1.2fr auto;
	align-items: end;
	gap: 16px;
	margin-bottom: 20px;
	}

	.topbar-copy {
	display: grid;
	gap: 14px;
	}

	.topbar-nav {
	display: flex;
	flex-wrap: wrap;
	gap: 10px;
	}

	.nav-link {
	display: inline-flex;
	align-items: center;
	justify-content: center;
	padding: 10px 14px;
	border-radius: 999px;
	border: 1px solid rgba(18, 35, 44, 0.12);
	background: rgba(255, 251, 247, 0.72);
	color: var(--text);
	text-decoration: none;
	font-size: 0.82rem;
	font-weight: 700;
	box-shadow: var(--shadow-soft);
	}

	.topbar h1 {
	margin: 8px 0 0;
	font-size: clamp(2.4rem, 5vw, 4.7rem);
	line-height: 0.95;
	letter-spacing: -0.06em;
	}

	.topbar-chips {
	display: flex;
	flex-wrap: wrap;
	justify-content: flex-end;
	gap: 10px;
	}

	.chip {
	padding: 10px 14px;
	border-radius: 999px;
	border: 1px solid rgba(18, 35, 44, 0.1);
	background: rgba(255, 251, 247, 0.86);
	box-shadow: var(--shadow-soft);
	font-size: 0.82rem;
	}

	.hero {
	grid-template-columns: 1.5fr 0.95fr;
	align-items: stretch;
	margin-bottom: 22px;
	}

	.panel {
	border: 1px solid var(--line);
	border-radius: 28px;
	box-shadow: var(--shadow);
	background: var(--panel);
	padding: 24px;
	}

	.panel-dark {
	background: linear-gradient(135deg, #fff9f1 0%, #f5e7d7 55%, #edd8c0 100%);
	color: var(--text);
	position: relative;
	overflow: hidden;
	border: 1px solid rgba(18, 35, 44, 0.08);
	}

	.panel-dark::after {
	content: "";
	position: absolute;
	inset: auto -40px -50px auto;
	width: 280px;
	height: 280px;
	border-radius: 50%;
	background: radial-gradient(circle, rgba(210, 104, 49, 0.18), transparent 72%);
	pointer-events: none;
	}

	.hero-stage { padding: 28px; }
	.hero-copy { position: relative; z-index: 1; }

	.hero-copy h2 {
	margin: 10px 0 14px;
	max-width: 13ch;
	font-size: clamp(2.1rem, 4vw, 3.6rem);
	line-height: 0.98;
	letter-spacing: -0.05em;
	}

	.hero-copy .lead {
	max-width: 64ch;
	color: var(--muted);
	font-size: 1rem;
	line-height: 1.72;
	}

	.eyebrow,
	.label {
	text-transform: uppercase;
	letter-spacing: 0.18em;
	font-size: 0.72rem;
	font-weight: 600;
	}

	.hero-actions,
	.button-group,
	.control-row {
	display: flex;
	flex-wrap: wrap;
	gap: 12px;
	}

	.hero-actions { margin-top: 22px; }

	.hero-signal-grid {
	margin-top: 28px;
	grid-template-columns: repeat(4, minmax(0, 1fr));
	position: relative;
	z-index: 1;
	}

	.signal-card {
	min-height: 128px;
	padding: 18px;
	border-radius: 22px;
	border: 1px solid rgba(18, 35, 44, 0.08);
	background: rgba(255, 255, 255, 0.74);
	}

	.signal-card.highlight { background: rgba(255, 255, 255, 0.92); }

	.signal-card .label { color: var(--accent); }

	.signal-card strong {
	display: block;
	margin: 10px 0 6px;
	font-size: 1.2rem;
	color: var(--text);
	}

	.signal-card p {
	margin: 0;
	color: var(--muted);
	line-height: 1.55;
	}

	.hero-rail h3 {
	margin: 10px 0 8px;
	font-size: 1.5rem;
	line-height: 1.1;
	}

	.hero-rail p,
	.console-heading p,
	.walkthrough article p {
	margin: 0;
	color: var(--muted);
	line-height: 1.6;
	}

	.hero-rail {
	display: grid;
	align-content: start;
	gap: 18px;
	}

	.task-card-grid { margin: 22px 0; }

	.task-card {
	padding: 16px 18px;
	border-radius: 20px;
	border: 1px solid var(--line);
	background: rgba(255, 255, 255, 0.58);
	text-align: left;
	cursor: pointer;
	transition: transform 160ms ease, border-color 160ms ease, background 160ms ease;
	}

	.task-card:hover,
	.task-card.is-active {
	transform: translateY(-1px);
	border-color: rgba(210, 104, 49, 0.45);
	background: rgba(255, 245, 237, 0.96);
	}

	.task-card span,
	.rail-metrics span {
	display: block;
	margin-bottom: 6px;
	text-transform: uppercase;
	letter-spacing: 0.14em;
	font-size: 0.7rem;
	color: var(--muted);
	}

	.task-card strong,
	.rail-metrics strong {
	display: block;
	font-size: 0.98rem;
	line-height: 1.4;
	}

	.rail-metrics { display: grid; gap: 14px; margin-bottom: 18px; }
	.wide { width: 100%; }

	.button {
	appearance: none;
	border: 1px solid transparent;
	border-radius: 999px;
	padding: 12px 18px;
	cursor: pointer;
	text-decoration: none;
	transition: transform 160ms ease, background 160ms ease, border-color 160ms ease;
	font-weight: 700;
	}

	.button:hover { transform: translateY(-1px); }
	.button.primary { background: var(--accent); color: #fff7f0; }
	.button.secondary { background: var(--surface-dark); color: #f6efe5; }
	.button.ghost { background: transparent; color: var(--text); border-color: var(--line); }

	.ops-grid { grid-template-columns: 1.5fr 0.82fr; margin-bottom: 22px; }
	.side-stack { display: grid; gap: 20px; }
	.panel-accent { background: linear-gradient(180deg, rgba(255, 249, 242, 0.92), rgba(255, 244, 233, 0.82)); }
	.walkthrough-grid { grid-template-columns: repeat(3, 1fr); }
	.summary-strip { grid-template-columns: repeat(3, minmax(0, 1fr)); margin-bottom: 18px; }
	.explain-grid { display: grid; grid-template-columns: 1.08fr 0.92fr; gap: 18px; margin-top: 18px; }
	.meaning-stack { display: grid; gap: 16px; }

	.panel-header {
	display: flex;
	align-items: center;
	justify-content: space-between;
	gap: 16px;
	margin-bottom: 18px;
	}

	.panel-header.compact { margin-bottom: 14px; }
	.panel-header h2 { margin: 8px 0 0; font-size: 1.45rem; }

	.checklist { margin: 0; padding-left: 18px; line-height: 1.7; }
	.checklist.strong li + li { margin-top: 10px; }

	label { display: grid; gap: 8px; min-width: 180px; }

	input, select, textarea {
	width: 100%;
	border: 1px solid var(--line);
	border-radius: 16px;
	background: rgba(255, 255, 255, 0.78);
	color: var(--text);
	padding: 13px 15px;
	}

	select, input { min-height: 50px; }
	textarea { min-height: 320px; resize: vertical; }

	#actionInputHelp {
	margin: 10px 2px 0;
	color: var(--muted);
	font-size: 0.9rem;
	line-height: 1.4;
	}

	.stretch { align-items: flex-end; }
	.stretch .button { min-height: 50px; }

	.summary-card,
	.console-panel,
	.meaning-panel,
	.legend-panel,
	.walkthrough article,
	.panel-log {
	border: 1px solid rgba(18, 35, 44, 0.08);
	border-radius: 22px;
	background: rgba(255, 255, 255, 0.48);
	box-shadow: var(--shadow-soft);
	}

	.summary-card { padding: 16px 18px; }
	.summary-card strong { display: block; margin-top: 8px; font-size: 1rem; line-height: 1.45; }
	.console-grid.triple { grid-template-columns: repeat(3, minmax(0, 1fr)); }
	.console-panel { padding: 18px; }
	.console-heading { margin-bottom: 14px; }
	.console-heading h3,
	.walkthrough article h3 { margin: 0 0 6px; font-size: 1.05rem; }

	.meaning-panel,
	.legend-panel {
	padding: 18px;
	}

	.meaning-panel h3,
	.legend-panel h3 {
	margin: 0 0 8px;
	font-size: 1rem;
	}

	.meaning-panel p,
	.legend-panel p {
	margin: 0;
	color: var(--muted);
	line-height: 1.6;
	}

	.meaning-body {
	margin-top: 12px;
	white-space: pre-wrap;
	line-height: 1.65;
	}

	.legend-list {
	display: grid;
	gap: 10px;
	margin-top: 14px;
	}

	.legend-item {
	padding: 12px 14px;
	border-radius: 16px;
	background: rgba(255, 255, 255, 0.7);
	border: 1px solid rgba(18, 35, 44, 0.08);
	}

	.legend-item strong {
	display: block;
	margin-bottom: 6px;
	font-size: 0.92rem;
	}

	.legend-item span {
	color: var(--muted);
	line-height: 1.55;
	font-size: 0.92rem;
	}

	.hint-list {
	display: grid;
	gap: 10px;
	margin: 0;
	padding-left: 18px;
	line-height: 1.65;
	}

	.control-hint {
	margin: 10px 0 0;
	color: var(--muted);
	line-height: 1.6;
	font-size: 0.92rem;
	}

	.reward-detail-grid {
	display: grid;
	grid-template-columns: repeat(4, minmax(0, 1fr));
	gap: 12px;
	margin-bottom: 18px;
	}

	.reward-detail-card {
	padding: 14px;
	border-radius: 18px;
	background: rgba(255, 255, 255, 0.66);
	border: 1px solid rgba(18, 35, 44, 0.08);
	box-shadow: var(--shadow-soft);
	}

	.reward-detail-card strong {
	display: block;
	margin-top: 6px;
	font-size: 1rem;
	line-height: 1.45;
	}

	pre {
	margin: 0;
	min-height: 320px;
	padding: 18px;
	border-radius: 18px;
	background: linear-gradient(180deg, var(--surface-dark) 0%, var(--surface-dark-2) 100%);
	color: #dce8e6;
	overflow: auto;
	white-space: pre-wrap;
	word-break: break-word;
	line-height: 1.5;
	}

	.status-pill {
	padding: 10px 14px;
	border-radius: 999px;
	background: rgba(15, 33, 40, 0.08);
	font-size: 0.82rem;
	font-weight: 700;
	}

	.status-pill.ok { background: rgba(25, 129, 111, 0.14); color: var(--success); }
	.status-pill.warn { background: rgba(185, 110, 23, 0.14); color: var(--warn); }
	.status-pill.error { background: rgba(160, 33, 33, 0.14); color: #8d1f1f; }

	.timeline {
	display: grid;
	gap: 12px;
	margin: 0;
	padding: 0;
	list-style: none;
	}

	.timeline li {
	padding: 14px 14px 14px 16px;
	border-left: 3px solid rgba(210, 104, 49, 0.45);
	border-radius: 0 18px 18px 0;
	background: rgba(255, 255, 255, 0.52);
	}

	.timeline-tag {
	display: inline-flex;
	margin-bottom: 8px;
	padding: 4px 9px;
	border-radius: 999px;
	background: rgba(18, 35, 44, 0.08);
	font-size: 0.72rem;
	text-transform: uppercase;
	letter-spacing: 0.14em;
	}

	.timeline p { margin: 0; line-height: 1.5; }
	.walkthrough article { padding: 18px; }

	@media (max-width: 960px) {
	.topbar,
	.hero,
	.ops-grid,
	.walkthrough-grid,
	.console-grid,
	.hero-signal-grid,
	.summary-strip,
	.explain-grid {
	grid-template-columns: 1fr;
	}

	.reward-detail-grid {
	grid-template-columns: 1fr 1fr;
	}

	.topbar-chips { justify-content: flex-start; }

	.page-shell {
	width: min(100vw - 20px, 100%);
	padding-top: 18px;
	}

	.hero-stage,
	.hero-rail,
	.panel { padding: 20px; }
	}
	</style>
	</head>
	<body>
	<div class="page-shell">
	<div class="page-noise" aria-hidden="true"></div>
	<header class="topbar">
	<div class="topbar-copy">
	<div>
	<p class="eyebrow">DGCA Monitoring Space</p>
	<h1>Avigilance Mission Console</h1>
	</div>
	<nav class="topbar-nav" aria-label="Primary">
	<a class="nav-link" href="#controlDeck">Control Deck</a>
	<a class="nav-link" href="#jsonGuide">JSON Guide</a>
	<a class="nav-link" href="#walkthrough">Walkthrough</a>
	</nav>
	</div>
	<div class="topbar-chips">
	<span class="chip">20k+ Hybrid Corpus</span>
	<span class="chip">OpenEnv Ready</span>
	<span class="chip">Real Ingestion Plan Ready</span>
	</div>
	</header>
	<main>
	<section class="hero" id="console">
	<article class="hero-stage panel panel-dark">
	<div class="hero-copy">
	<p class="eyebrow">Live Operations Deck</p>
	<h2>Run task resets, inspect payloads, and submit exact environment actions from one screen.</h2>
	<p class="lead">This Space root is entirely self-contained in app.py and now fronts a 20k-plus hybrid corpus with broader airline, airport, and incident coverage, plus a documented path for DGCA, AAIB, and AAI ingestion.</p>
	<div class="hero-actions">
	<a class="button primary" href="#controlDeck">Open Control Deck</a>
	<a class="button ghost" href="#walkthrough">Verification Flow</a>
	</div>
	</div>
	<div class="hero-signal-grid">
	<div class="signal-card highlight">
	<span class="label">API Health</span>
	<strong id="healthStatus">Checking...</strong>
	<p id="healthDetail">Polling live service metadata.</p>
	</div>
	<div class="signal-card">
	<span class="label">Runtime</span>
	<strong id="metadataStatus">Loading...</strong>
	<p id="corpusStatus">Loading corpus coverage and manifest details.</p>
	</div>
	<div class="signal-card">
	<span class="label">Session</span>
	<strong id="sessionStatus">No episode yet</strong>
	<p id="sessionDetail">Reset any task to initialize an active episode.</p>
	</div>
	<div class="signal-card">
	<span class="label">Reward Guardrail</span>
	<strong>(0, 1)</strong>
	<p>Scores remain strictly inside the open interval.</p>
	</div>
	</div>
	</article>
	<aside class="hero-rail panel">
	<div class="rail-block">
	<p class="eyebrow">Active Task</p>
	<h3 id="taskTitle">task1 · FTO Quality Scorer</h3>
	<p id="taskDescription">Grade a Flying Training Organisation against the DGCA rubric and recommend action.</p>
	</div>
	<div class="task-card-grid">
	<button class="task-card is-active" data-task="task1" type="button">
	<span>task1</span>
	<strong>FTO Quality</strong>
	</button>
	<button class="task-card" data-task="task2" type="button">
	<span>task2</span>
	<strong>Incident Prioritiser</strong>
	</button>
	<button class="task-card" data-task="task3" type="button">
	<span>task3</span>
	<strong>Resource Allocator</strong>
	</button>
	</div>
	<div class="rail-metrics">
	<div>
	<span class="label">Endpoints</span>
	<strong>/reset · /step · /state</strong>
	</div>
	<div>
	<span class="label">Use Case</span>
	<strong>Reviewer preflight and corpus inspection</strong>
	</div>
	</div>
	<button class="button secondary wide" id="refreshStatus" type="button">Refresh Live Status</button>
	</aside>
	</section>

	<section class="ops-grid">
	<article class="panel panel-accent">
	<div class="panel-header">
	<div>
	<p class="eyebrow">Control Deck</p>
	<h2 id="controlDeck">Interactive Task Runner</h2>
	</div>
	<div class="status-pill" id="resultBadge">Awaiting reset</div>
	</div>
	<div class="control-row">
	<label>
	<span class="label">Task</span>
	<select id="taskSelect">
	<option value="task1">task1: FTO Quality Scorer</option>
	<option value="task2">task2: Incident Prioritiser</option>
	<option value="task3">task3: Resource Allocator</option>
	</select>
	</label>
	<label>
	<span class="label">Seed</span>
	<input id="seedInput" type="number" value="42">
	</label>
	<div class="button-group stretch">
	<button class="button primary" id="resetEpisode" type="button">Reset Episode</button>
	<button class="button ghost" id="randomSeed" type="button">Randomize Seed</button>
	<button class="button ghost" id="loadExample" type="button">Load Example Action</button>
	<button class="button ghost" id="fetchState" type="button">Fetch State</button>
	<button class="button secondary" id="submitAction" type="button">Submit Step</button>
	</div>
	</div>
	<p class="control-hint">The default seed is 42, which recreates the same scenario every time. If you want different observations and different rewards, change the seed or use Randomize Seed before resetting.</p>
	<div class="summary-strip">
	<div class="summary-card">
	<span class="label">Observation Snapshot</span>
	<strong id="observationSummary">No observation loaded</strong>
	</div>
	<div class="summary-card">
	<span class="label">Last Reward</span>
	<strong id="rewardSummary">None yet</strong>
	</div>
	<div class="summary-card">
	<span class="label">Episode State</span>
	<strong id="doneSummary">Idle</strong>
	</div>
	</div>
	<div class="reward-detail-grid">
	<div class="reward-detail-card">
	<span class="label">Accuracy</span>
	<strong id="accuracySummary">Not available</strong>
	</div>
	<div class="reward-detail-card">
	<span class="label">Consistency</span>
	<strong id="consistencySummary">Not available</strong>
	</div>
	<div class="reward-detail-card">
	<span class="label">Safety Alignment</span>
	<strong id="safetySummary">Not available</strong>
	</div>
	<div class="reward-detail-card">
	<span class="label">Why This Changes</span>
	<strong id="rewardWhySummary">Depends on seed and action</strong>
	</div>
	</div>
	<div class="console-grid triple">
	<section class="console-panel">
	<div class="console-heading">
	<h3>Observation Payload</h3>
	<p>Backend response after reset or step.</p>
	</div>
	<pre id="observationView">Press Reset Episode to start.</pre>
	</section>
	<section class="console-panel">
	<div class="console-heading">
	<h3>Action Editor</h3>
	<p>Use typed JSON matching the task schema.</p>
	</div>
	<label for="actionInput" class="label">Action JSON</label>
	<textarea id="actionInput" spellcheck="false" aria-describedby="actionInputHelp"></textarea>
	<p id="actionInputHelp">The helper can prefill a valid payload, but you can edit every field before submit.</p>
	</section>
	<section class="console-panel">
	<div class="console-heading">
	<h3>Runtime Result</h3>
	<p>State, reward, or error output from the active request.</p>
	</div>
	<pre id="resultView">Waiting for actions.</pre>
	</section>
	</div>
	<div class="explain-grid">
	<div class="meaning-stack">
	<section class="meaning-panel">
	<h3>Observation Interpretation</h3>
	<p>Plain-English explanation of what the latest observation is telling you.</p>
	<div class="meaning-body" id="observationMeaning">Reset a task to see the live scenario translated into plain language.</div>
	</section>
	<section class="meaning-panel">
	<h3>Action Interpretation</h3>
	<p>Readable summary of the action payload currently in the editor.</p>
	<div class="meaning-body" id="actionMeaning">Pick a task or load an example action to see what your JSON is doing.</div>
	</section>
	<section class="meaning-panel">
	<h3>Result Interpretation</h3>
	<p>Short explanation of reward, completion state, and backend response behavior.</p>
	<div class="meaning-body" id="resultMeaning">Submit a step or fetch state to decode the response here.</div>
	</section>
	</div>
	<section class="legend-panel">
	<h3>Current Task Field Guide</h3>
	<p>Human-readable meaning of the most important fields for the selected task.</p>
	<div class="legend-list" id="fieldLegend"></div>
	</section>
	</div>
	</article>
	<aside class="side-stack">
	<article class="panel">
	<div class="panel-header compact">
	<div>
	<p class="eyebrow">Operational Notes</p>
	<h2>Task Guidance</h2>
	</div>
	</div>
	<ul class="checklist strong">
	<li><strong>task1</strong> is a one-step FTO grading decision with a DGCA action recommendation.</li>
	<li><strong>task2</strong> ranks incidents by urgency and can escalate the highest-risk cases immediately.</li>
	<li><strong>task3</strong> allocates inspector time and may require multiple steps depending on the scenario.</li>
	</ul>
	</article>
	<article class="panel" id="jsonGuide">
	<div class="panel-header compact">
	<div>
	<p class="eyebrow">JSON Guide</p>
	<h2>What The Response Means</h2>
	</div>
	</div>
	<ul class="hint-list">
	<li><strong>observation</strong> is the live environment state after reset or step.</li>
	<li><strong>reward</strong> is the scored feedback for the action you submitted.</li>
	<li><strong>done</strong> tells you whether the episode is finished.</li>
	<li><strong>info</strong> contains extra backend details that help explain the outcome.</li>
	<li><strong>action JSON</strong> is your decision payload, not the backend response.</li>
	</ul>
	</article>
	<article class="panel panel-log">
	<div class="panel-header compact">
	<div>
	<p class="eyebrow">Activity Feed</p>
	<h2>Operator Timeline</h2>
	</div>
	</div>
	<ol class="timeline" id="timeline">
	<li>
	<span class="timeline-tag">boot</span>
	<p>Console loaded. Pulling service metadata.</p>
	</li>
	</ol>
	</article>
	</aside>
	</section>

	<section class="walkthrough panel" id="walkthrough">
	<div class="panel-header">
	<div>
	<p class="eyebrow">Verification Path</p>
	<h2>How This Space Should Be Reviewed</h2>
	</div>
	</div>
	<div class="walkthrough-grid">
	<article>
	<h3>1. Reset a live task</h3>
	<p>Choose one of the three environments, seed it deterministically, and inspect the exact observation payload emitted by the backend.</p>
	</article>
	<article>
	<h3>2. Submit a typed action</h3>
	<p>Load the generated example or replace it with your own JSON, then submit the request against the same /step endpoint validators hit.</p>
	</article>
	<article>
	<h3>3. Verify contract behavior</h3>
	<p>Use the result panel and activity feed to confirm reward bounds, episode status, and endpoint availability before running repository validation scripts.</p>
	</article>
	</div>
	</section>
	</main>
	</div>
	<script>
	// Cached DOM handles. Each constant is the element whose id matches the
	// string passed to getElementById; they are looked up once when the script
	// runs so the functions below can update the page without re-querying.

	// Hero signal cards (health, runtime/corpus, session).
	const healthStatus = document.getElementById("healthStatus");
	const healthDetail = document.getElementById("healthDetail");
	const metadataStatus = document.getElementById("metadataStatus");
	const corpusStatus = document.getElementById("corpusStatus");
	const sessionStatus = document.getElementById("sessionStatus");
	const sessionDetail = document.getElementById("sessionDetail");
	// Console panels and the action editor textarea.
	const observationView = document.getElementById("observationView");
	const resultView = document.getElementById("resultView");
	const actionInput = document.getElementById("actionInput");
	// Task and seed controls, plus the active-task heading in the side rail.
	const taskSelect = document.getElementById("taskSelect");
	const seedInput = document.getElementById("seedInput");
	const taskTitle = document.getElementById("taskTitle");
	const taskDescription = document.getElementById("taskDescription");
	// Summary strip and reward breakdown cards.
	const rewardSummary = document.getElementById("rewardSummary");
	const accuracySummary = document.getElementById("accuracySummary");
	const consistencySummary = document.getElementById("consistencySummary");
	const safetySummary = document.getElementById("safetySummary");
	const rewardWhySummary = document.getElementById("rewardWhySummary");
	const doneSummary = document.getElementById("doneSummary");
	const observationSummary = document.getElementById("observationSummary");
	// Status pill and activity feed list.
	const resultBadge = document.getElementById("resultBadge");
	const timeline = document.getElementById("timeline");
	// Snapshot (real array, not a live NodeList) of every .task-card button.
	const taskCards = Array.from(document.querySelectorAll(".task-card"));
	// Plain-language interpretation panels and the field guide container.
	const observationMeaning = document.getElementById("observationMeaning");
	const actionMeaning = document.getElementById("actionMeaning");
	const resultMeaning = document.getElementById("resultMeaning");
	const fieldLegend = document.getElementById("fieldLegend");

	// Display metadata keyed by task id ("task1" | "task2" | "task3").
	//   title / description: written into the active-task heading by setTask.
	//   legend: ordered [fieldName, meaning] pairs rendered by renderLegend.
	const TASK_META = {
	task1: {
	title: "task1 · FTO Quality Scorer",
	description: "Grade a Flying Training Organisation against the DGCA rubric and recommend action.",
	legend: [
	["fto_profile", "The current training organization being reviewed, including safety, operations, compliance, and student support inputs."],
	["total_score", "Your aggregate DGCA-style assessment score for the FTO."],
	["recommended_action", "The operational decision you want the evaluator to take after grading."],
	["risk_flags", "Explicit reasons why this FTO may need closer attention."]
	]
	},
	task2: {
	title: "task2 · Incident Prioritiser",
	description: "Rank active incidents by operational urgency and identify escalation candidates.",
	legend: [
	["incident_batch", "The set of incidents currently waiting to be triaged."],
	["priority_ranking", "Your ordered list from most urgent to least urgent incident."],
	["escalate_immediately", "Incidents that should be handled without delay."],
	["defer_list", "Incidents that can safely wait compared with higher-priority items."]
	]
	},
	task3: {
	title: "task3 · Resource Allocator",
	description: "Allocate inspection bandwidth across incidents and FTO audits under time constraints.",
	legend: [
	["incident_queue / fto_audit_queue", "The backlog competing for limited inspection time."],
	["inspector_assignments", "Which work items each inspector should handle this round."],
	["deferred_items", "Items intentionally left for later because capacity ran out."],
	["predicted_risk_reduction", "Your estimate of how much operational risk the allocation removes."]
	]
	}
	};

	/**
	 * Serialize a value as JSON indented by two spaces.
	 * @param {*} value - Anything JSON.stringify accepts.
	 * @returns {string|undefined} The formatted JSON text.
	 */
	function pretty(value) {
	  const indentWidth = 2;
	  const formatted = JSON.stringify(value, null, indentWidth);
	  return formatted;
	}

	/**
	 * Update the result badge text and its tone class.
	 * @param {string} label - Text shown inside the badge.
	 * @param {string} [tone=""] - Optional modifier class appended after
	 *   "status-pill"; the stylesheet defines "ok", "warn" and "error".
	 */
	function setBadge(label, tone = "") {
	  let badgeClass = "status-pill";
	  if (tone) {
	    badgeClass = `${badgeClass} ${tone}`;
	  }
	  resultBadge.textContent = label;
	  resultBadge.className = badgeClass;
	}

	/**
	 * Prepend an entry to the activity feed and trim the feed to its newest
	 * six entries.
	 *
	 * The tag and message are inserted as plain text. They were previously
	 * interpolated into innerHTML, so any markup characters in a message
	 * would have been parsed as HTML instead of being displayed.
	 *
	 * @param {string} tag - Short category label shown in the pill.
	 * @param {string} message - Human-readable description of the event.
	 */
	function pushTimeline(tag, message) {
	  const maxEntries = 6;

	  const tagPill = document.createElement("span");
	  tagPill.className = "timeline-tag";
	  tagPill.textContent = tag;

	  const body = document.createElement("p");
	  body.textContent = message;

	  const item = document.createElement("li");
	  item.appendChild(tagPill);
	  item.appendChild(body);
	  timeline.prepend(item);

	  // Newest entries sit at the top, so the oldest is always the last child.
	  while (timeline.children.length > maxEntries) {
	    timeline.removeChild(timeline.lastElementChild);
	  }
	}

	/**
	 * Rebuild the field guide for one task from TASK_META[taskId].legend.
	 * @param {string} taskId - Key into TASK_META.
	 */
	function renderLegend(taskId) {
	  // Clear first so the container never shows another task's entries.
	  fieldLegend.innerHTML = "";
	  const entries = TASK_META[taskId].legend;
	  entries.forEach(([field, meaning]) => {
	    const row = document.createElement("div");
	    row.className = "legend-item";
	    row.innerHTML = `<strong>${field}</strong><span>${meaning}</span>`;
	    fieldLegend.appendChild(row);
	  });
	}

	/**
	 * Make taskId the selected task: sync the dropdown, heading, description,
	 * field guide, and the highlighted task card.
	 * @param {string} taskId - Key into TASK_META.
	 */
	function setTask(taskId) {
	  taskSelect.value = taskId;

	  const { title, description } = TASK_META[taskId];
	  taskTitle.textContent = title;
	  taskDescription.textContent = description;

	  renderLegend(taskId);

	  for (const card of taskCards) {
	    const isSelected = card.dataset.task === taskId;
	    card.classList.toggle("is-active", isSelected);
	  }
	}

	/**
	 * Build a one-line summary of an observation payload.
	 *
	 * Fix: the logical-OR fallbacks were written as escaped pipes, which is
	 * not valid JavaScript; they are restored to the || operator.
	 *
	 * @param {string} taskId - "task1", "task2" or "task3".
	 * @param {object|null|undefined} observation - Observation payload.
	 * @returns {string} Summary text; a generic string when the payload does
	 *   not carry the fields expected for the task.
	 */
	function summarizeObservation(taskId, observation) {
	  if (!observation) return "No observation loaded";

	  if (taskId === "task1" && observation.fto_profile) {
	    const fto = observation.fto_profile;
	    return `${fto.fto_name} · pass rate ${fto.pass_rate} · incidents ${fto.recent_incidents}`;
	  }

	  if (taskId === "task2" && observation.incident_batch) {
	    return `${observation.incident_batch.length} incidents in the current triage batch`;
	  }

	  if (taskId === "task3") {
	    // Either queue may be missing; count a missing queue as empty.
	    const incidents = (observation.incident_queue || []).length;
	    const ftos = (observation.fto_audit_queue || []).length;
	    return `${incidents} incidents and ${ftos} FTO audits competing for inspectors`;
	  }

	  return "Observation loaded";
	}

	/**
	 * Describe an observation payload in plain language.
	 *
	 * Fix: the logical-OR fallbacks were written as escaped pipes, which is
	 * not valid JavaScript; they are restored to the || operator.
	 *
	 * @param {string} taskId - "task1", "task2" or "task3".
	 * @param {object|null|undefined} observation - Observation payload.
	 * @returns {string} Explanation text; a generic sentence when the payload
	 *   does not carry the fields expected for the task.
	 */
	function explainObservation(taskId, observation) {
	  if (!observation) {
	    return "No observation has been loaded yet. Start with Reset Episode to generate a scenario from the backend.";
	  }

	  if (taskId === "task1" && observation.fto_profile) {
	    const fto = observation.fto_profile;
	    return `You are assessing ${fto.fto_name}. The payload exposes the five rubric components, current pass-rate, and recent incidents so you can decide whether the FTO is healthy, borderline, or risky enough for enforcement.`;
	  }

	  if (taskId === "task2" && observation.incident_batch) {
	    return `This observation is a triage queue of ${observation.incident_batch.length} incidents. Your job is to sort them by urgency, decide what must be escalated immediately, and identify what can be deferred.`;
	  }

	  if (taskId === "task3") {
	    // Either queue may be missing; count a missing queue as empty.
	    const incidents = (observation.incident_queue || []).length;
	    const ftos = (observation.fto_audit_queue || []).length;
	    return `You are balancing ${incidents} incident items and ${ftos} FTO audits against limited inspector capacity. The observation tells you what is competing for time before you build assignments.`;
	  }

	  return "The observation is the environment state you are supposed to reason over before sending an action.";
	}

	/**
	 * Describe an action payload in plain language.
	 *
	 * Fix: the logical-OR operators were written as escaped pipes, which is
	 * not valid JavaScript; they are restored to the || operator.
	 *
	 * @param {string} taskId - Task the payload is interpreted against.
	 * @param {object|null|undefined} payload - Parsed action JSON.
	 * @returns {string} Explanation text; a generic sentence when the payload
	 *   has no decision object matching taskId.
	 */
	function explainAction(taskId, payload) {
	  if (!payload || !payload.task_id) {
	    return "The action editor is empty or incomplete. A valid action must include task_id and the task-specific decision object.";
	  }

	  if (taskId === "task1" && payload.fto_grade_action) {
	    const action = payload.fto_grade_action;
	    return `This action grades the FTO as ${action.grade || "unknown"}, recommends ${action.recommended_action || "no action"}, and records the reasoning the evaluator should use to justify that decision.`;
	  }

	  if (taskId === "task2" && payload.incident_priority_action) {
	    const action = payload.incident_priority_action;
	    // Only mention the entry count when the ranking really is an array.
	    return `This action submits a ranked incident list${Array.isArray(action.priority_ranking) ? ` with ${action.priority_ranking.length} entries` : ""}, plus explicit escalation and defer decisions for the batch.`;
	  }

	  if (taskId === "task3" && payload.resource_allocation_action) {
	    const action = payload.resource_allocation_action;
	    const inspectorCount = action.inspector_assignments ? Object.keys(action.inspector_assignments).length : 0;
	    return `This allocation assigns work across ${inspectorCount} inspectors, marks what gets deferred, and estimates the risk reduction delivered by this plan.`;
	  }

	  return "The action JSON is your proposed decision. The backend will score it against the environment rules when you submit it.";
	}

	/**
	 * Describe a backend response in plain language.
	 *
	 * Fix: the logical-OR operators were written as escaped pipes, which is
	 * not valid JavaScript; they are restored to the || operator.
	 *
	 * Checks run in order and the first match wins: reward payload, missing
	 * episode, session/reset status, then error details.
	 *
	 * @param {object|null|undefined} result - Parsed backend response.
	 * @returns {string} Explanation text.
	 */
	function explainResult(result) {
	  if (!result) {
	    return "No backend result has been received yet.";
	  }

	  if (result.reward) {
	    return `The backend accepted your action and returned a reward payload. The score is ${result.reward.score}, which is the overall quality signal for that step. The accuracy, consistency, and safety alignment fields underneath it explain why the number moved. done=${result.done} tells you whether the episode has ended, and info contains extra scoring context from the environment.`;
	  }

	  if (result.status === "no_active_episode") {
	    return "There is no active episode for the selected task yet. Reset the task first so the state endpoint has something to return.";
	  }

	  if (result.task_id || result.event === "reset") {
	    return "This response confirms the current task session status. After a reset, the next step is to inspect the observation and submit an action.";
	  }

	  if (result.error || result.detail) {
	    return "The backend rejected the request. Check the raw result panel for the exact validation or runtime error details.";
	  }

	  return "This panel translates raw backend output into the operational meaning of the response.";
	}

	/**
	 * Refresh the action interpretation panel from the editor contents.
	 * Shows the explanation for the selected task when the editor holds
	 * valid JSON, otherwise the parser's error message.
	 */
	function updateActionMeaningFromEditor() {
	  try {
	    const draft = actionInput.value;
	    const parsed = JSON.parse(draft);
	    const selectedTask = taskSelect.value;
	    actionMeaning.textContent = explainAction(selectedTask, parsed);
	  } catch (parseError) {
	    const reason = parseError.message;
	    actionMeaning.textContent = `The action editor is not valid JSON yet: ${reason}`;
	  }
	}

	/**
	 * Restore the reward summary and its breakdown cards to their
	 * placeholder text.
	 */
	function resetRewardBreakdown() {
	  const placeholders = [
	    [rewardSummary, "None yet"],
	    [accuracySummary, "Not available"],
	    [consistencySummary, "Not available"],
	    [safetySummary, "Not available"],
	    [rewardWhySummary, "Depends on seed and action"]
	  ];
	  for (const [element, text] of placeholders) {
	    element.textContent = text;
	  }
	}

	/**
	 * Show a reward payload in the reward summary and breakdown cards.
	 * A falsy reward resets every card to its placeholder instead.
	 *
	 * @param {object|null|undefined} reward - Reward payload; the fields read
	 *   are score, accuracy_component, consistency_component and
	 *   safety_alignment_component.
	 * @param {*} seed - Seed shown in the "why this changes" card.
	 */
	function updateRewardBreakdown(reward, seed) {
	  if (reward) {
	    const score = reward.score;
	    const accuracy = reward.accuracy_component;
	    const consistency = reward.consistency_component;
	    const safety = reward.safety_alignment_component;

	    rewardSummary.textContent = `${score}`;
	    accuracySummary.textContent = `${accuracy}`;
	    consistencySummary.textContent = `${consistency}`;
	    safetySummary.textContent = `${safety}`;
	    rewardWhySummary.textContent = `Seed ${seed} + current action`;
	  } else {
	    resetRewardBreakdown();
	  }
	}

	/**
	 * Build an example action payload for a task from its observation.
	 *
	 * Fix: the logical-OR fallbacks in the task3 branch were written as
	 * escaped pipes, which is not valid JavaScript; they are restored to
	 * the || operator.
	 *
	 * @param {string} taskId - "task1", "task2" or "task3".
	 * @param {object|null|undefined} observation - Observation payload.
	 * @returns {object} An action object. It holds only task_id when there
	 *   is no observation or the observation lacks the fields the task needs.
	 */
	function defaultAction(taskId, observation) {
	  if (!observation) return { task_id: taskId };

	  if (taskId === "task1" && observation.fto_profile) {
	    const fto = observation.fto_profile;
	    // Sum the five component scores, rounded to two decimals.
	    const total = Number((
	      fto.performance_score +
	      fto.operational_score +
	      fto.safety_score +
	      fto.compliance_score +
	      fto.student_support_score
	    ).toFixed(2));

	    return {
	      task_id: "task1",
	      fto_grade_action: {
	        grade: total >= 75 ? "A" : total >= 50 ? "B" : "C",
	        total_score: total,
	        risk_flags: [],
	        recommended_action: total >= 75 ? "clear" : "self_assessment_required",
	        justification: "Single-file UI example action generated from the visible FTO profile."
	      }
	    };
	  }

	  if (taskId === "task2" && observation.incident_batch) {
	    // Keep the batch order as the ranking: escalate the first two ids,
	    // defer everything after the third.
	    const ids = observation.incident_batch.map((item) => item.incident_id);
	    return {
	      task_id: "task2",
	      incident_priority_action: {
	        priority_ranking: ids,
	        top_3_rationale: "Example ranking generated in the single-file Space UI.",
	        defer_list: ids.slice(3),
	        escalate_immediately: ids.slice(0, 2),
	        pattern_detected: false,
	        pattern_description: null
	      }
	    };
	  }

	  if (taskId === "task3") {
	    // Either queue may be missing; treat a missing queue as empty.
	    const incidentIds = (observation.incident_queue || []).map((item) => item.incident_id);
	    const ftoIds = (observation.fto_audit_queue || []).map((item) => item.fto_id);
	    const allItems = incidentIds.concat(ftoIds);
	    return {
	      task_id: "task3",
	      resource_allocation_action: {
	        // Two items per inspector, incidents first; the rest is deferred.
	        inspector_assignments: {
	          inspector_1: allItems.slice(0, 2),
	          inspector_2: allItems.slice(2, 4)
	        },
	        deferred_items: allItems.slice(4),
	        priority_rationale: "Example allocation generated in the single-file Space UI.",
	        predicted_risk_reduction: 0.55,
	        abstain: false,
	        abstain_reason: null
	      }
	    };
	  }

	  return { task_id: taskId };
	}

	async function fetchJson(url, options = {}) {
	const response = await fetch(url, options);
	const data = await response.json();
	if (!response.ok) {
	throw new Error(pretty(data));
	}
	return data;
	}

	async function refreshStatus() {
	try {
	const [health, metadata] = await Promise.all([
	fetchJson("/health"),
	fetchJson("/metadata")
	]);
	const summary = metadata.corpus_summary \|\| {};
	healthStatus.textContent = health.status;
	healthDetail.textContent = `Environment is reachable with ${summary.total_records \|\| 0} records across ${summary.unique_airports \|\| 0} airports.`;
	metadataStatus.textContent = `${metadata.name} v${metadata.version}`;
	corpusStatus.textContent = `${summary.fto_profiles \|\| 0} FTO profiles, ${summary.incident_reports \|\| 0} incidents, ${summary.resource_scenarios \|\| 0} resource scenarios.`;
	setBadge("Service reachable", "ok");
	pushTimeline("status", `Health check passed for ${metadata.name} ${metadata.version}.`);
	} catch (error) {
	healthStatus.textContent = "Unavailable";
	metadataStatus.textContent = String(error.message \|\| error);
	corpusStatus.textContent = "Corpus manifest could not be loaded.";
	healthDetail.textContent = "Health or metadata endpoint failed.";
	setBadge("Service issue", "error");
	pushTimeline("error", `Status refresh failed: ${String(error.message \|\| error)}`);
	}
	}

	async function resetEpisode() {
	const taskId = taskSelect.value;
	const seed = Number(seedInput.value \|\| 42);
	try {
	const observation = await fetchJson(`/reset?task_id=${taskId}&seed=${seed}`, { method: "POST" });
	observationView.textContent = pretty(observation);
	actionInput.value = pretty(defaultAction(taskId, observation));
	observationSummary.textContent = summarizeObservation(taskId, observation);
	observationMeaning.textContent = explainObservation(taskId, observation);
	updateActionMeaningFromEditor();
	rewardSummary.textContent = "Awaiting first step";
	accuracySummary.textContent = "Awaiting step";
	consistencySummary.textContent = "Awaiting step";
	safetySummary.textContent = "Awaiting step";
	rewardWhySummary.textContent = `Seed ${seed} loaded; reward appears after submit`;
	doneSummary.textContent = "Episode active";
	sessionStatus.textContent = `${taskId} seeded with ${seed}`;
	sessionDetail.textContent = `Example action payload loaded and ready for editing. If you reuse the same seed and the same action, you should expect the same reward.`;
	const resetResult = { event: "reset", task_id: taskId, seed, status: "ready" };
	resultView.textContent = pretty(resetResult);
	resultMeaning.textContent = `${explainResult(resetResult)} Rewards are not hardcoded. This environment is deterministic for the same seed and decision payload.`;
	setBadge("Episode ready", "ok");
	pushTimeline("reset", `Started ${taskId} with deterministic seed ${seed}.`);
	} catch (error) {
	resultView.textContent = `Reset failed:\n${error.message}`;
	resultMeaning.textContent = "The reset call failed, so no observation was loaded. The raw result shows the exact error returned by the backend.";
	setBadge("Reset failed", "error");
	pushTimeline("error", `Reset failed for ${taskId}: ${String(error.message \|\| error)}`);
	}
	}

	async function submitAction() {
	let payload;
	try {
	payload = JSON.parse(actionInput.value);
	} catch (error) {
	resultView.textContent = `Action JSON parse error:\n${error.message}`;
	actionMeaning.textContent = `The action editor cannot be submitted because the JSON is invalid: ${error.message}`;
	return;
	}

	try {
	const result = await fetchJson("/step", {
	method: "POST",
	headers: { "Content-Type": "application/json" },
	body: JSON.stringify(payload)
	});
	observationView.textContent = pretty(result.observation);
	resultView.textContent = pretty(result);
	sessionStatus.textContent = result.done ? "Episode completed" : "Episode active";
	sessionDetail.textContent = result.done ? "The environment reported a completed episode." : "A further step may still be available for this task.";
	observationSummary.textContent = summarizeObservation(payload.task_id, result.observation);
	observationMeaning.textContent = explainObservation(payload.task_id, result.observation);
	actionMeaning.textContent = explainAction(payload.task_id, payload);
	updateRewardBreakdown(result.reward, seedInput.value \|\| 42);
	doneSummary.textContent = result.done ? "Done" : "In progress";
	resultMeaning.textContent = `${explainResult(result)} If the score looks repeated, check whether the seed and the action payload are still the same.`;
	setBadge(result.done ? "Step complete" : "Step accepted", result.done ? "ok" : "warn");
	pushTimeline("step", `Submitted ${payload.task_id}; reward score ${result.reward.score}; done=${result.done}.`);
	} catch (error) {
	resultView.textContent = `Step failed:\n${error.message}`;
	resultMeaning.textContent = "The step request failed before a reward could be produced. Check the raw result for the exact validation or runtime problem.";
	setBadge("Step failed", "error");
	pushTimeline("error", `Step request failed: ${String(error.message \|\| error)}`);
	}
	}

	async function fetchState() {
	const taskId = taskSelect.value;
	try {
	const state = await fetchJson(`/state?task_id=${taskId}`);
	resultView.textContent = pretty(state);
	doneSummary.textContent = state.done ? "Done" : "State fetched";
	sessionDetail.textContent = `Fetched state for ${taskId}.`;
	resultMeaning.textContent = explainResult(state);
	setBadge("State fetched", "warn");
	pushTimeline("state", `Fetched live state for ${taskId}.`);
	} catch (error) {
	resultView.textContent = `State fetch failed:\n${error.message}`;
	resultMeaning.textContent = "The state lookup failed. Usually that means the task has not been reset yet or the backend returned an error.";
	setBadge("State failed", "error");
	pushTimeline("error", `State fetch failed for ${taskId}: ${String(error.message \|\| error)}`);
	}
	}

	document.getElementById("refreshStatus").addEventListener("click", refreshStatus);
	document.getElementById("resetEpisode").addEventListener("click", resetEpisode);
	document.getElementById("randomSeed").addEventListener("click", () => {
	seedInput.value = Math.floor(Math.random() * 100000) + 1;
	rewardWhySummary.textContent = `Seed changed to ${seedInput.value}; reset to generate a different scenario`;
	setBadge("Seed randomized", "warn");
	});
	document.getElementById("submitAction").addEventListener("click", submitAction);
	document.getElementById("fetchState").addEventListener("click", fetchState);
	document.getElementById("loadExample").addEventListener("click", () => {
	let observation = null;
	try {
	observation = JSON.parse(observationView.textContent);
	} catch (error) {
	observation = null;
	}
	actionInput.value = pretty(defaultAction(taskSelect.value, observation));
	updateActionMeaningFromEditor();
	setBadge("Example action loaded", "warn");
	pushTimeline("draft", `Loaded example payload for ${taskSelect.value}.`);
	});

	taskSelect.addEventListener("change", () => {
	setTask(taskSelect.value);
	actionInput.value = pretty(defaultAction(taskSelect.value, null));
	observationSummary.textContent = "Task changed; reset to load live observation";
	observationMeaning.textContent = "Task switched. Reset the episode to load a fresh backend observation for this workflow.";
	updateActionMeaningFromEditor();
	resetRewardBreakdown();
	doneSummary.textContent = "Idle";
	sessionDetail.textContent = `Ready to reset ${taskSelect.value}.`;
	resultMeaning.textContent = "No backend result has been received for the newly selected task yet.";
	});

	taskCards.forEach((card) => {
	card.addEventListener("click", () => {
	setTask(card.dataset.task);
	actionInput.value = pretty(defaultAction(card.dataset.task, null));
	observationSummary.textContent = "Task changed; reset to load live observation";
	observationMeaning.textContent = "Task switched. Reset the episode to load a fresh backend observation for this workflow.";
	updateActionMeaningFromEditor();
	resetRewardBreakdown();
	doneSummary.textContent = "Idle";
	sessionDetail.textContent = `Ready to reset ${card.dataset.task}.`;
	resultMeaning.textContent = "No backend result has been received for the newly selected task yet.";
	});
	});

	actionInput.addEventListener("input", updateActionMeaningFromEditor);

	setTask(taskSelect.value);
	refreshStatus();
	actionInput.value = pretty(defaultAction(taskSelect.value, null));
	observationMeaning.textContent = "Reset a task to see the live scenario translated into plain language.";
	updateActionMeaningFromEditor();
	resetRewardBreakdown();
	resultMeaning.textContent = "Submit a step or fetch state to decode the backend response here.";
	</script>
	</body>
	</html>
	"""

	# ASGI application object; every route handler below is registered on it.
	# NOTE(review): the version declared here is "1.1.0" while the /metadata
	# handler reports "1.2.0" — confirm which is current and align them.
	api_app = FastAPI(
	title="AvigilanceEnv",
	description="India Aviation Safety Monitoring OpenEnv — DGCA Early Warning System",
	version="1.1.0",
	)

	# Environments keyed by task id; a reset for a task replaces its entry.
	_envs: dict[str, AvigilanceEnv] = {}
	# "data" directory located next to this source file.
	_data_dir = Path(__file__).resolve().parent / "data"


	def _to_jsonable(value: Any) -> Any:
	    """Return a JSON-friendly form of *value*.

	    Objects exposing a ``model_dump`` attribute are converted through
	    ``model_dump(mode="json")``; anything else is handed back unchanged.
	    """
	    if not hasattr(value, "model_dump"):
	        return value
	    return value.model_dump(mode="json")


	def _dump_json(value: Any) -> str:
	    """Serialize *value* to JSON text with a two-space indent.

	    The value is first passed through ``_to_jsonable``; non-ASCII
	    characters are escaped in the output (``ensure_ascii=True``).
	    """
	    jsonable = _to_jsonable(value)
	    return json.dumps(jsonable, ensure_ascii=True, indent=2)


	def _load_corpus_manifest() -> dict[str, Any]:
	    """Load ``corpus_manifest.json`` from the data directory.

	    Returns the parsed JSON document when the file exists. When it does
	    not, a placeholder manifest is returned instead: version "unknown",
	    every summary counter at zero, an empty source catalog and
	    ``space_ready`` set to False.
	    """
	    manifest_file = _data_dir / "corpus_manifest.json"

	    if not manifest_file.exists():
	        # Placeholder summary: same counters as a real manifest, all zero.
	        zeroed_counts = dict.fromkeys(
	            (
	                "total_records",
	                "fto_profiles",
	                "incident_reports",
	                "resource_scenarios",
	                "unique_airports",
	                "unique_airlines",
	            ),
	            0,
	        )
	        return {
	            "version": "unknown",
	            "summary": zeroed_counts,
	            "source_catalog": [],
	            "space_ready": False,
	        }

	    with manifest_file.open("r", encoding="utf-8") as stream:
	        manifest = json.load(stream)
	    return manifest


	def _reset_session(task_id: str = "task1", seed: int = 42) -> dict[str, Any]:
	    """Start a fresh episode for *task_id* and return its first observation.

	    A new ``AvigilanceEnv`` is built with the given task id and seed and
	    reset. It replaces any environment previously registered for that task.

	    Args:
	        task_id: Key under which the environment is stored in ``_envs``.
	        seed: Seed forwarded to the environment constructor.

	    Returns:
	        The initial observation, dumped in JSON mode.

	    Raises:
	        Whatever the environment constructor, ``reset()`` or the
	        observation dump raises; in that case ``_envs`` is left untouched.
	    """
	    env = AvigilanceEnv(task_id=task_id, seed=seed)
	    obs = env.reset()
	    payload = obs.model_dump(mode="json")
	    # Register only once the episode is known to be usable, so a failed
	    # reset cannot replace a working episode with an un-reset environment.
	    _envs[task_id] = env
	    return payload


	def _step_session(action: AvigilanceAction) -> dict[str, Any]:
	    """Apply *action* to the environment registered for ``action.task_id``.

	    Returns:
	        A dict with the JSON-mode dumps of the resulting observation and
	        reward, plus the ``done`` flag and the ``info`` value from the
	        environment's ``step`` call.

	    Raises:
	        HTTPException: status 400 when no environment is registered for
	            the action's task id.
	    """
	    active_env = _envs.get(action.task_id)
	    if active_env is not None:
	        observation, reward, finished, extra = active_env.step(action)
	        return {
	            "observation": observation.model_dump(mode="json"),
	            "reward": reward.model_dump(mode="json"),
	            "done": finished,
	            "info": extra,
	        }

	    raise HTTPException(status_code=400, detail=f"No active episode for {action.task_id}. Call /reset first.")


	def _get_state(task_id: str = "task1") -> dict[str, Any]:
	    """Return the state of the environment registered for *task_id*.

	    When no environment is registered for the task, a marker dict with
	    status "no_active_episode" is returned instead of raising.
	    """
	    active_env = _envs.get(task_id)
	    return {"status": "no_active_episode"} if active_env is None else active_env.state()


	@api_app.get("/api/info")
	def api_info() -> dict[str, Any]:
	    """Return a static summary of the service: name, description, tasks, status."""
	    supported_tasks = ["task1", "task2", "task3"]
	    summary: dict[str, Any] = {
	        "name": "AvigilanceEnv",
	        "description": "India Aviation Safety Monitoring — OpenEnv Early Warning System",
	        "tasks": supported_tasks,
	        "status": "ready",
	    }
	    return summary


	@api_app.post("/reset")
	def reset(task_id: str = "task1", seed: int = 42) -> JSONResponse:
	    """POST /reset: start a new episode and respond with its first observation.

	    HTTPException instances pass through unchanged; any other exception is
	    re-raised as an HTTPException with status 500 and the error text as detail.
	    """
	    try:
	        first_observation = _reset_session(task_id=task_id, seed=seed)
	        response = JSONResponse(content=first_observation)
	    except HTTPException:
	        raise
	    except Exception as exc:
	        raise HTTPException(status_code=500, detail=str(exc)) from exc
	    return response


	@api_app.post("/step")
	def step(action: AvigilanceAction) -> JSONResponse:
	    """POST /step: apply *action* and respond with the step result.

	    HTTPException instances (such as the 400 raised when no episode is
	    active) pass through unchanged; any other exception is re-raised as an
	    HTTPException with status 500 and the error text as detail.
	    """
	    try:
	        step_result = _step_session(action)
	        response = JSONResponse(content=step_result)
	    except HTTPException:
	        raise
	    except Exception as exc:
	        raise HTTPException(status_code=500, detail=str(exc)) from exc
	    return response


	@api_app.get("/state")
	def state(task_id: str = "task1") -> JSONResponse:
	    """GET /state: respond with whatever ``_get_state`` returns for *task_id*."""
	    snapshot = _get_state(task_id=task_id)
	    return JSONResponse(content=snapshot)


	@api_app.get("/health")
	def health() -> dict[str, Any]:
	    """GET /health: return a fixed payload reporting the service as healthy."""
	    report: dict[str, Any] = {"status": "healthy", "env": "AvigilanceEnv"}
	    return report


	@api_app.get("/metadata")
	def metadata() -> dict[str, Any]:
	    """GET /metadata: describe the service and summarize the corpus manifest.

	    The summary, corpus version and ``space_ready`` flag are read from the
	    manifest, defaulting to ``{}``, "unknown" and False when a key is absent.
	    """
	    manifest = _load_corpus_manifest()
	    corpus_summary = manifest.get("summary", {})
	    corpus_version = manifest.get("version", "unknown")
	    space_ready = manifest.get("space_ready", False)

	    # NOTE(review): "1.2.0" differs from the version passed to FastAPI(...)
	    # ("1.1.0") — confirm which is current.
	    return {
	        "name": "AvigilanceEnv",
	        "description": "India Aviation Safety Monitoring OpenEnv — DGCA Early Warning System",
	        "version": "1.2.0",
	        "tasks": ["task1", "task2", "task3"],
	        "walkthrough": "/#walkthrough",
	        "corpus_summary": corpus_summary,
	        "corpus_version": corpus_version,
	        "space_ready": space_ready,
	        "ingestion_plan_path": "walkthrough/real-data-ingestion-plan.md",
	    }


	@api_app.get("/walkthrough")
	def walkthrough() -> RedirectResponse:
	    """GET /walkthrough: redirect (307) to the walkthrough anchor on the front page."""
	    target = "/#walkthrough"
	    return RedirectResponse(target, status_code=307)


	@api_app.get("/", response_class=HTMLResponse)
	def frontend() -> HTMLResponse:
	    """GET /: serve the embedded single-page console stored in ``FRONTEND_HTML``."""
	    page = HTMLResponse(content=FRONTEND_HTML)
	    return page


	@api_app.get("/schema")
	def schema() -> dict[str, Any]:
	    """GET /schema: return JSON schemas for the environment's models.

	    The result has the keys "observation", "action" and "state", each
	    holding the output of the corresponding model's ``model_json_schema()``.
	    """
	    from environment.models import (
	        AvigilanceAction as ActionModel,
	        AvigilanceObservation,
	        AvigilanceReward,
	    )

	    # NOTE(review): the "state" entry is built from the reward model —
	    # confirm that this mapping is intentional.
	    schema_sources = {
	        "observation": AvigilanceObservation,
	        "action": ActionModel,
	        "state": AvigilanceReward,
	    }
	    return {key: model.model_json_schema() for key, model in schema_sources.items()}


	@api_app.post("/mcp")
	def mcp(payload: dict | None = None) -> dict[str, Any]:
	    """POST /mcp: answer with a fixed JSON-RPC 2.0 style descriptor.

	    Args:
	        payload: Optional request body. Only its "id" entry is read; a
	            missing body is treated as an empty mapping.

	    Returns:
	        A dict with "jsonrpc" set to "2.0", the request's "id" (None when
	        absent) and a static "result" naming the environment and its
	        three tools. The content of the request is otherwise ignored.
	    """
	    body = payload or {}
	    return {
	        "jsonrpc": "2.0",
	        # Echo the caller's id so the reply can be matched to the request.
	        "id": body.get("id"),
	        "result": {
	            "name": "AvigilanceEnv",
	            "tools": ["reset", "step", "state"],
	        },
	    }


	# Alias for the FastAPI instance; main() hands this name to uvicorn.
	# Presumably also the name external ASGI launchers import — confirm.
	app = api_app


	def main() -> None:
	    """Serve ``app`` with uvicorn, bound to 0.0.0.0 on port 7860."""
	    bind_host, bind_port = "0.0.0.0", 7860
	    uvicorn.run(app, host=bind_host, port=bind_port)


	if __name__ == "__main__":
	    main()