Spaces:

build-small-hackathon
/

TinyNarrator

Running

cvpfus

Document Docker Space metadata and fallbacks

4565f15 12 days ago

75.1 kB

	from __future__ import annotations

	import json
	import py_compile
	import sys
	import urllib.error
	import wave
	from pathlib import Path
	from unittest.mock import patch, MagicMock


	ROOT = Path(__file__).resolve().parents[1]
	sys.path.insert(0, str(ROOT))

	import app
	from fastapi.testclient import TestClient


	def assert_true(condition: bool, message: str) -> None:
	if not condition:
	raise AssertionError(message)


	def verify_static_assets() -> None:
	required = [
	ROOT / "LICENSE",
	ROOT / "DEPLOY_SPACES.md",
	ROOT / "Dockerfile",
	ROOT / "start.sh",
	ROOT / "SUBMISSION.md",
	ROOT / "static" / "index.html",
	ROOT / "static" / "generate.html",
	ROOT / "static" / "app.css",
	ROOT / "static" / "app.js",
	ROOT / "static" / "generate.js",
	ROOT / "static" / "generated" / "desk-reader.svg",
	ROOT / "static" / "generated" / "desk-reader.png",
	ROOT / "static" / "generated" / "model-map.svg",
	ROOT / "static" / "generated" / "model-map.png",
	ROOT / "static" / "generated" / "field-notes.svg",
	]
	for path in required:
	assert_true(path.exists(), f"Missing required asset: {path}")
	try:
	from PIL import Image

	for path in [ROOT / "static" / "generated" / "desk-reader.png", ROOT / "static" / "generated" / "model-map.png"]:
	with Image.open(path) as image:
	assert_true(image.size == (1200, 675), f"Vision PNG should match article image ratio: {path}")
	assert_true(image.format == "PNG", f"Vision companion asset should be PNG: {path}")
	except ImportError:
	pass

	app_js = (ROOT / "static" / "app.js").read_text(encoding="utf-8")
	app_source = (ROOT / "app.py").read_text(encoding="utf-8")
	generate_js = (ROOT / "static" / "generate.js").read_text(encoding="utf-8")
	index_html = (ROOT / "static" / "index.html").read_text(encoding="utf-8")
	generate_html = (ROOT / "static" / "generate.html").read_text(encoding="utf-8")
	deploy_spaces = (ROOT / "DEPLOY_SPACES.md").read_text(encoding="utf-8")
	dockerfile = (ROOT / "Dockerfile").read_text(encoding="utf-8")
	start_script = (ROOT / "start.sh").read_text(encoding="utf-8")
	assert_true("FROM python:3.12-slim" in dockerfile, "Spaces Dockerfile should use a free CPU Python base image")
	assert_true("nvidia/cuda" not in dockerfile, "Spaces Dockerfile should not require paid HF GPU CUDA image")
	assert_true("llama-server" not in start_script, "Spaces start script should not launch local llama.cpp")
	assert_true("free CPU" in deploy_spaces, "Spaces deploy guide should describe free CPU deployment")
	assert_true("modal_workers/reader_brain.py" in deploy_spaces, "Spaces deploy guide should document Modal reader-brain deployment")
	assert_true("CPU Basic" in deploy_spaces, "Spaces deploy guide should recommend CPU Basic hardware")
	assert_true("LLAMA_CPP_TOKEN" in deploy_spaces, "Spaces deploy guide should document reader-brain auth token")
	assert_true("tiny-narrator-reader-brain-token" in deploy_spaces, "Spaces deploy guide should document the Modal reader token secret")
	assert_true('href="/" aria-current="page">Reader' in index_html, "Reader page should mark Reader route current")
	assert_true('href="/generate">Generate' in index_html, "Reader page should link to Generate route")
	assert_true('href="/">Reader' in generate_html, "Generate page should link back to Reader route")
	assert_true('href="/generate" aria-current="page">Generate' in generate_html, "Generate page should mark Generate route current")
	assert_true("articleGeneratorForm" in generate_html, "Generate page should expose the article generator form")
	assert_true("generatedThumbnail" in generate_html, "Generate page should expose a generated thumbnail preview")
	assert_true("readerToggle" in generate_html, "Generate page should expose a screen reader toggle")
	assert_true("transcriptLog" in generate_html, "Generate page should expose a narration transcript")
	assert_true("speechAudio" in generate_html, "Generate page should expose speech playback")
	assert_true("/api/generate-article" in generate_js, "Generate frontend should call article generation API")
	assert_true("/api/reader-brain" in generate_js, "Generate frontend should call reader-brain narration API")
	assert_true("/api/speak" in generate_js, "Generate frontend should call speech API")
	assert_true('node.type === "image"' in generate_js, "Generate reader should reserve reader-brain item narration for images")
	assert_true('runtime: "raw text"' in generate_js, "Generate reader should speak text-only nodes without reader-brain")
	assert_true("Image description." in generate_js, "Generate reader should force image narration to announce image descriptions")
	assert_true("refreshReaderNodes" in generate_js, "Generate frontend should build a generated article reader path")
	assert_true('data-reader-type="heading"' in generate_js, "Generated article sections should mark heading reader nodes")
	assert_true('data-reader-type="paragraph"' in generate_js, "Generated article sections should mark paragraph reader nodes")
	assert_true("thumbnail.generation_model" in generate_js, "Generate frontend should render Klein thumbnail receipt")
	assert_true('data-reader-type="heading"' in index_html, "Article should mark heading reader nodes")
	assert_true('data-reader-type="image"' in index_html, "Article should mark image reader nodes")
	assert_true("vision_asset_url" in app_source, "Article images should expose PNG assets for vision APIs")
	assert_true("/static/generated/desk-reader.png" in app_source, "Desk reader should have a PNG vision asset")
	assert_true("/static/generated/model-map.png" in app_source, "Model map should have a PNG vision asset")
	assert_true('href="#notes"' not in index_html, "Article navigation should not include the Field Notes section")
	assert_true('id="notes"' not in index_html, "Article UI should not render the Field Notes section")
	assert_true("Field Notes" not in index_html, "Article UI should not render Field Notes copy")
	assert_true("Field Notes" not in generate_html, "Generate UI should not render Field Notes copy")
	assert_true('alt=""' not in index_html, "Article images should not start with empty alt text")
	assert_true(
	"reader brain, vision, speech, and image generation models" in index_html,
	"Article should include meaningful fallback alt text for generated images",
	)
	assert_true('aria-live="polite"' in index_html, "Article should expose an aria-live narration region")
	for shortcut in ['aria-keyshortcuts="Space"', 'aria-keyshortcuts="N"', 'aria-keyshortcuts="R"', 'aria-keyshortcuts="S"']:
	assert_true(shortcut in index_html, f"Reader controls should expose {shortcut}")
	assert_true("transcriptLog" in index_html, "Article should expose a visible transcript log")
	assert_true("readerQueueList" not in index_html, "Article sidebar should not include a visible reader queue")
	assert_true("repeatButton" in index_html, "Reader controls should expose a visible repeat command")
	assert_true("stopButton" in index_html, "Reader controls should expose a visible stop command")
	assert_true("modelStackList" in index_html, "Article sidebar should expose the model stack panel")
	assert_true("modelBudgetStatus" in index_html, "Article sidebar should expose model stack status")
	for removed_id in [
	"demoScriptList",
	"demoApiCheckList",
	"imageReceiptList",
	"runtimeStatusList",
	"submissionReadinessList",
	"copyEvidenceButton",
	"modelBudgetList",
	"runtimeSetupList",
	]:
	assert_true(removed_id not in index_html, f"Article sidebar should not include removed evidence panel: {removed_id}")
	assert_true("loadDemoScript" not in app_js, "Article frontend should not render the structured demo script")
	assert_true("loadModelBudget" in app_js, "Article frontend should render the model stack panel")
	assert_true("/api/model-budget" in app_js, "Article frontend should fetch model budget data")
	assert_true("/api/runtime-status" in app_js, "Article frontend should fetch runtime status")
	assert_true("status-pill" in app_js or "statusClass" in app_js, "Article frontend should render per-role status labels")
	assert_true("modelStackList.innerHTML" in app_js, "Article frontend should render model stack items")
	assert_true("Tiny Titan pass" in app_js, "Article frontend should render per-model Tiny Titan pass labels")
	assert_true("/evidence" not in index_html, "Article page should not link to a removed evidence page")
	assert_true("copyTextToClipboard" in app_js, "Frontend copy actions should share clipboard fallback handling")
	assert_true(
	"Transcript is visible, but clipboard access is unavailable." in app_js,
	"Transcript copy should report unavailable clipboard access",
	)
	assert_true("transcript-position" in app_js, "Transcript should render the narrated reader position")
	assert_true("readerItemStatus(node)" in app_js, "Narration transcript entries should include reader item position")
	assert_true('node.type === "image"' in app_js, "Article reader should reserve reader-brain item narration for images")
	assert_true('runtime: "raw text"' in app_js, "Article reader should speak text-only nodes without reader-brain")
	assert_true("Image description." in app_js, "Article reader should force image narration to announce image descriptions")
	assert_true(
	"[${entry.type} / ${entry.position} / ${entry.runtime}]" in app_js,
	"Copied transcript should include type, position, and runtime",
	)
	assert_true("function haltPlayback" in app_js, "Reader controls should expose a shared playback halt helper")
	assert_true(
	"haltPlayback({ clearAutoAdvance: false });" in app_js,
	"New narration commands should interrupt current speech immediately",
	)
	assert_true("aria-current" in app_js, "Reader mode should expose the active item as current")
	assert_true("shouldHandleReaderShortcut" in app_js, "Reader shortcuts should not hijack form controls")
	assert_true("controls.repeat.click()" in app_js, "R should route through the visible repeat command")
	assert_true("controls.stop.click()" in app_js, "Escape should route through the visible stop command")
	assert_true("reader-node-" in app_js, "Reader nodes should receive stable ids for control context")
	assert_true("renderReaderQueue" not in app_js, "Frontend should not render a visible reader queue")
	assert_true("readerQueueList" not in app_js, "Frontend should not bind a visible reader queue")
	assert_true("narrate(node.index)" in app_js, "Reader mode should support click-to-read article items")

	assert_true("describeGeneratedThumbnail" in generate_js, "Generate frontend should describe generated thumbnails")
	assert_true("/api/describe-image" in generate_js, "Generate frontend should call describe-image for thumbnails")
	assert_true("image_url" in generate_js, "Generate frontend should send image_url to describe-image")
	assert_true("generatedThumbnail.alt" in generate_js, "Generate frontend should update thumbnail alt from descriptor")
	assert_true("fallbackAlt" in generate_js, "Generate frontend should preserve fallback alt on descriptor failure")

	submission = (ROOT / "SUBMISSION.md").read_text(encoding="utf-8")
	for target in ["Tiny Titan", "Llama Champion", "Off-Brand", "Field Notes"]:
	assert_true(target in submission, f"Submission packet should mention {target}")
	for endpoint in [
	"/api/model-budget",
	"/api/runtime-setup",
	"/api/accessibility-audit",
	"/api/demo-script",
	"/api/submission-readiness",
	"/api/evidence-bundle",
	"/api/generate-article",
	]:
	assert_true(endpoint in submission, f"Submission packet should mention {endpoint}")
	assert_true(
	"nvidia/NVIDIA-Nemotron-3-Nano-4B-GGUF" in submission,
	"Submission packet should include the reader-brain model",
	)
	for evidence in ["reader cursor", "shortcut safety", "aria-current"]:
	assert_true(evidence in submission, f"Submission packet should mention {evidence}")
	for evidence in ["prompt", "seed", "FLUX.2-klein-4B", "fallback asset"]:
	assert_true(evidence in submission, f"Submission packet should mention image receipt evidence: {evidence}")


	def front_matter_value(readme: str, key: str) -> str:
	lines = readme.splitlines()
	if not lines or lines[0] != "---":
	return ""
	for line in lines[1:]:
	if line == "---":
	break
	name, separator, value = line.partition(":")
	if separator and name.strip() == key:
	return value.strip()
	return ""


	def verify_space_metadata() -> None:
	readme = (ROOT / "README.md").read_text(encoding="utf-8")
	requirements = (ROOT / "requirements.txt").read_text(encoding="utf-8").splitlines()
	license_text = (ROOT / "LICENSE").read_text(encoding="utf-8")

	sdk = front_matter_value(readme, "sdk")
	app_port = front_matter_value(readme, "app_port")
	emoji = front_matter_value(readme, "emoji")
	title = front_matter_value(readme, "title")
	license_id = front_matter_value(readme, "license")

	assert_true(title == "Tiny Narrator", "Space metadata should name the app")
	assert_true(sdk == "docker", "Space metadata should declare the Docker SDK")
	assert_true(app_port == "7860", "Docker Space metadata should expose app_port 7860")
	assert_true(emoji and "ð" not in emoji, "Space metadata emoji should be valid UTF-8")
	assert_true(license_id == "apache-2.0", "Space metadata should declare the Apache-2.0 license")
	assert_true("Apache License" in license_text, "Repository should include the Apache license text")
	assert_true("Version 2.0" in license_text, "Repository license should match Space metadata")
	assert_true(any(line.startswith("gradio==") for line in requirements), "requirements.txt should pin Gradio")
	for package in ["pydantic", "kokoro", "soundfile", "python-dotenv"]:
	assert_true(
	any(
	line.startswith(f"{package}>=") or line.startswith(f"{package}==") or line.strip() == package
	for line in requirements
	),
	f"requirements.txt should include {package}",
	)


	def verify_dotenv_wiring() -> None:
	"""Verify that python-dotenv is wired in before core env constants are read."""
	requirements = (ROOT / "requirements.txt").read_text(encoding="utf-8").splitlines()
	assert_true(
	any(line.strip() == "python-dotenv" or line.startswith("python-dotenv>=") for line in requirements),
	"requirements.txt should include python-dotenv",
	)

	app_source = (ROOT / "app.py").read_text(encoding="utf-8")
	assert_true("from dotenv import load_dotenv" in app_source, "app.py should import load_dotenv")
	assert_true("load_dotenv()" in app_source, "app.py should call load_dotenv()")

	import_pos = app_source.index("from dotenv import load_dotenv")
	call_pos = app_source.index("load_dotenv()")
	llama_const = app_source.index("LLAMA_CPP_BASE_URL = os.getenv")
	assert_true(
	import_pos < call_pos < llama_const,
	"load_dotenv() should be called before LLAMA_CPP_BASE_URL is assigned",
	)

	env_example = ROOT / ".env.example"
	assert_true(env_example.exists(), ".env.example should exist")
	env_content = env_example.read_text(encoding="utf-8")
	for secret_pattern in ["sk-", "AKIA", "ghp_", "xoxb-"]:
	assert_true(
	secret_pattern not in env_content,
	f".env.example should not contain real-looking secrets ({secret_pattern})",
	)


	def verify_live_smoke_script() -> None:
	"""Verify that the live smoke test script exists, is syntactically valid, and documents redaction."""
	smoke_path = ROOT / "scripts" / "live_smoke.py"
	assert_true(smoke_path.exists(), "scripts/live_smoke.py should exist")
	py_compile.compile(str(smoke_path), doraise=True)
	smoke_source = smoke_path.read_text(encoding="utf-8")
	assert_true("--base-url" in smoke_source, "Smoke script should support --base-url argument")
	assert_true("/api/runtime-status" in smoke_source, "Smoke script should check runtime status")
	assert_true("/api/describe-image" in smoke_source, "Smoke script should check describe-image")
	assert_true("/api/generate-image" in smoke_source, "Smoke script should check generate-image")
	assert_true("_role_is_configured" in smoke_source, "Smoke script should fail configured live paths instead of skipping them")
	assert_true('details.get("configured") is True' in smoke_source, "Smoke script should preserve configured metadata from runtime status")
	assert_true("SKIP" in smoke_source or "skip" in smoke_source, "Smoke script should document skipping behavior")
	assert_true("Secrets" in smoke_source or "secrets" in smoke_source or "never printed" in smoke_source.lower(), "Smoke script should document secret redaction")


	def verify_core_fallbacks() -> None:
	no_live_reader = [
	patch.object(app, "LLAMA_CPP_BASE_URL", ""),
	patch.object(app, "MINICPM_VISION_BASE_URL", ""),
	patch.object(app, "MINICPM_VISION_API_KEY", ""),
	]
	for patcher in no_live_reader:
	patcher.start()
	try:
	narration = app.reader_brain_core(
	node_type="heading",
	text="Why tiny models matter",
	position="item 1 of 1",
	mode="narrate",
	)
	finally:
	for patcher in reversed(no_live_reader):
	patcher.stop()
	assert_true(narration["ok"], "Reader-brain fallback did not return ok")
	assert_true("Heading." in narration["narration"], "Reader-brain fallback lost heading prefix")
	assert_true(isinstance(narration["elapsed_ms"], int), "Reader-brain response should include elapsed_ms")

	with patch.object(app, "LLAMA_CPP_BASE_URL", ""), patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
	image_fallback = app.reader_brain_core(
	node_type="image",
	text="A highlighted paragraph sits beside playback controls.",
	position="item 1 of 1",
	mode="narrate",
	)
	assert_true(
	image_fallback["narration"].startswith("Image description."),
	"Image fallback narration should clearly announce image descriptions",
	)

	with patch.object(app, "LLAMA_CPP_BASE_URL", ""), patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
	summary = app.reader_brain_core(
	node_type="section",
	text="Tiny models can run close to the reader. They keep latency low and preserve privacy.",
	position="Why",
	mode="summarize",
	)
	assert_true(summary["ok"], "Reader-brain summary fallback did not return ok")
	assert_true(summary["narration"].startswith("Summary."), "Summary fallback should announce summary mode")

	with patch.object(app, "LLAMA_CPP_BASE_URL", ""), patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
	unconfigured_reader = app.reader_brain_core(
	node_type="paragraph",
	text="This paragraph should be narrated without a configured endpoint.",
	position="item 1 of 1",
	mode="narrate",
	)
	assert_true(unconfigured_reader["runtime"] == "fallback", "Unconfigured reader brain should use fallback")
	assert_true(
	"not configured" in unconfigured_reader["warning"],
	"Unconfigured reader brain should explain the missing endpoint",
	)

	unconfigured_article = app.generate_article_core("accessible classroom tools")
	assert_true(unconfigured_article["runtime"] == "fallback", "Unconfigured article generation should use fallback")
	assert_true(
	"not configured" in unconfigured_article["warning"],
	"Unconfigured article generation should explain the missing endpoint",
	)

	empty_llama_response = MagicMock()
	empty_llama_response.read.return_value = json.dumps({"choices": [{"message": {"content": ""}}]}).encode("utf-8")
	empty_llama_response.__enter__ = lambda s: s
	empty_llama_response.__exit__ = MagicMock(return_value=False)
	with patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
	with patch("urllib.request.urlopen", return_value=empty_llama_response):
	empty_narration = app.reader_brain_core(
	node_type="paragraph",
	text="This paragraph still needs narration.",
	position="item 2 of 3",
	mode="narrate",
	)
	assert_true(empty_narration["runtime"] == "fallback", "Empty llama.cpp response should use fallback narration")
	assert_true(empty_narration["narration"], "Empty llama.cpp response should not return empty narration")

	minicpm_reader_response = MagicMock()
	minicpm_reader_response.read.return_value = json.dumps(
	{"choices": [{"message": {"content": "Fallback narration from MiniCPM."}}]}
	).encode("utf-8")
	minicpm_reader_response.__enter__ = lambda s: s
	minicpm_reader_response.__exit__ = MagicMock(return_value=False)
	with patch.object(app, "LLAMA_CPP_BASE_URL", "https://llama.example/v1"):
	with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
	with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
	with patch("urllib.request.urlopen", side_effect=[urllib.error.URLError("llama down"), minicpm_reader_response]) as urlopen_mock:
	minicpm_narration = app.reader_brain_core(
	node_type="paragraph",
	text="This paragraph should use MiniCPM after llama.cpp fails.",
	position="item 2 of 3",
	mode="narrate",
	)
	minicpm_request = urlopen_mock.call_args_list[1].args[0]
	minicpm_body = json.loads(minicpm_request.data.decode("utf-8"))
	assert_true(minicpm_narration["runtime"] == "minicpm-v4.6-fallback", "MiniCPM should run before rule fallback")
	assert_true(minicpm_narration["model"] == app.MINICPM_VISION_MODEL, "MiniCPM reader fallback should report MiniCPM model")
	assert_true(minicpm_body["model"] == app.MINICPM_VISION_MODEL, "MiniCPM fallback should send MiniCPM model id")
	assert_true("llama.cpp unavailable" in minicpm_narration["warning"], "MiniCPM fallback should preserve primary failure warning")

	reasoning_response = MagicMock()
	reasoning_response.read.return_value = json.dumps(
	{"choices": [{"message": {"content": "", "reasoning_content": "Heading. Live narration from llama.cpp."}}]}
	).encode("utf-8")
	reasoning_response.__enter__ = lambda s: s
	reasoning_response.__exit__ = MagicMock(return_value=False)
	with patch("urllib.request.urlopen", return_value=reasoning_response):
	reasoning_narration = app.reader_brain_core(
	node_type="heading",
	text="Live heading",
	position="item 1 of 1",
	mode="narrate",
	)
	assert_true(reasoning_narration["runtime"] == "llama.cpp", "Reader brain should use alternate llama.cpp message text fields")
	assert_true("Live narration" in reasoning_narration["narration"], "Reader brain should extract reasoning_content when content is empty")

	image_llama_response = MagicMock()
	image_llama_response.read.return_value = json.dumps(
	{"choices": [{"message": {"content": "A digital reader shows a highlighted paragraph and playback controls."}}]}
	).encode("utf-8")
	image_llama_response.__enter__ = lambda s: s
	image_llama_response.__exit__ = MagicMock(return_value=False)
	with patch("urllib.request.urlopen", return_value=image_llama_response):
	image_narration = app.reader_brain_core(
	node_type="image",
	text="A digital reader shows a highlighted paragraph and playback controls.",
	position="item 2 of 3",
	mode="narrate",
	)
	assert_true(image_narration["runtime"] == "llama.cpp", "Image narration should use live reader-brain when available")
	assert_true(
	image_narration["narration"].startswith("Image description."),
	"Live reader-brain image narration should keep an image description prefix",
	)

	description = app.describe_image_core("model-map", caption=None, prompt=None)
	assert_true(description["ok"], "Image description did not return ok")
	assert_true("small AI models" in description["alt_text"], "Image description fallback changed unexpectedly")
	assert_true(description["runtime"] == "fallback", "Image description without MiniCPM config should use fallback runtime")
	assert_true(description["model"] == app.MODEL_MANIFEST["vision"]["id"], "Image description should report the vision model id")
	assert_true(isinstance(description["elapsed_ms"], int), "Image description should include elapsed_ms")

	article_descriptions = app.describe_article_images_core()
	assert_true(article_descriptions["ok"], "Article image descriptions did not return ok")
	assert_true(len(article_descriptions["descriptions"]) == 2, "Article should expose two image descriptions")
	assert_true(
	all(item["generation_model"] == app.MODEL_MANIFEST["image_generation"]["id"] for item in article_descriptions["descriptions"]),
	"Article image descriptions should include the planned image-generation model",
	)
	assert_true(
	all(isinstance(item["seed"], int) for item in article_descriptions["descriptions"]),
	"Article image descriptions should include generation seeds",
	)
	assert_true(isinstance(article_descriptions["elapsed_ms"], int), "Article image descriptions should include elapsed_ms")
	assert_true(article_descriptions["model"] == app.MODEL_MANIFEST["vision"]["id"], "Article image descriptions should report vision model id")
	assert_true(article_descriptions["runtime"] == "fallback", "Article image descriptions should use fallback without MiniCPM config")

	speech = app.speak_core("Tiny Narrator verification.", voice="af_heart", speed=1.0)
	assert_true(speech["ok"], "Speech path did not return ok")
	assert_true(isinstance(speech["elapsed_ms"], int), "Speech response should include elapsed_ms")
	audio_path = ROOT / speech["audio_url"].lstrip("/")
	assert_true(audio_path.exists(), f"Speech output missing: {audio_path}")
	with wave.open(str(audio_path), "rb") as wav:
	assert_true(wav.getframerate() == 24000, "Speech output should be 24 kHz")
	assert_true(wav.getnchannels() == 1, "Speech output should be mono")

	empty_speech = app.speak_core("", voice="af_heart", speed=1.0)
	assert_true(empty_speech["runtime"] == "fallback", "Empty speech input should use fast fallback")
	assert_true("empty" in empty_speech["warning"].lower(), "Empty speech input should explain why Kokoro was skipped")

	generated = app.generate_image_core("Tiny accessibility article image.", seed=3)
	assert_true(generated["ok"], "Image generation placeholder should return ok")
	assert_true(isinstance(generated["elapsed_ms"], int), "Image generation should include elapsed_ms")
	assert_true(generated["runtime"] == "fallback", "Image generation without Modal should report fallback runtime")
	assert_true(generated["model"] == app.MODEL_MANIFEST["image_generation"]["id"], "Image generation should report Klein model id")
	assert_true(generated["seed"] == 3, "Image generation should preserve the seed")
	assert_true(generated["image_url"].startswith("/static/generated/"), "Fallback image should use bundled assets")
	assert_true(generated.get("warning") is None, "Fallback without attempted call should have no warning")

	generated_no_seed = app.generate_image_core("Another image prompt.", seed=None)
	assert_true(generated_no_seed["ok"], "Image generation without seed should return ok")
	assert_true(generated_no_seed["runtime"] == "fallback", "Image generation without Modal should report fallback")
	assert_true(generated_no_seed["seed"] is None, "Image generation should pass through None seed")

	article = app.generate_article_core("tiny classroom robotics")
	assert_true(article["ok"], "Article generation should return ok")
	assert_true(article["model"] == app.MODEL_MANIFEST["reader_brain"]["id"], "Article generation should use reader-brain model")
	assert_true(len(article["article"]["sections"]) == 5, "Article generation should return five sections")
	assert_true(
	article["thumbnail"]["generation_model"] == app.MODEL_MANIFEST["image_generation"]["id"],
	"Article generation should use the Klein image model for thumbnail receipt",
	)
	assert_true("No words" in article["thumbnail"]["prompt"], "Article thumbnail prompt should forbid unreadable generated text")
	assert_true("no user interface" in article["thumbnail"]["prompt"], "Article thumbnail prompt should avoid UI screenshots")
	assert_true("one centered cohesive scene" in article["thumbnail"]["prompt"], "Article thumbnail prompt should avoid sparse disconnected layouts")


	def verify_modal_klein_integration() -> None:
	"""Test Modal Klein integration with mocked HTTP responses."""
	# Test: no endpoint configured returns deterministic fallback
	with patch.object(app, "KLEIN_MODAL_ENDPOINT", ""):
	result = app.generate_image_core("test prompt", seed=42)
	assert_true(result["ok"], "No-endpoint fallback should return ok")
	assert_true(result["runtime"] == "fallback", "No-endpoint should report fallback runtime")
	assert_true(result["image_url"].startswith("/static/generated/"), "No-endpoint should use bundled assets")
	assert_true(result["model"] == app.MODEL_MANIFEST["image_generation"]["id"], "Fallback should report Klein model")

	# Test: configured endpoint returning valid JSON is surfaced as live Modal inference
	mock_response_data = {
	"ok": True,
	"runtime": "modal-klein",
	"model": "black-forest-labs/FLUX.2-klein-4B",
	"image_url": "/media/klein-abc123.png",
	"prompt": "test prompt",
	"seed": 42,
	"elapsed_ms": 5000,
	}
	mock_response = MagicMock()
	mock_response.read.return_value = json.dumps(mock_response_data).encode("utf-8")
	mock_response.__enter__ = lambda s: s
	mock_response.__exit__ = MagicMock(return_value=False)

	with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"):
	with patch("urllib.request.urlopen", return_value=mock_response):
	result = app.generate_image_core("test prompt", seed=42)
	assert_true(result["ok"], "Modal success should return ok")
	assert_true(result["runtime"] == "modal-klein", "Modal success should report modal-klein runtime")
	assert_true(
	result["image_url"] == "https://example-modal.modal.run/media/klein-abc123.png",
	"Modal success should return full media URL",
	)
	assert_true(result["prompt"] == "test prompt", "Modal success should preserve prompt")
	assert_true(result["seed"] == 42, "Modal success should preserve seed")

	# Test: configured endpoint failure falls back with a visible warning
	with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"):
	with patch("urllib.request.urlopen", side_effect=TimeoutError("Connection timed out")):
	result = app.generate_image_core("test prompt", seed=42)
	assert_true(result["ok"], "Modal failure fallback should return ok")
	assert_true(result["runtime"] == "fallback", "Modal failure should report fallback runtime")
	assert_true(
	result["image_url"].startswith("/static/generated/"),
	"Modal failure should use bundled assets",
	)
	assert_true(
	result.get("warning") is not None and "TimeoutError" in result["warning"],
	"Modal failure should include a visible warning with the error class",
	)

	# Test: invalid Modal JSON response falls back instead of pretending success
	invalid_response = MagicMock()
	invalid_response.read.return_value = json.dumps({"ok": False, "error": "prompt is required"}).encode("utf-8")
	invalid_response.__enter__ = lambda s: s
	invalid_response.__exit__ = MagicMock(return_value=False)

	with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"):
	with patch("urllib.request.urlopen", return_value=invalid_response):
	result = app.generate_image_core("test prompt", seed=42)
	assert_true(result["runtime"] == "fallback", "Invalid Modal response should use fallback runtime")
	assert_true(
	result.get("warning") is not None and "ValueError" in result["warning"],
	"Invalid Modal response should include a validation warning",
	)

	# Test: Modal worker static checks
	worker_path = ROOT / "modal_workers" / "klein_image.py"
	assert_true(worker_path.exists(), "Modal worker file should exist")
	worker_source = worker_path.read_text(encoding="utf-8")
	assert_true("modal.App" in worker_source, "Modal worker should create a Modal App")
	assert_true("modal.Volume" in worker_source, "Modal worker should use a Modal Volume")
	assert_true("FLUX.2-klein-4B" in worker_source, "Modal worker should reference the Klein model")
	assert_true("Flux2KleinPipeline" in worker_source, "Modal worker should use the FLUX.2 Klein Diffusers pipeline")
	assert_true("modal.asgi_app" in worker_source, "Modal worker should expose one ASGI app")
	assert_true('@api.post("/generate")' in worker_source, "Modal worker should expose POST /generate")
	assert_true('@api.get("/health")' in worker_source, "Modal worker should expose GET /health")
	assert_true('@api.get("/media/{filename}")' in worker_source, "Modal worker should expose GET /media/{filename}")
	assert_true("404" in worker_source or "not found" in worker_source.lower(), "Modal worker should handle missing media with 404")
	assert_true("reload.aio()" in worker_source, "Modal worker should reload volume with async API before serving missing media")
	assert_true("path.read_bytes()" in worker_source, "Modal worker should avoid streaming open files from the volume")

	reader_worker_path = ROOT / "modal_workers" / "reader_brain.py"
	assert_true(reader_worker_path.exists(), "Modal reader-brain worker file should exist")
	reader_worker_source = reader_worker_path.read_text(encoding="utf-8")
	assert_true("modal.web_server" in reader_worker_source, "Reader-brain worker should expose llama-server through Modal web_server")
	assert_true("startup_timeout=600" in reader_worker_source, "Reader-brain worker should allow slow first llama.cpp model loads")
	assert_true("ghcr.io/ggml-org/llama.cpp:server-cuda12" in reader_worker_source, "Reader-brain worker should use the prebuilt llama.cpp CUDA server image")
	assert_true("ENTRYPOINT []" in reader_worker_source, "Reader-brain worker should clear the prebuilt image entrypoint for Modal's Python runner")
	assert_true("GGML_CUDA=ON" not in reader_worker_source, "Reader-brain worker should not compile llama.cpp during Modal builds")
	assert_true("cmake --build" not in reader_worker_source, "Reader-brain worker should avoid slow CMake builds on Modal")
	assert_true("NVIDIA-Nemotron-3-Nano-4B-GGUF:Q4_K_M" in reader_worker_source, "Reader-brain worker should serve the Nemotron GGUF")
	assert_true('"--reasoning"' in reader_worker_source and '"off"' in reader_worker_source, "Reader-brain worker should disable reasoning mode")
	assert_true('"--ctx-size"' in reader_worker_source and '"4096"' in reader_worker_source, "Reader-brain worker should use T4-safe context size")
	assert_true('"--parallel"' in reader_worker_source and '"1"' in reader_worker_source, "Reader-brain worker should use one parallel slot on T4")
	assert_true('"--n-gpu-layers"' in reader_worker_source and '"999"' in reader_worker_source, "Reader-brain worker should request full GPU offload")
	assert_true("modal.Volume" in reader_worker_source, "Reader-brain worker should cache model downloads in a Modal volume")
	assert_true("tiny-narrator-reader-brain-token" in reader_worker_source, "Reader-brain worker should use a fixed Modal token secret")
	assert_true('"--api-key"' in reader_worker_source, "Reader-brain worker should pass an API key to llama-server when configured")
	assert_true('display_command[key_index] = "***"' in reader_worker_source, "Reader-brain worker should redact API keys in logs")
	assert_true("_find_llama_server" in reader_worker_source, "Reader-brain worker should resolve the prebuilt llama-server binary path")
	assert_true("/app/llama-server" in reader_worker_source, "Reader-brain worker should check the prebuilt image binary path")
	assert_true("binary was not found" in reader_worker_source, "Reader-brain worker should fail with useful binary diagnostics")

	# Test: reader-brain auth wiring sends bearer tokens when configured
	model_response = MagicMock()
	model_response.read.return_value = json.dumps({"data": [{"id": "narrator-brain"}]}).encode("utf-8")
	model_response.__enter__ = lambda s: s
	model_response.__exit__ = MagicMock(return_value=False)
	with patch.object(app, "LLAMA_CPP_BASE_URL", "https://reader.example/v1"), patch.object(app, "LLAMA_CPP_TOKEN", "reader-secret"):
	with patch("urllib.request.urlopen", return_value=model_response) as urlopen_mock:
	app._runtime_status_core()
	status_request = urlopen_mock.call_args.args[0]
	assert_true(
	status_request.headers.get("Authorization") == "Bearer reader-secret",
	"Runtime status should send reader-brain Bearer token when LLAMA_CPP_TOKEN is configured",
	)

	chat_response = MagicMock()
	chat_response.read.return_value = json.dumps({"choices": [{"message": {"content": "Heading. Token protected narration."}}]}).encode("utf-8")
	chat_response.__enter__ = lambda s: s
	chat_response.__exit__ = MagicMock(return_value=False)
	with patch.object(app, "LLAMA_CPP_BASE_URL", "https://reader.example/v1"), patch.object(app, "LLAMA_CPP_TOKEN", "reader-secret"):
	with patch("urllib.request.urlopen", return_value=chat_response) as urlopen_mock:
	app.reader_brain_core("heading", "Token protected narration", "item 1 of 1", "narrate")
	chat_request = urlopen_mock.call_args.args[0]
	assert_true(
	chat_request.headers.get("Authorization") == "Bearer reader-secret",
	"Reader-brain requests should send Bearer token when LLAMA_CPP_TOKEN is configured",
	)

	# Test: auth wiring — app sends bearer token when configured
	with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"), patch.object(app, "KLEIN_MODAL_TOKEN", "test-secret-token"):
	with patch("urllib.request.urlopen", return_value=mock_response) as urlopen_mock:
	app.generate_image_core("auth test", seed=1)
	sent_request = urlopen_mock.call_args.args[0]
	assert_true(
	sent_request.headers.get("Authorization") == "Bearer test-secret-token",
	"App should send Bearer token when KLEIN_MODAL_TOKEN is configured",
	)

	# Test: auth wiring — health check sends bearer token when configured
	good_health = MagicMock()
	good_health.read.return_value = json.dumps({"ok": True, "model": app.MODEL_MANIFEST["image_generation"]["id"], "runtime": "modal-klein"}).encode("utf-8")
	good_health.__enter__ = lambda s: s
	good_health.__exit__ = MagicMock(return_value=False)
	with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"), patch.object(app, "KLEIN_MODAL_TOKEN", "test-secret-token"):
	with patch("urllib.request.urlopen", return_value=good_health) as urlopen_mock:
	app._runtime_status_core()
	health_request = urlopen_mock.call_args.args[0]
	assert_true(
	health_request.headers.get("Authorization") == "Bearer test-secret-token",
	"App should send Bearer token for health checks when KLEIN_MODAL_TOKEN is configured",
	)

	# Test: .env.example includes KLEIN_MODAL_TOKEN
	env_example = (ROOT / ".env.example").read_text(encoding="utf-8")
	assert_true("KLEIN_MODAL_TOKEN" in env_example, ".env.example should document KLEIN_MODAL_TOKEN")
	assert_true("LLAMA_CPP_TOKEN" in env_example, ".env.example should document LLAMA_CPP_TOKEN")

	# Test: worker validates token
	assert_true("KLEIN_MODAL_TOKEN" in worker_source, "Modal worker should read KLEIN_MODAL_TOKEN")
	assert_true("401" in worker_source, "Modal worker should reject unauthorized requests with 401")
	assert_true("_check_token" in worker_source, "Modal worker should have a token validation helper")
	assert_true(
	"async def health(request: Request)" in worker_source,
	"Modal worker health route should accept the request for token validation",
	)

	# Test: runtime setup does not expose the token value
	with patch.object(app, "KLEIN_MODAL_TOKEN", "super-secret-value"):
	setup = app.runtime_setup_core()
	setup_json = json.dumps(setup)
	assert_true("super-secret-value" not in setup_json, "Runtime setup must never expose the token value")
	image_step = next(step for step in setup["steps"] if step["role"] == "image_generation")
	assert_true(
	"KLEIN_MODAL_TOKEN" in image_step["env"],
	"Runtime setup should document KLEIN_MODAL_TOKEN",
	)
	assert_true(
	image_step["env"]["KLEIN_MODAL_TOKEN"] == "(configured)",
	"Runtime setup should show token as configured without exposing the value",
	)

	with patch.object(app, "LLAMA_CPP_TOKEN", "reader-super-secret"):
	setup = app.runtime_setup_core()
	setup_json = json.dumps(setup)
	assert_true("reader-super-secret" not in setup_json, "Runtime setup must never expose the reader token value")
	reader_step = next(step for step in setup["steps"] if step["role"] == "reader_brain")
	assert_true("LLAMA_CPP_TOKEN" in reader_step["env"], "Runtime setup should document LLAMA_CPP_TOKEN")
	assert_true(
	reader_step["env"]["LLAMA_CPP_TOKEN"] == "(configured)",
	"Runtime setup should show reader token as configured without exposing the value",
	)

	# Test: reader-brain runtime status exposes actionable health details without leaking tokens
	with patch.object(app, "LLAMA_CPP_BASE_URL", "https://reader.example/v1"), patch.object(app, "LLAMA_CPP_TOKEN", "reader-secret"):
	http_error = urllib.error.HTTPError(
	"https://reader.example/v1/models",
	401,
	"Unauthorized",
	{},
	None,
	)
	http_error.fp = MagicMock()
	http_error.fp.read.return_value = b'{"detail":"Unauthorized"}'
	with patch("urllib.request.urlopen", side_effect=http_error) as urlopen_mock:
	status = app._runtime_status_core()
	reader_status = status["reader_brain"]
	health_request = urlopen_mock.call_args.args[0]
	assert_true(
	health_request.headers.get("Authorization") == "Bearer reader-secret",
	"Reader-brain health checks should send Bearer token when configured",
	)
	assert_true(
	"HTTPError status=401" in reader_status["warning"],
	"Reader-brain runtime warning should include HTTP status details",
	)
	assert_true(
	"Unauthorized" in reader_status["warning"],
	"Reader-brain runtime warning should include response body details",
	)
	assert_true(
	"reader-secret" not in json.dumps(reader_status),
	"Reader-brain runtime status should not expose token values",
	)
	assert_true(
	reader_status["health_url"] == "https://reader.example/v1/models",
	"Reader-brain runtime status should expose the health URL",
	)

	# Test: runtime status includes Modal Klein path
	with patch.object(app, "KLEIN_MODAL_ENDPOINT", ""):
	status = app._runtime_status_core()
	assert_true("image_generation" in status, "Runtime status should include image_generation")
	assert_true(
	status["image_generation"]["status"] in {"online", "fallback-ready"},
	"Image generation status should be online or fallback-ready",
	)
	assert_true(
	status["image_generation"]["model"] == app.MODEL_MANIFEST["image_generation"]["id"],
	"Image generation status should reference the Klein model",
	)

	# Test: invalid health payload is fallback-ready, not online
	bad_health = MagicMock()
	bad_health.read.return_value = json.dumps({"ok": True, "model": "wrong", "runtime": "modal-klein"}).encode("utf-8")
	bad_health.__enter__ = lambda s: s
	bad_health.__exit__ = MagicMock(return_value=False)
	with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"):
	with patch("urllib.request.urlopen", return_value=bad_health):
	status = app._runtime_status_core()
	assert_true(
	status["image_generation"]["status"] == "fallback-ready",
	"Invalid Modal health should not be marked online",
	)
	assert_true("ValueError" in status["image_generation"].get("warning", ""), "Invalid health should report validation warning")

	# Test: runtime setup includes Modal deploy command
	setup = app.runtime_setup_core()
	image_step = next(step for step in setup["steps"] if step["role"] == "image_generation")
	assert_true(
	"modal deploy" in image_step["command"],
	"Runtime setup should include modal deploy command for image generation",
	)
	assert_true(
	"KLEIN_MODAL_ENDPOINT" in image_step["env"],
	"Runtime setup should document KLEIN_MODAL_ENDPOINT",
	)


	def verify_minicpm_vision_integration() -> None:
	with patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
	result = app.describe_image_core("model-map", caption=None, prompt=None)
	assert_true(result["ok"], "No-config MiniCPM fallback should return ok")
	assert_true(result["runtime"] == "fallback", "No-config MiniCPM should report fallback runtime")
	assert_true(result["model"] == app.MODEL_MANIFEST["vision"]["id"], "No-config MiniCPM should report vision model")
	assert_true(result.get("warning") is None, "No-config MiniCPM fallback should stay quiet")

	mock_response_data = {
	"choices": [
	{
	"message": {
	"content": "A compact diagram shows four small AI models connected around an accessibility reader."
	}
	}
	]
	}
	mock_response = MagicMock()
	mock_response.read.return_value = json.dumps(mock_response_data).encode("utf-8")
	mock_response.__enter__ = lambda s: s
	mock_response.__exit__ = MagicMock(return_value=False)

	with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
	with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
	with patch("urllib.request.urlopen", return_value=mock_response) as urlopen_mock:
	result = app.describe_image_core("model-map", caption="diagram", prompt="model map", image_url="/static/generated/model-map.svg")
	assert_true(result["ok"], "Live MiniCPM response should return ok")
	assert_true(result["runtime"] == "minicpm-v4.6", "Live MiniCPM response should report runtime")
	assert_true(result["model"] == app.MINICPM_VISION_MODEL, "Live MiniCPM response should report configured model")
	assert_true("accessibility reader" in result["alt_text"], "Live MiniCPM response should use returned alt text")
	request = urlopen_mock.call_args.args[0]
	assert_true(
	request.full_url == "https://vision.example/v1/chat/completions",
	"MiniCPM client should normalize base URL to chat completions",
	)
	assert_true(
	request.headers.get("Authorization") == "Bearer secret-key",
	"MiniCPM client should send bearer auth",
	)

	with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
	with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
	with patch.object(app, "PUBLIC_BASE_URL", "https://tiny.example"):
	with patch("urllib.request.urlopen", return_value=mock_response) as urlopen_mock:
	result = app.describe_image_core("model-map", caption="diagram", prompt="model map")
	assert_true(result["runtime"] == "minicpm-v4.6", "Default MiniCPM image-id path should use live response")
	request = urlopen_mock.call_args.args[0]
	request_body = json.loads(request.data.decode("utf-8"))
	image_part = request_body["messages"][0]["content"][1]
	assert_true(
	image_part["image_url"]["url"].startswith("data:image/png;base64,"),
	"MiniCPM default article image path should inline PNG companion assets",
	)
	assert_true(
	"https://tiny.example" not in image_part["image_url"]["url"],
	"MiniCPM default article image path should not depend on public URL fetching",
	)

	invalid_response = MagicMock()
	invalid_response.read.return_value = json.dumps({"choices": [{"message": {"content": ""}}]}).encode("utf-8")
	invalid_response.__enter__ = lambda s: s
	invalid_response.__exit__ = MagicMock(return_value=False)

	with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example"):
	with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
	with patch("urllib.request.urlopen", return_value=invalid_response):
	result = app.describe_image_core("custom", caption="fallback caption", prompt=None, image_url="https://example.com/image.png")
	assert_true(result["runtime"] == "fallback", "Invalid MiniCPM response should fall back")
	assert_true(result["alt_text"] == "fallback caption", "Invalid MiniCPM response should preserve fallback text")
	assert_true(
	result.get("warning") is not None and "ValueError" in result["warning"],
	"Invalid MiniCPM response should include validation warning",
	)

	models_response = MagicMock()
	models_response.read.return_value = json.dumps({"data": [{"id": app.MINICPM_VISION_MODEL}]}).encode("utf-8")
	models_response.__enter__ = lambda s: s
	models_response.__exit__ = MagicMock(return_value=False)

	with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
	with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
	with patch("urllib.request.urlopen", return_value=models_response):
	status = app._vision_runtime_status()
	assert_true(status["status"] == "online", "MiniCPM /models response should mark vision online")
	assert_true("secret-key" not in json.dumps(status), "Vision runtime status should not expose API key")

	ready_response = MagicMock()
	ready_response.read.return_value = json.dumps({"choices": [{"message": {"content": "ready"}}]}).encode("utf-8")
	ready_response.__enter__ = lambda s: s
	ready_response.__exit__ = MagicMock(return_value=False)
	with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
	with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
	with patch("urllib.request.urlopen", side_effect=[urllib.error.HTTPError("https://vision.example/v1/models", 404, "Not Found", {}, None), ready_response]):
	status = app._vision_runtime_status()
	assert_true(status["status"] == "online", "MiniCPM chat completions readiness should mark vision online when /models is unavailable")
	assert_true("chat completions ready" in status.get("warning", ""), "Vision status should explain chat-completions readiness fallback")

	setup = app.runtime_setup_core()
	vision_step = next(step for step in setup["steps"] if step["role"] == "vision")
	assert_true("MiniCPM-V-4.6" in vision_step["model"], "Runtime setup should document MiniCPM-V-4.6")
	assert_true("MINICPM_VISION_BASE_URL" in vision_step["env"], "Runtime setup should document MiniCPM base URL")
	assert_true("secret" not in json.dumps(vision_step).lower(), "Runtime setup should not expose MiniCPM API key")


	def verify_output_retention() -> None:
	keep_path = app.OUTPUT_DIR / "speech-retention-keep.wav"
	_ = app.speak_core("Tiny Narrator retention check.", voice="af_heart", speed=1.0)
	keep_path.write_bytes(b"keep")
	stale_files = []
	for index in range(30):
	stale_path = app.OUTPUT_DIR / f"speech-retention-stale-{index:02d}.wav"
	stale_path.write_bytes(b"stale")
	stale_files.append(stale_path)

	app._prune_speech_outputs(keep_path, max_files=4)

	remaining = list(app.OUTPUT_DIR.glob("speech*.wav"))
	assert_true(keep_path.exists(), "Speech retention should keep the active output")
	assert_true(len(remaining) <= 5, "Speech retention should prune stale generated audio")

	keep_path.unlink(missing_ok=True)
	for stale_path in stale_files:
	stale_path.unlink(missing_ok=True)


	def verify_routes() -> None:
	client = TestClient(app.app)

	home = client.get("/")
	assert_true(home.status_code == 200, "Home route should return 200")
	assert_true("Tiny Narrator" in home.text, "Home route should include app title")
	assert_true('href="/generate">Generate' in home.text, "Home route should link to Generate route")
	assert_true("readerToggle" in home.text, "Home route should include reader toggle")
	assert_true("summaryButton" in home.text, "Home route should include summary control")
	assert_true("imageStatus" in home.text, "Home route should include image status")
	assert_true("voiceStatus" in home.text, "Home route should include voice status")
	assert_true("latencyStatus" in home.text, "Home route should include latency status")
	assert_true("voiceControl" in home.text, "Home route should include voice control")
	assert_true("speedValue" in home.text, "Home route should include speed value output")
	assert_true("autoAdvanceControl" in home.text, "Home route should include auto-advance control")
	assert_true("transcriptLog" in home.text, "Home route should include transcript log")
	assert_true("readerQueueList" not in home.text, "Home route should not include reader queue list")
	assert_true("modelBudgetStatus" in home.text, "Home route should include model stack status")
	assert_true("modelStackList" in home.text, "Home route should include model stack list")
	assert_true("/evidence" not in home.text, "Home route should not link to a removed evidence page")
	assert_true("copyEvidenceButton" not in home.text, "Home route should keep judge evidence off the reader sidebar")

	generate_page = client.get("/generate")
	assert_true(generate_page.status_code == 200, "Generate route should return 200")
	assert_true("Generate a readable article" in generate_page.text, "Generate route should include generator title")
	assert_true("articleGeneratorForm" in generate_page.text, "Generate route should include article generator form")
	assert_true("generatedThumbnail" in generate_page.text, "Generate route should include generated thumbnail")
	assert_true("readerToggle" in generate_page.text, "Generate route should include reader toggle")
	assert_true("summaryButton" in generate_page.text, "Generate route should include summary control")
	assert_true("transcriptLog" in generate_page.text, "Generate route should include transcript log")
	assert_true("speechAudio" in generate_page.text, "Generate route should include speech playback")

	health = client.get("/api/health")
	assert_true(health.status_code == 200, "Health route should return 200")
	payload = health.json()
	assert_true(payload["ok"], "Health payload should be ok")
	assert_true(payload["public_base_url"] == app.PUBLIC_BASE_URL, "Health route should expose the public command base URL")
	assert_true(
	payload["models"]["reader_brain"]["runtime"] == "llama.cpp",
	"Health route should document llama.cpp reader-brain runtime",
	)

	manifest = client.get("/api/article-manifest")
	assert_true(manifest.status_code == 200, "Article manifest route should return 200")
	manifest_payload = manifest.json()
	assert_true("Tiny Titan" in manifest_payload["bonus_targets"], "Manifest should include Tiny Titan target")
	reader_controls = manifest_payload["reader_controls"]
	summary_shortcut = next((item for item in reader_controls if item["key"] == "S"), None)
	assert_true(summary_shortcut is not None, "Manifest should include summary shortcut")
	assert_true(
	summary_shortcut["action"] == "Summarize current section"
	and summary_shortcut["aria_keyshortcuts"] == "S",
	"Manifest summary shortcut should include action and aria-keyshortcuts value",
	)
	assert_true(
	{item["aria_keyshortcuts"] for item in reader_controls} >= {"Space", "N", "P", "H", "I", "S", "R", "Escape"},
	"Manifest should expose aria-keyshortcuts values for reader controls",
	)
	assert_true(
	manifest_payload["models"]["speech"]["id"] == "hexgrad/Kokoro-82M",
	"Manifest should document Kokoro speech model",
	)
	assert_true(
	manifest_payload["reader_settings"]["default_voice"] == "af_heart",
	"Manifest should document default Kokoro voice",
	)
	assert_true(
	len(manifest_payload["reader_settings"]["voices"]) >= 4,
	"Manifest should expose multiple Kokoro voice choices",
	)
	assert_true(
	manifest_payload["reader_settings"]["default_auto_advance"] is False,
	"Manifest should default auto-advance off",
	)
	assert_true(
	len(manifest_payload["award_evidence"]) == 4,
	"Manifest should expose four award evidence items",
	)
	assert_true(
	manifest_payload["model_budget"]["all_models_within_limit"],
	"Manifest should prove every model is within the Tiny Titan limit",
	)
	assert_true(
	len(manifest_payload["runtime_setup"]["steps"]) == 4,
	"Manifest should expose setup steps for each model role",
	)
	assert_true(
	len(manifest_payload["demo_script"]["actions"]) >= 4,
	"Manifest should expose a judge demo script",
	)
	assert_true(
	manifest_payload["accessibility_audit"]["all_passed"],
	"Manifest should expose passing accessibility audit evidence",
	)

	awards = client.get("/api/award-evidence")
	assert_true(awards.status_code == 200, "Award evidence route should return 200")
	award_payload = awards.json()
	assert_true(award_payload["ok"], "Award evidence payload should be ok")
	assert_true(
	{item["id"] for item in award_payload["items"]} == {"tiny-titan", "llama-champion", "off-brand", "field-notes"},
	"Award evidence route should cover the targeted bonuses",
	)

	budget = client.get("/api/model-budget")
	assert_true(budget.status_code == 200, "Model budget route should return 200")
	budget_payload = budget.json()
	assert_true(budget_payload["ok"], "Model budget payload should be ok")
	assert_true(budget_payload["limit_billion"] == 4.0, "Tiny Titan limit should be 4B")
	assert_true(budget_payload["all_models_within_limit"], "All models should stay within the Tiny Titan limit")
	assert_true(
	all(item["params_billion"] <= budget_payload["limit_billion"] for item in budget_payload["models"]),
	"Every model budget item should be at or below the limit",
	)

	setup = client.get("/api/runtime-setup")
	assert_true(setup.status_code == 200, "Runtime setup route should return 200")
	setup_payload = setup.json()
	assert_true(setup_payload["ok"], "Runtime setup payload should be ok")
	assert_true(
	{item["role"] for item in setup_payload["steps"]}
	== {"reader_brain", "speech", "vision", "image_generation"},
	"Runtime setup should cover every model path",
	)
	assert_true(
	"llama-server" in setup_payload["steps"][0]["command"],
	"Runtime setup should include the llama.cpp launch command",
	)
	assert_true(
	setup_payload["steps"][0]["modal_command"] == "modal deploy modal_workers/reader_brain.py",
	"Runtime setup should include the Modal reader-brain deploy command",
	)
	assert_true(
	"--reasoning off" in setup_payload["steps"][0]["command"],
	"Runtime setup should document non-reasoning llama.cpp mode",
	)
	assert_true(
	setup_payload["app"]["env"]["PUBLIC_BASE_URL"] == app.PUBLIC_BASE_URL,
	"Runtime setup should expose the public command base URL",
	)

	demo = client.get("/api/demo-script")
	assert_true(demo.status_code == 200, "Demo script route should return 200")
	demo_payload = demo.json()
	assert_true(demo_payload["ok"], "Demo script payload should be ok")
	assert_true(
	"Tiny Narrator judge demo" == demo_payload["title"],
	"Demo script should be labeled for judging",
	)
	assert_true(
	{item["path"] for item in demo_payload["api_checks"]} >= {"/api/model-budget", "/api/runtime-setup"},
	"Demo script should include evidence API checks",
	)
	assert_true(
	any("Tiny Titan" in action["evidence"] for action in demo_payload["actions"]),
	"Demo script should point to targeted award evidence",
	)
	assert_true(
	any(item["path"] == "/api/accessibility-audit" for item in demo_payload["api_checks"]),
	"Demo script should include the accessibility audit check",
	)
	assert_true(
	any(item["path"] == "/api/submission-readiness" for item in demo_payload["api_checks"]),
	"Demo script should include the submission readiness check",
	)
	reader_check = next(item for item in demo_payload["api_checks"] if item["path"] == "/api/reader-brain")
	speech_check = next(item for item in demo_payload["api_checks"] if item["path"] == "/api/speak")
	assert_true(reader_check["sample_body"]["mode"] == "narrate", "Reader-brain demo check should include a sample body")
	assert_true(
	speech_check["sample_body"]["voice"] == app.READER_SETTINGS["default_voice"],
	"Speech demo check should use the default reader voice",
	)
	assert_true(
	all(item.get("sample_body") for item in demo_payload["api_checks"] if item["method"] == "POST"),
	"Every POST demo check should include an executable sample body",
	)
	assert_true(
	all(item["curl"].startswith("curl ") for item in demo_payload["api_checks"]),
	"Every demo API check should include a curl command",
	)
	assert_true(
	all(app.PUBLIC_BASE_URL in item["curl"] for item in demo_payload["api_checks"]),
	"Every curl command should use the public command base URL",
	)
	assert_true(
	all(item["powershell"].startswith("curl.exe ") for item in demo_payload["api_checks"]),
	"Every demo API check should include a PowerShell-friendly curl.exe command",
	)
	assert_true(
	all(app.PUBLIC_BASE_URL in item["powershell"] for item in demo_payload["api_checks"]),
	"Every PowerShell command should use the public command base URL",
	)
	assert_true(
	"-d '" in reader_check["curl"] and "/api/reader-brain" in reader_check["curl"],
	"Reader-brain curl command should include the sample JSON body",
	)
	assert_true(
	'\\"node_type\\"' in reader_check["powershell"] and "/api/reader-brain" in reader_check["powershell"],
	"Reader-brain PowerShell command should include escaped sample JSON",
	)
	reader_sample = client.post(reader_check["path"], json=reader_check["sample_body"])
	assert_true(reader_sample.status_code == 200, "Reader-brain sample payload should be executable")
	reader_sample_payload = reader_sample.json()
	assert_true(reader_sample_payload["ok"], "Reader-brain sample payload should return ok")
	assert_true("narration" in reader_sample_payload, "Reader-brain sample payload should return narration")

	speech_sample = client.post(speech_check["path"], json=speech_check["sample_body"])
	assert_true(speech_sample.status_code == 200, "Speech sample payload should be executable")
	speech_sample_payload = speech_sample.json()
	assert_true(speech_sample_payload["ok"], "Speech sample payload should return ok")
	assert_true(
	speech_sample_payload["audio_url"].startswith("/outputs/"),
	"Speech sample payload should return an output audio URL",
	)

	article_sample = client.post("/api/generate-article", json={"topic": "accessible classroom robotics"})
	assert_true(article_sample.status_code == 200, "Article generation route should return 200")
	article_sample_payload = article_sample.json()
	assert_true(article_sample_payload["ok"], "Article generation payload should return ok")
	assert_true(len(article_sample_payload["article"]["sections"]) == 5, "Article generation payload should include five sections")
	assert_true(
	article_sample_payload["thumbnail"]["generation_model"] == app.MODEL_MANIFEST["image_generation"]["id"],
	"Article generation payload should include Klein thumbnail provenance",
	)

	audit = client.get("/api/accessibility-audit")
	assert_true(audit.status_code == 200, "Accessibility audit route should return 200")
	audit_payload = audit.json()
	assert_true(audit_payload["ok"], "Accessibility audit payload should be ok")
	assert_true(audit_payload["all_passed"], "Accessibility audit should pass")
	assert_true(audit_payload["passed_checks"] == audit_payload["total_checks"], "All audit checks should pass")
	assert_true(
	{item["id"] for item in audit_payload["checks"]}
	>= {
	"semantic_queue",
	"keyboard_navigation",
	"reader_cursor",
	"shortcut_safety",
	"live_region",
	"image_alt_text",
	"inspectable_transcript",
	},
	"Accessibility audit should cover reader semantics, keyboard use, cursor state, shortcut safety, live narration, alt text, and transcript",
	)

	readiness = client.get("/api/submission-readiness")
	assert_true(readiness.status_code == 200, "Submission readiness route should return 200")
	readiness_payload = readiness.json()
	assert_true(readiness_payload["ok"], "Submission readiness payload should be ok")
	assert_true(readiness_payload["all_passed"], "Submission readiness checks should pass")
	assert_true(
	{item["id"] for item in readiness_payload["checks"]}
	>= {
	"tiny_titan_budget",
	"award_targets",
	"custom_frontend",
	"runtime_setup",
	"runtime_status",
	"reader_accessibility",
	"image_receipts",
	"demo_api_checks",
	"command_base_url",
	},
	"Submission readiness should aggregate model, award, frontend, runtime, accessibility, image, and demo evidence",
	)
	runtime_status_check = next(item for item in readiness_payload["checks"] if item["id"] == "runtime_status")
	assert_true(runtime_status_check["status"] == "pass", "Submission readiness should pass runtime status checks")
	demo_api_check = next(item for item in readiness_payload["checks"] if item["id"] == "demo_api_checks")
	assert_true(demo_api_check["status"] == "pass", "Submission readiness should pass executable demo API checks")
	command_base_check = next(item for item in readiness_payload["checks"] if item["id"] == "command_base_url")
	assert_true(command_base_check["status"] == "pass", "Submission readiness should pass command base URL checks")

	evidence = client.get("/api/evidence-bundle")
	assert_true(evidence.status_code == 200, "Evidence bundle route should return 200")
	evidence_payload = evidence.json()
	assert_true(evidence_payload["ok"], "Evidence bundle payload should be ok")
	assert_true(evidence_payload["schema_version"] == "1.0", "Evidence bundle should include schema version")
	assert_true(evidence_payload["generated_at"].endswith("Z"), "Evidence bundle should include UTC timestamp")
	assert_true(evidence_payload["public_base_url"] == app.PUBLIC_BASE_URL, "Evidence bundle should include public base URL")
	assert_true(evidence_payload["submission_readiness"]["all_passed"], "Evidence bundle should include passing readiness")
	assert_true(evidence_payload["model_budget"]["all_models_within_limit"], "Evidence bundle should include Tiny Titan proof")
	assert_true(
	{"runtime_status", "demo_script", "accessibility_audit", "image_descriptions"} <= set(evidence_payload),
	"Evidence bundle should include runtime status, demo script, accessibility audit, and image descriptions",
	)
	assert_true(evidence_payload["runtime_status"]["ok"], "Evidence bundle should include ok runtime status")
	assert_true(
	{"reader_brain", "speech", "image_generation"} <= set(evidence_payload["runtime_status"]),
	"Evidence bundle runtime status should include reader brain, speech, and image generation status",
	)
	assert_true(
	evidence_payload["runtime_status"]["reader_brain"]["status"] in {"online", "fallback-ready"},
	"Evidence bundle reader brain status should be online or fallback-ready",
	)
	assert_true(
	evidence_payload["runtime_status"]["speech"]["status"] in {"online", "fallback-ready"},
	"Evidence bundle speech status should be online or fallback-ready",
	)
	assert_true(
	evidence_payload["runtime_status"]["image_generation"]["status"] in {"online", "fallback-ready"},
	"Evidence bundle image generation status should be online or fallback-ready",
	)

	runtime = client.get("/api/runtime-status")
	assert_true(runtime.status_code == 200, "Runtime status route should return 200")
	runtime_payload = runtime.json()
	assert_true(runtime_payload["ok"], "Runtime status payload should be ok")
	assert_true("reader_brain" in runtime_payload, "Runtime status should include reader brain status")
	assert_true("speech" in runtime_payload, "Runtime status should include speech status")
	assert_true("image_generation" in runtime_payload, "Runtime status should include image generation status")
	assert_true(
	runtime_payload["reader_brain"]["status"] in {"online", "fallback-ready"},
	"Reader brain status should be online or fallback-ready",
	)
	assert_true(
	runtime_payload["image_generation"]["status"] in {"online", "fallback-ready"},
	"Image generation status should be online or fallback-ready",
	)
	assert_true(
	runtime_payload["image_generation"]["model"] == app.MODEL_MANIFEST["image_generation"]["id"],
	"Image generation status should reference the Klein model",
	)

	image_descriptions = client.get("/api/image-descriptions")
	assert_true(image_descriptions.status_code == 200, "Image descriptions route should return 200")
	image_payload = image_descriptions.json()
	assert_true(image_payload["model"] == app.MODEL_MANIFEST["vision"]["id"], "Image route should document MiniCPM-V model")
	assert_true(image_payload["runtime"] == "fallback", "Image route should use fallback runtime without MiniCPM config")
	assert_true(
	{item["id"] for item in image_payload["descriptions"]} == {"desk-reader", "model-map"},
	"Image route should describe all visible article images",
	)
	assert_true(
	all(item["generation_model"] == app.MODEL_MANIFEST["image_generation"]["id"] for item in image_payload["descriptions"]),
	"Image route should expose image-generation provenance",
	)
	assert_true(
	all(item["generation_status"] == "fallback-ready" for item in image_payload["descriptions"]),
	"Image route should label bundled image fallback status",
	)

	# Verify generate-image endpoint returns fallback when Modal is not configured
	gen_image = client.post("/api/generate-image", json={"prompt": "test thumbnail", "seed": 7})
	assert_true(gen_image.status_code == 200, "Generate image route should return 200")
	gen_image_payload = gen_image.json()
	assert_true(gen_image_payload["ok"], "Generate image payload should be ok")
	assert_true(gen_image_payload["model"] == app.MODEL_MANIFEST["image_generation"]["id"], "Generate image should report Klein model")
	assert_true(gen_image_payload["runtime"] == "fallback", "Generate image without Modal should report fallback")
	assert_true(isinstance(gen_image_payload["elapsed_ms"], int), "Generate image should include elapsed_ms")


	def main() -> None:
	py_compile.compile(str(ROOT / "app.py"), doraise=True)
	py_compile.compile(str(ROOT / "modal_workers" / "klein_image.py"), doraise=True)
	py_compile.compile(str(ROOT / "modal_workers" / "reader_brain.py"), doraise=True)
	verify_static_assets()
	verify_space_metadata()
	verify_dotenv_wiring()
	verify_live_smoke_script()
	verify_core_fallbacks()
	verify_modal_klein_integration()
	verify_minicpm_vision_integration()
	verify_output_retention()
	verify_routes()
	print("Tiny Narrator verification passed.")


	if __name__ == "__main__":
	main()