TinyNarrator / scripts /verify.py
cvpfus
Document Docker Space metadata and fallbacks
4565f15
Raw
History Blame Contribute Delete
75.1 kB
from __future__ import annotations
import json
import py_compile
import sys
import urllib.error
import wave
from pathlib import Path
from unittest.mock import patch, MagicMock
ROOT = Path(__file__).resolve().parents[1]
sys.path.insert(0, str(ROOT))
import app
from fastapi.testclient import TestClient
def assert_true(condition: bool, message: str) -> None:
if not condition:
raise AssertionError(message)
def verify_static_assets() -> None:
required = [
ROOT / "LICENSE",
ROOT / "DEPLOY_SPACES.md",
ROOT / "Dockerfile",
ROOT / "start.sh",
ROOT / "SUBMISSION.md",
ROOT / "static" / "index.html",
ROOT / "static" / "generate.html",
ROOT / "static" / "app.css",
ROOT / "static" / "app.js",
ROOT / "static" / "generate.js",
ROOT / "static" / "generated" / "desk-reader.svg",
ROOT / "static" / "generated" / "desk-reader.png",
ROOT / "static" / "generated" / "model-map.svg",
ROOT / "static" / "generated" / "model-map.png",
ROOT / "static" / "generated" / "field-notes.svg",
]
for path in required:
assert_true(path.exists(), f"Missing required asset: {path}")
try:
from PIL import Image
for path in [ROOT / "static" / "generated" / "desk-reader.png", ROOT / "static" / "generated" / "model-map.png"]:
with Image.open(path) as image:
assert_true(image.size == (1200, 675), f"Vision PNG should match article image ratio: {path}")
assert_true(image.format == "PNG", f"Vision companion asset should be PNG: {path}")
except ImportError:
pass
app_js = (ROOT / "static" / "app.js").read_text(encoding="utf-8")
app_source = (ROOT / "app.py").read_text(encoding="utf-8")
generate_js = (ROOT / "static" / "generate.js").read_text(encoding="utf-8")
index_html = (ROOT / "static" / "index.html").read_text(encoding="utf-8")
generate_html = (ROOT / "static" / "generate.html").read_text(encoding="utf-8")
deploy_spaces = (ROOT / "DEPLOY_SPACES.md").read_text(encoding="utf-8")
dockerfile = (ROOT / "Dockerfile").read_text(encoding="utf-8")
start_script = (ROOT / "start.sh").read_text(encoding="utf-8")
assert_true("FROM python:3.12-slim" in dockerfile, "Spaces Dockerfile should use a free CPU Python base image")
assert_true("nvidia/cuda" not in dockerfile, "Spaces Dockerfile should not require paid HF GPU CUDA image")
assert_true("llama-server" not in start_script, "Spaces start script should not launch local llama.cpp")
assert_true("free CPU" in deploy_spaces, "Spaces deploy guide should describe free CPU deployment")
assert_true("modal_workers/reader_brain.py" in deploy_spaces, "Spaces deploy guide should document Modal reader-brain deployment")
assert_true("CPU Basic" in deploy_spaces, "Spaces deploy guide should recommend CPU Basic hardware")
assert_true("LLAMA_CPP_TOKEN" in deploy_spaces, "Spaces deploy guide should document reader-brain auth token")
assert_true("tiny-narrator-reader-brain-token" in deploy_spaces, "Spaces deploy guide should document the Modal reader token secret")
assert_true('href="/" aria-current="page">Reader' in index_html, "Reader page should mark Reader route current")
assert_true('href="/generate">Generate' in index_html, "Reader page should link to Generate route")
assert_true('href="/">Reader' in generate_html, "Generate page should link back to Reader route")
assert_true('href="/generate" aria-current="page">Generate' in generate_html, "Generate page should mark Generate route current")
assert_true("articleGeneratorForm" in generate_html, "Generate page should expose the article generator form")
assert_true("generatedThumbnail" in generate_html, "Generate page should expose a generated thumbnail preview")
assert_true("readerToggle" in generate_html, "Generate page should expose a screen reader toggle")
assert_true("transcriptLog" in generate_html, "Generate page should expose a narration transcript")
assert_true("speechAudio" in generate_html, "Generate page should expose speech playback")
assert_true("/api/generate-article" in generate_js, "Generate frontend should call article generation API")
assert_true("/api/reader-brain" in generate_js, "Generate frontend should call reader-brain narration API")
assert_true("/api/speak" in generate_js, "Generate frontend should call speech API")
assert_true('node.type === "image"' in generate_js, "Generate reader should reserve reader-brain item narration for images")
assert_true('runtime: "raw text"' in generate_js, "Generate reader should speak text-only nodes without reader-brain")
assert_true("Image description." in generate_js, "Generate reader should force image narration to announce image descriptions")
assert_true("refreshReaderNodes" in generate_js, "Generate frontend should build a generated article reader path")
assert_true('data-reader-type="heading"' in generate_js, "Generated article sections should mark heading reader nodes")
assert_true('data-reader-type="paragraph"' in generate_js, "Generated article sections should mark paragraph reader nodes")
assert_true("thumbnail.generation_model" in generate_js, "Generate frontend should render Klein thumbnail receipt")
assert_true('data-reader-type="heading"' in index_html, "Article should mark heading reader nodes")
assert_true('data-reader-type="image"' in index_html, "Article should mark image reader nodes")
assert_true("vision_asset_url" in app_source, "Article images should expose PNG assets for vision APIs")
assert_true("/static/generated/desk-reader.png" in app_source, "Desk reader should have a PNG vision asset")
assert_true("/static/generated/model-map.png" in app_source, "Model map should have a PNG vision asset")
assert_true('href="#notes"' not in index_html, "Article navigation should not include the Field Notes section")
assert_true('id="notes"' not in index_html, "Article UI should not render the Field Notes section")
assert_true("Field Notes" not in index_html, "Article UI should not render Field Notes copy")
assert_true("Field Notes" not in generate_html, "Generate UI should not render Field Notes copy")
assert_true('alt=""' not in index_html, "Article images should not start with empty alt text")
assert_true(
"reader brain, vision, speech, and image generation models" in index_html,
"Article should include meaningful fallback alt text for generated images",
)
assert_true('aria-live="polite"' in index_html, "Article should expose an aria-live narration region")
for shortcut in ['aria-keyshortcuts="Space"', 'aria-keyshortcuts="N"', 'aria-keyshortcuts="R"', 'aria-keyshortcuts="S"']:
assert_true(shortcut in index_html, f"Reader controls should expose {shortcut}")
assert_true("transcriptLog" in index_html, "Article should expose a visible transcript log")
assert_true("readerQueueList" not in index_html, "Article sidebar should not include a visible reader queue")
assert_true("repeatButton" in index_html, "Reader controls should expose a visible repeat command")
assert_true("stopButton" in index_html, "Reader controls should expose a visible stop command")
assert_true("modelStackList" in index_html, "Article sidebar should expose the model stack panel")
assert_true("modelBudgetStatus" in index_html, "Article sidebar should expose model stack status")
for removed_id in [
"demoScriptList",
"demoApiCheckList",
"imageReceiptList",
"runtimeStatusList",
"submissionReadinessList",
"copyEvidenceButton",
"modelBudgetList",
"runtimeSetupList",
]:
assert_true(removed_id not in index_html, f"Article sidebar should not include removed evidence panel: {removed_id}")
assert_true("loadDemoScript" not in app_js, "Article frontend should not render the structured demo script")
assert_true("loadModelBudget" in app_js, "Article frontend should render the model stack panel")
assert_true("/api/model-budget" in app_js, "Article frontend should fetch model budget data")
assert_true("/api/runtime-status" in app_js, "Article frontend should fetch runtime status")
assert_true("status-pill" in app_js or "statusClass" in app_js, "Article frontend should render per-role status labels")
assert_true("modelStackList.innerHTML" in app_js, "Article frontend should render model stack items")
assert_true("Tiny Titan pass" in app_js, "Article frontend should render per-model Tiny Titan pass labels")
assert_true("/evidence" not in index_html, "Article page should not link to a removed evidence page")
assert_true("copyTextToClipboard" in app_js, "Frontend copy actions should share clipboard fallback handling")
assert_true(
"Transcript is visible, but clipboard access is unavailable." in app_js,
"Transcript copy should report unavailable clipboard access",
)
assert_true("transcript-position" in app_js, "Transcript should render the narrated reader position")
assert_true("readerItemStatus(node)" in app_js, "Narration transcript entries should include reader item position")
assert_true('node.type === "image"' in app_js, "Article reader should reserve reader-brain item narration for images")
assert_true('runtime: "raw text"' in app_js, "Article reader should speak text-only nodes without reader-brain")
assert_true("Image description." in app_js, "Article reader should force image narration to announce image descriptions")
assert_true(
"[${entry.type} / ${entry.position} / ${entry.runtime}]" in app_js,
"Copied transcript should include type, position, and runtime",
)
assert_true("function haltPlayback" in app_js, "Reader controls should expose a shared playback halt helper")
assert_true(
"haltPlayback({ clearAutoAdvance: false });" in app_js,
"New narration commands should interrupt current speech immediately",
)
assert_true("aria-current" in app_js, "Reader mode should expose the active item as current")
assert_true("shouldHandleReaderShortcut" in app_js, "Reader shortcuts should not hijack form controls")
assert_true("controls.repeat.click()" in app_js, "R should route through the visible repeat command")
assert_true("controls.stop.click()" in app_js, "Escape should route through the visible stop command")
assert_true("reader-node-" in app_js, "Reader nodes should receive stable ids for control context")
assert_true("renderReaderQueue" not in app_js, "Frontend should not render a visible reader queue")
assert_true("readerQueueList" not in app_js, "Frontend should not bind a visible reader queue")
assert_true("narrate(node.index)" in app_js, "Reader mode should support click-to-read article items")
assert_true("describeGeneratedThumbnail" in generate_js, "Generate frontend should describe generated thumbnails")
assert_true("/api/describe-image" in generate_js, "Generate frontend should call describe-image for thumbnails")
assert_true("image_url" in generate_js, "Generate frontend should send image_url to describe-image")
assert_true("generatedThumbnail.alt" in generate_js, "Generate frontend should update thumbnail alt from descriptor")
assert_true("fallbackAlt" in generate_js, "Generate frontend should preserve fallback alt on descriptor failure")
submission = (ROOT / "SUBMISSION.md").read_text(encoding="utf-8")
for target in ["Tiny Titan", "Llama Champion", "Off-Brand", "Field Notes"]:
assert_true(target in submission, f"Submission packet should mention {target}")
for endpoint in [
"/api/model-budget",
"/api/runtime-setup",
"/api/accessibility-audit",
"/api/demo-script",
"/api/submission-readiness",
"/api/evidence-bundle",
"/api/generate-article",
]:
assert_true(endpoint in submission, f"Submission packet should mention {endpoint}")
assert_true(
"nvidia/NVIDIA-Nemotron-3-Nano-4B-GGUF" in submission,
"Submission packet should include the reader-brain model",
)
for evidence in ["reader cursor", "shortcut safety", "aria-current"]:
assert_true(evidence in submission, f"Submission packet should mention {evidence}")
for evidence in ["prompt", "seed", "FLUX.2-klein-4B", "fallback asset"]:
assert_true(evidence in submission, f"Submission packet should mention image receipt evidence: {evidence}")
def front_matter_value(readme: str, key: str) -> str:
lines = readme.splitlines()
if not lines or lines[0] != "---":
return ""
for line in lines[1:]:
if line == "---":
break
name, separator, value = line.partition(":")
if separator and name.strip() == key:
return value.strip()
return ""
def verify_space_metadata() -> None:
readme = (ROOT / "README.md").read_text(encoding="utf-8")
requirements = (ROOT / "requirements.txt").read_text(encoding="utf-8").splitlines()
license_text = (ROOT / "LICENSE").read_text(encoding="utf-8")
sdk = front_matter_value(readme, "sdk")
app_port = front_matter_value(readme, "app_port")
emoji = front_matter_value(readme, "emoji")
title = front_matter_value(readme, "title")
license_id = front_matter_value(readme, "license")
assert_true(title == "Tiny Narrator", "Space metadata should name the app")
assert_true(sdk == "docker", "Space metadata should declare the Docker SDK")
assert_true(app_port == "7860", "Docker Space metadata should expose app_port 7860")
assert_true(emoji and "ð" not in emoji, "Space metadata emoji should be valid UTF-8")
assert_true(license_id == "apache-2.0", "Space metadata should declare the Apache-2.0 license")
assert_true("Apache License" in license_text, "Repository should include the Apache license text")
assert_true("Version 2.0" in license_text, "Repository license should match Space metadata")
assert_true(any(line.startswith("gradio==") for line in requirements), "requirements.txt should pin Gradio")
for package in ["pydantic", "kokoro", "soundfile", "python-dotenv"]:
assert_true(
any(
line.startswith(f"{package}>=") or line.startswith(f"{package}==") or line.strip() == package
for line in requirements
),
f"requirements.txt should include {package}",
)
def verify_dotenv_wiring() -> None:
"""Verify that python-dotenv is wired in before core env constants are read."""
requirements = (ROOT / "requirements.txt").read_text(encoding="utf-8").splitlines()
assert_true(
any(line.strip() == "python-dotenv" or line.startswith("python-dotenv>=") for line in requirements),
"requirements.txt should include python-dotenv",
)
app_source = (ROOT / "app.py").read_text(encoding="utf-8")
assert_true("from dotenv import load_dotenv" in app_source, "app.py should import load_dotenv")
assert_true("load_dotenv()" in app_source, "app.py should call load_dotenv()")
import_pos = app_source.index("from dotenv import load_dotenv")
call_pos = app_source.index("load_dotenv()")
llama_const = app_source.index("LLAMA_CPP_BASE_URL = os.getenv")
assert_true(
import_pos < call_pos < llama_const,
"load_dotenv() should be called before LLAMA_CPP_BASE_URL is assigned",
)
env_example = ROOT / ".env.example"
assert_true(env_example.exists(), ".env.example should exist")
env_content = env_example.read_text(encoding="utf-8")
for secret_pattern in ["sk-", "AKIA", "ghp_", "xoxb-"]:
assert_true(
secret_pattern not in env_content,
f".env.example should not contain real-looking secrets ({secret_pattern})",
)
def verify_live_smoke_script() -> None:
"""Verify that the live smoke test script exists, is syntactically valid, and documents redaction."""
smoke_path = ROOT / "scripts" / "live_smoke.py"
assert_true(smoke_path.exists(), "scripts/live_smoke.py should exist")
py_compile.compile(str(smoke_path), doraise=True)
smoke_source = smoke_path.read_text(encoding="utf-8")
assert_true("--base-url" in smoke_source, "Smoke script should support --base-url argument")
assert_true("/api/runtime-status" in smoke_source, "Smoke script should check runtime status")
assert_true("/api/describe-image" in smoke_source, "Smoke script should check describe-image")
assert_true("/api/generate-image" in smoke_source, "Smoke script should check generate-image")
assert_true("_role_is_configured" in smoke_source, "Smoke script should fail configured live paths instead of skipping them")
assert_true('details.get("configured") is True' in smoke_source, "Smoke script should preserve configured metadata from runtime status")
assert_true("SKIP" in smoke_source or "skip" in smoke_source, "Smoke script should document skipping behavior")
assert_true("Secrets" in smoke_source or "secrets" in smoke_source or "never printed" in smoke_source.lower(), "Smoke script should document secret redaction")
def verify_core_fallbacks() -> None:
no_live_reader = [
patch.object(app, "LLAMA_CPP_BASE_URL", ""),
patch.object(app, "MINICPM_VISION_BASE_URL", ""),
patch.object(app, "MINICPM_VISION_API_KEY", ""),
]
for patcher in no_live_reader:
patcher.start()
try:
narration = app.reader_brain_core(
node_type="heading",
text="Why tiny models matter",
position="item 1 of 1",
mode="narrate",
)
finally:
for patcher in reversed(no_live_reader):
patcher.stop()
assert_true(narration["ok"], "Reader-brain fallback did not return ok")
assert_true("Heading." in narration["narration"], "Reader-brain fallback lost heading prefix")
assert_true(isinstance(narration["elapsed_ms"], int), "Reader-brain response should include elapsed_ms")
with patch.object(app, "LLAMA_CPP_BASE_URL", ""), patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
image_fallback = app.reader_brain_core(
node_type="image",
text="A highlighted paragraph sits beside playback controls.",
position="item 1 of 1",
mode="narrate",
)
assert_true(
image_fallback["narration"].startswith("Image description."),
"Image fallback narration should clearly announce image descriptions",
)
with patch.object(app, "LLAMA_CPP_BASE_URL", ""), patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
summary = app.reader_brain_core(
node_type="section",
text="Tiny models can run close to the reader. They keep latency low and preserve privacy.",
position="Why",
mode="summarize",
)
assert_true(summary["ok"], "Reader-brain summary fallback did not return ok")
assert_true(summary["narration"].startswith("Summary."), "Summary fallback should announce summary mode")
with patch.object(app, "LLAMA_CPP_BASE_URL", ""), patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
unconfigured_reader = app.reader_brain_core(
node_type="paragraph",
text="This paragraph should be narrated without a configured endpoint.",
position="item 1 of 1",
mode="narrate",
)
assert_true(unconfigured_reader["runtime"] == "fallback", "Unconfigured reader brain should use fallback")
assert_true(
"not configured" in unconfigured_reader["warning"],
"Unconfigured reader brain should explain the missing endpoint",
)
unconfigured_article = app.generate_article_core("accessible classroom tools")
assert_true(unconfigured_article["runtime"] == "fallback", "Unconfigured article generation should use fallback")
assert_true(
"not configured" in unconfigured_article["warning"],
"Unconfigured article generation should explain the missing endpoint",
)
empty_llama_response = MagicMock()
empty_llama_response.read.return_value = json.dumps({"choices": [{"message": {"content": ""}}]}).encode("utf-8")
empty_llama_response.__enter__ = lambda s: s
empty_llama_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
with patch("urllib.request.urlopen", return_value=empty_llama_response):
empty_narration = app.reader_brain_core(
node_type="paragraph",
text="This paragraph still needs narration.",
position="item 2 of 3",
mode="narrate",
)
assert_true(empty_narration["runtime"] == "fallback", "Empty llama.cpp response should use fallback narration")
assert_true(empty_narration["narration"], "Empty llama.cpp response should not return empty narration")
minicpm_reader_response = MagicMock()
minicpm_reader_response.read.return_value = json.dumps(
{"choices": [{"message": {"content": "Fallback narration from MiniCPM."}}]}
).encode("utf-8")
minicpm_reader_response.__enter__ = lambda s: s
minicpm_reader_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "LLAMA_CPP_BASE_URL", "https://llama.example/v1"):
with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
with patch("urllib.request.urlopen", side_effect=[urllib.error.URLError("llama down"), minicpm_reader_response]) as urlopen_mock:
minicpm_narration = app.reader_brain_core(
node_type="paragraph",
text="This paragraph should use MiniCPM after llama.cpp fails.",
position="item 2 of 3",
mode="narrate",
)
minicpm_request = urlopen_mock.call_args_list[1].args[0]
minicpm_body = json.loads(minicpm_request.data.decode("utf-8"))
assert_true(minicpm_narration["runtime"] == "minicpm-v4.6-fallback", "MiniCPM should run before rule fallback")
assert_true(minicpm_narration["model"] == app.MINICPM_VISION_MODEL, "MiniCPM reader fallback should report MiniCPM model")
assert_true(minicpm_body["model"] == app.MINICPM_VISION_MODEL, "MiniCPM fallback should send MiniCPM model id")
assert_true("llama.cpp unavailable" in minicpm_narration["warning"], "MiniCPM fallback should preserve primary failure warning")
reasoning_response = MagicMock()
reasoning_response.read.return_value = json.dumps(
{"choices": [{"message": {"content": "", "reasoning_content": "Heading. Live narration from llama.cpp."}}]}
).encode("utf-8")
reasoning_response.__enter__ = lambda s: s
reasoning_response.__exit__ = MagicMock(return_value=False)
with patch("urllib.request.urlopen", return_value=reasoning_response):
reasoning_narration = app.reader_brain_core(
node_type="heading",
text="Live heading",
position="item 1 of 1",
mode="narrate",
)
assert_true(reasoning_narration["runtime"] == "llama.cpp", "Reader brain should use alternate llama.cpp message text fields")
assert_true("Live narration" in reasoning_narration["narration"], "Reader brain should extract reasoning_content when content is empty")
image_llama_response = MagicMock()
image_llama_response.read.return_value = json.dumps(
{"choices": [{"message": {"content": "A digital reader shows a highlighted paragraph and playback controls."}}]}
).encode("utf-8")
image_llama_response.__enter__ = lambda s: s
image_llama_response.__exit__ = MagicMock(return_value=False)
with patch("urllib.request.urlopen", return_value=image_llama_response):
image_narration = app.reader_brain_core(
node_type="image",
text="A digital reader shows a highlighted paragraph and playback controls.",
position="item 2 of 3",
mode="narrate",
)
assert_true(image_narration["runtime"] == "llama.cpp", "Image narration should use live reader-brain when available")
assert_true(
image_narration["narration"].startswith("Image description."),
"Live reader-brain image narration should keep an image description prefix",
)
description = app.describe_image_core("model-map", caption=None, prompt=None)
assert_true(description["ok"], "Image description did not return ok")
assert_true("small AI models" in description["alt_text"], "Image description fallback changed unexpectedly")
assert_true(description["runtime"] == "fallback", "Image description without MiniCPM config should use fallback runtime")
assert_true(description["model"] == app.MODEL_MANIFEST["vision"]["id"], "Image description should report the vision model id")
assert_true(isinstance(description["elapsed_ms"], int), "Image description should include elapsed_ms")
article_descriptions = app.describe_article_images_core()
assert_true(article_descriptions["ok"], "Article image descriptions did not return ok")
assert_true(len(article_descriptions["descriptions"]) == 2, "Article should expose two image descriptions")
assert_true(
all(item["generation_model"] == app.MODEL_MANIFEST["image_generation"]["id"] for item in article_descriptions["descriptions"]),
"Article image descriptions should include the planned image-generation model",
)
assert_true(
all(isinstance(item["seed"], int) for item in article_descriptions["descriptions"]),
"Article image descriptions should include generation seeds",
)
assert_true(isinstance(article_descriptions["elapsed_ms"], int), "Article image descriptions should include elapsed_ms")
assert_true(article_descriptions["model"] == app.MODEL_MANIFEST["vision"]["id"], "Article image descriptions should report vision model id")
assert_true(article_descriptions["runtime"] == "fallback", "Article image descriptions should use fallback without MiniCPM config")
speech = app.speak_core("Tiny Narrator verification.", voice="af_heart", speed=1.0)
assert_true(speech["ok"], "Speech path did not return ok")
assert_true(isinstance(speech["elapsed_ms"], int), "Speech response should include elapsed_ms")
audio_path = ROOT / speech["audio_url"].lstrip("/")
assert_true(audio_path.exists(), f"Speech output missing: {audio_path}")
with wave.open(str(audio_path), "rb") as wav:
assert_true(wav.getframerate() == 24000, "Speech output should be 24 kHz")
assert_true(wav.getnchannels() == 1, "Speech output should be mono")
empty_speech = app.speak_core("", voice="af_heart", speed=1.0)
assert_true(empty_speech["runtime"] == "fallback", "Empty speech input should use fast fallback")
assert_true("empty" in empty_speech["warning"].lower(), "Empty speech input should explain why Kokoro was skipped")
generated = app.generate_image_core("Tiny accessibility article image.", seed=3)
assert_true(generated["ok"], "Image generation placeholder should return ok")
assert_true(isinstance(generated["elapsed_ms"], int), "Image generation should include elapsed_ms")
assert_true(generated["runtime"] == "fallback", "Image generation without Modal should report fallback runtime")
assert_true(generated["model"] == app.MODEL_MANIFEST["image_generation"]["id"], "Image generation should report Klein model id")
assert_true(generated["seed"] == 3, "Image generation should preserve the seed")
assert_true(generated["image_url"].startswith("/static/generated/"), "Fallback image should use bundled assets")
assert_true(generated.get("warning") is None, "Fallback without attempted call should have no warning")
generated_no_seed = app.generate_image_core("Another image prompt.", seed=None)
assert_true(generated_no_seed["ok"], "Image generation without seed should return ok")
assert_true(generated_no_seed["runtime"] == "fallback", "Image generation without Modal should report fallback")
assert_true(generated_no_seed["seed"] is None, "Image generation should pass through None seed")
article = app.generate_article_core("tiny classroom robotics")
assert_true(article["ok"], "Article generation should return ok")
assert_true(article["model"] == app.MODEL_MANIFEST["reader_brain"]["id"], "Article generation should use reader-brain model")
assert_true(len(article["article"]["sections"]) == 5, "Article generation should return five sections")
assert_true(
article["thumbnail"]["generation_model"] == app.MODEL_MANIFEST["image_generation"]["id"],
"Article generation should use the Klein image model for thumbnail receipt",
)
assert_true("No words" in article["thumbnail"]["prompt"], "Article thumbnail prompt should forbid unreadable generated text")
assert_true("no user interface" in article["thumbnail"]["prompt"], "Article thumbnail prompt should avoid UI screenshots")
assert_true("one centered cohesive scene" in article["thumbnail"]["prompt"], "Article thumbnail prompt should avoid sparse disconnected layouts")
def verify_modal_klein_integration() -> None:
"""Test Modal Klein integration with mocked HTTP responses."""
# Test: no endpoint configured returns deterministic fallback
with patch.object(app, "KLEIN_MODAL_ENDPOINT", ""):
result = app.generate_image_core("test prompt", seed=42)
assert_true(result["ok"], "No-endpoint fallback should return ok")
assert_true(result["runtime"] == "fallback", "No-endpoint should report fallback runtime")
assert_true(result["image_url"].startswith("/static/generated/"), "No-endpoint should use bundled assets")
assert_true(result["model"] == app.MODEL_MANIFEST["image_generation"]["id"], "Fallback should report Klein model")
# Test: configured endpoint returning valid JSON is surfaced as live Modal inference
mock_response_data = {
"ok": True,
"runtime": "modal-klein",
"model": "black-forest-labs/FLUX.2-klein-4B",
"image_url": "/media/klein-abc123.png",
"prompt": "test prompt",
"seed": 42,
"elapsed_ms": 5000,
}
mock_response = MagicMock()
mock_response.read.return_value = json.dumps(mock_response_data).encode("utf-8")
mock_response.__enter__ = lambda s: s
mock_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"):
with patch("urllib.request.urlopen", return_value=mock_response):
result = app.generate_image_core("test prompt", seed=42)
assert_true(result["ok"], "Modal success should return ok")
assert_true(result["runtime"] == "modal-klein", "Modal success should report modal-klein runtime")
assert_true(
result["image_url"] == "https://example-modal.modal.run/media/klein-abc123.png",
"Modal success should return full media URL",
)
assert_true(result["prompt"] == "test prompt", "Modal success should preserve prompt")
assert_true(result["seed"] == 42, "Modal success should preserve seed")
# Test: configured endpoint failure falls back with a visible warning
with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"):
with patch("urllib.request.urlopen", side_effect=TimeoutError("Connection timed out")):
result = app.generate_image_core("test prompt", seed=42)
assert_true(result["ok"], "Modal failure fallback should return ok")
assert_true(result["runtime"] == "fallback", "Modal failure should report fallback runtime")
assert_true(
result["image_url"].startswith("/static/generated/"),
"Modal failure should use bundled assets",
)
assert_true(
result.get("warning") is not None and "TimeoutError" in result["warning"],
"Modal failure should include a visible warning with the error class",
)
# Test: invalid Modal JSON response falls back instead of pretending success
invalid_response = MagicMock()
invalid_response.read.return_value = json.dumps({"ok": False, "error": "prompt is required"}).encode("utf-8")
invalid_response.__enter__ = lambda s: s
invalid_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"):
with patch("urllib.request.urlopen", return_value=invalid_response):
result = app.generate_image_core("test prompt", seed=42)
assert_true(result["runtime"] == "fallback", "Invalid Modal response should use fallback runtime")
assert_true(
result.get("warning") is not None and "ValueError" in result["warning"],
"Invalid Modal response should include a validation warning",
)
# Test: Modal worker static checks
worker_path = ROOT / "modal_workers" / "klein_image.py"
assert_true(worker_path.exists(), "Modal worker file should exist")
worker_source = worker_path.read_text(encoding="utf-8")
assert_true("modal.App" in worker_source, "Modal worker should create a Modal App")
assert_true("modal.Volume" in worker_source, "Modal worker should use a Modal Volume")
assert_true("FLUX.2-klein-4B" in worker_source, "Modal worker should reference the Klein model")
assert_true("Flux2KleinPipeline" in worker_source, "Modal worker should use the FLUX.2 Klein Diffusers pipeline")
assert_true("modal.asgi_app" in worker_source, "Modal worker should expose one ASGI app")
assert_true('@api.post("/generate")' in worker_source, "Modal worker should expose POST /generate")
assert_true('@api.get("/health")' in worker_source, "Modal worker should expose GET /health")
assert_true('@api.get("/media/{filename}")' in worker_source, "Modal worker should expose GET /media/{filename}")
assert_true("404" in worker_source or "not found" in worker_source.lower(), "Modal worker should handle missing media with 404")
assert_true("reload.aio()" in worker_source, "Modal worker should reload volume with async API before serving missing media")
assert_true("path.read_bytes()" in worker_source, "Modal worker should avoid streaming open files from the volume")
reader_worker_path = ROOT / "modal_workers" / "reader_brain.py"
assert_true(reader_worker_path.exists(), "Modal reader-brain worker file should exist")
reader_worker_source = reader_worker_path.read_text(encoding="utf-8")
assert_true("modal.web_server" in reader_worker_source, "Reader-brain worker should expose llama-server through Modal web_server")
assert_true("startup_timeout=600" in reader_worker_source, "Reader-brain worker should allow slow first llama.cpp model loads")
assert_true("ghcr.io/ggml-org/llama.cpp:server-cuda12" in reader_worker_source, "Reader-brain worker should use the prebuilt llama.cpp CUDA server image")
assert_true("ENTRYPOINT []" in reader_worker_source, "Reader-brain worker should clear the prebuilt image entrypoint for Modal's Python runner")
assert_true("GGML_CUDA=ON" not in reader_worker_source, "Reader-brain worker should not compile llama.cpp during Modal builds")
assert_true("cmake --build" not in reader_worker_source, "Reader-brain worker should avoid slow CMake builds on Modal")
assert_true("NVIDIA-Nemotron-3-Nano-4B-GGUF:Q4_K_M" in reader_worker_source, "Reader-brain worker should serve the Nemotron GGUF")
assert_true('"--reasoning"' in reader_worker_source and '"off"' in reader_worker_source, "Reader-brain worker should disable reasoning mode")
assert_true('"--ctx-size"' in reader_worker_source and '"4096"' in reader_worker_source, "Reader-brain worker should use T4-safe context size")
assert_true('"--parallel"' in reader_worker_source and '"1"' in reader_worker_source, "Reader-brain worker should use one parallel slot on T4")
assert_true('"--n-gpu-layers"' in reader_worker_source and '"999"' in reader_worker_source, "Reader-brain worker should request full GPU offload")
assert_true("modal.Volume" in reader_worker_source, "Reader-brain worker should cache model downloads in a Modal volume")
assert_true("tiny-narrator-reader-brain-token" in reader_worker_source, "Reader-brain worker should use a fixed Modal token secret")
assert_true('"--api-key"' in reader_worker_source, "Reader-brain worker should pass an API key to llama-server when configured")
assert_true('display_command[key_index] = "***"' in reader_worker_source, "Reader-brain worker should redact API keys in logs")
assert_true("_find_llama_server" in reader_worker_source, "Reader-brain worker should resolve the prebuilt llama-server binary path")
assert_true("/app/llama-server" in reader_worker_source, "Reader-brain worker should check the prebuilt image binary path")
assert_true("binary was not found" in reader_worker_source, "Reader-brain worker should fail with useful binary diagnostics")
# Test: reader-brain auth wiring sends bearer tokens when configured
model_response = MagicMock()
model_response.read.return_value = json.dumps({"data": [{"id": "narrator-brain"}]}).encode("utf-8")
model_response.__enter__ = lambda s: s
model_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "LLAMA_CPP_BASE_URL", "https://reader.example/v1"), patch.object(app, "LLAMA_CPP_TOKEN", "reader-secret"):
with patch("urllib.request.urlopen", return_value=model_response) as urlopen_mock:
app._runtime_status_core()
status_request = urlopen_mock.call_args.args[0]
assert_true(
status_request.headers.get("Authorization") == "Bearer reader-secret",
"Runtime status should send reader-brain Bearer token when LLAMA_CPP_TOKEN is configured",
)
chat_response = MagicMock()
chat_response.read.return_value = json.dumps({"choices": [{"message": {"content": "Heading. Token protected narration."}}]}).encode("utf-8")
chat_response.__enter__ = lambda s: s
chat_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "LLAMA_CPP_BASE_URL", "https://reader.example/v1"), patch.object(app, "LLAMA_CPP_TOKEN", "reader-secret"):
with patch("urllib.request.urlopen", return_value=chat_response) as urlopen_mock:
app.reader_brain_core("heading", "Token protected narration", "item 1 of 1", "narrate")
chat_request = urlopen_mock.call_args.args[0]
assert_true(
chat_request.headers.get("Authorization") == "Bearer reader-secret",
"Reader-brain requests should send Bearer token when LLAMA_CPP_TOKEN is configured",
)
# Test: auth wiring — app sends bearer token when configured
with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"), patch.object(app, "KLEIN_MODAL_TOKEN", "test-secret-token"):
with patch("urllib.request.urlopen", return_value=mock_response) as urlopen_mock:
app.generate_image_core("auth test", seed=1)
sent_request = urlopen_mock.call_args.args[0]
assert_true(
sent_request.headers.get("Authorization") == "Bearer test-secret-token",
"App should send Bearer token when KLEIN_MODAL_TOKEN is configured",
)
# Test: auth wiring — health check sends bearer token when configured
good_health = MagicMock()
good_health.read.return_value = json.dumps({"ok": True, "model": app.MODEL_MANIFEST["image_generation"]["id"], "runtime": "modal-klein"}).encode("utf-8")
good_health.__enter__ = lambda s: s
good_health.__exit__ = MagicMock(return_value=False)
with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"), patch.object(app, "KLEIN_MODAL_TOKEN", "test-secret-token"):
with patch("urllib.request.urlopen", return_value=good_health) as urlopen_mock:
app._runtime_status_core()
health_request = urlopen_mock.call_args.args[0]
assert_true(
health_request.headers.get("Authorization") == "Bearer test-secret-token",
"App should send Bearer token for health checks when KLEIN_MODAL_TOKEN is configured",
)
# Test: .env.example includes KLEIN_MODAL_TOKEN
env_example = (ROOT / ".env.example").read_text(encoding="utf-8")
assert_true("KLEIN_MODAL_TOKEN" in env_example, ".env.example should document KLEIN_MODAL_TOKEN")
assert_true("LLAMA_CPP_TOKEN" in env_example, ".env.example should document LLAMA_CPP_TOKEN")
# Test: worker validates token
assert_true("KLEIN_MODAL_TOKEN" in worker_source, "Modal worker should read KLEIN_MODAL_TOKEN")
assert_true("401" in worker_source, "Modal worker should reject unauthorized requests with 401")
assert_true("_check_token" in worker_source, "Modal worker should have a token validation helper")
assert_true(
"async def health(request: Request)" in worker_source,
"Modal worker health route should accept the request for token validation",
)
# Test: runtime setup does not expose the token value
with patch.object(app, "KLEIN_MODAL_TOKEN", "super-secret-value"):
setup = app.runtime_setup_core()
setup_json = json.dumps(setup)
assert_true("super-secret-value" not in setup_json, "Runtime setup must never expose the token value")
image_step = next(step for step in setup["steps"] if step["role"] == "image_generation")
assert_true(
"KLEIN_MODAL_TOKEN" in image_step["env"],
"Runtime setup should document KLEIN_MODAL_TOKEN",
)
assert_true(
image_step["env"]["KLEIN_MODAL_TOKEN"] == "(configured)",
"Runtime setup should show token as configured without exposing the value",
)
with patch.object(app, "LLAMA_CPP_TOKEN", "reader-super-secret"):
setup = app.runtime_setup_core()
setup_json = json.dumps(setup)
assert_true("reader-super-secret" not in setup_json, "Runtime setup must never expose the reader token value")
reader_step = next(step for step in setup["steps"] if step["role"] == "reader_brain")
assert_true("LLAMA_CPP_TOKEN" in reader_step["env"], "Runtime setup should document LLAMA_CPP_TOKEN")
assert_true(
reader_step["env"]["LLAMA_CPP_TOKEN"] == "(configured)",
"Runtime setup should show reader token as configured without exposing the value",
)
# Test: reader-brain runtime status exposes actionable health details without leaking tokens
with patch.object(app, "LLAMA_CPP_BASE_URL", "https://reader.example/v1"), patch.object(app, "LLAMA_CPP_TOKEN", "reader-secret"):
http_error = urllib.error.HTTPError(
"https://reader.example/v1/models",
401,
"Unauthorized",
{},
None,
)
http_error.fp = MagicMock()
http_error.fp.read.return_value = b'{"detail":"Unauthorized"}'
with patch("urllib.request.urlopen", side_effect=http_error) as urlopen_mock:
status = app._runtime_status_core()
reader_status = status["reader_brain"]
health_request = urlopen_mock.call_args.args[0]
assert_true(
health_request.headers.get("Authorization") == "Bearer reader-secret",
"Reader-brain health checks should send Bearer token when configured",
)
assert_true(
"HTTPError status=401" in reader_status["warning"],
"Reader-brain runtime warning should include HTTP status details",
)
assert_true(
"Unauthorized" in reader_status["warning"],
"Reader-brain runtime warning should include response body details",
)
assert_true(
"reader-secret" not in json.dumps(reader_status),
"Reader-brain runtime status should not expose token values",
)
assert_true(
reader_status["health_url"] == "https://reader.example/v1/models",
"Reader-brain runtime status should expose the health URL",
)
# Test: runtime status includes Modal Klein path
with patch.object(app, "KLEIN_MODAL_ENDPOINT", ""):
status = app._runtime_status_core()
assert_true("image_generation" in status, "Runtime status should include image_generation")
assert_true(
status["image_generation"]["status"] in {"online", "fallback-ready"},
"Image generation status should be online or fallback-ready",
)
assert_true(
status["image_generation"]["model"] == app.MODEL_MANIFEST["image_generation"]["id"],
"Image generation status should reference the Klein model",
)
# Test: invalid health payload is fallback-ready, not online
bad_health = MagicMock()
bad_health.read.return_value = json.dumps({"ok": True, "model": "wrong", "runtime": "modal-klein"}).encode("utf-8")
bad_health.__enter__ = lambda s: s
bad_health.__exit__ = MagicMock(return_value=False)
with patch.object(app, "KLEIN_MODAL_ENDPOINT", "https://example-modal.modal.run"):
with patch("urllib.request.urlopen", return_value=bad_health):
status = app._runtime_status_core()
assert_true(
status["image_generation"]["status"] == "fallback-ready",
"Invalid Modal health should not be marked online",
)
assert_true("ValueError" in status["image_generation"].get("warning", ""), "Invalid health should report validation warning")
# Test: runtime setup includes Modal deploy command
setup = app.runtime_setup_core()
image_step = next(step for step in setup["steps"] if step["role"] == "image_generation")
assert_true(
"modal deploy" in image_step["command"],
"Runtime setup should include modal deploy command for image generation",
)
assert_true(
"KLEIN_MODAL_ENDPOINT" in image_step["env"],
"Runtime setup should document KLEIN_MODAL_ENDPOINT",
)
def verify_minicpm_vision_integration() -> None:
with patch.object(app, "MINICPM_VISION_BASE_URL", ""), patch.object(app, "MINICPM_VISION_API_KEY", ""):
result = app.describe_image_core("model-map", caption=None, prompt=None)
assert_true(result["ok"], "No-config MiniCPM fallback should return ok")
assert_true(result["runtime"] == "fallback", "No-config MiniCPM should report fallback runtime")
assert_true(result["model"] == app.MODEL_MANIFEST["vision"]["id"], "No-config MiniCPM should report vision model")
assert_true(result.get("warning") is None, "No-config MiniCPM fallback should stay quiet")
mock_response_data = {
"choices": [
{
"message": {
"content": "A compact diagram shows four small AI models connected around an accessibility reader."
}
}
]
}
mock_response = MagicMock()
mock_response.read.return_value = json.dumps(mock_response_data).encode("utf-8")
mock_response.__enter__ = lambda s: s
mock_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
with patch("urllib.request.urlopen", return_value=mock_response) as urlopen_mock:
result = app.describe_image_core("model-map", caption="diagram", prompt="model map", image_url="/static/generated/model-map.svg")
assert_true(result["ok"], "Live MiniCPM response should return ok")
assert_true(result["runtime"] == "minicpm-v4.6", "Live MiniCPM response should report runtime")
assert_true(result["model"] == app.MINICPM_VISION_MODEL, "Live MiniCPM response should report configured model")
assert_true("accessibility reader" in result["alt_text"], "Live MiniCPM response should use returned alt text")
request = urlopen_mock.call_args.args[0]
assert_true(
request.full_url == "https://vision.example/v1/chat/completions",
"MiniCPM client should normalize base URL to chat completions",
)
assert_true(
request.headers.get("Authorization") == "Bearer secret-key",
"MiniCPM client should send bearer auth",
)
with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
with patch.object(app, "PUBLIC_BASE_URL", "https://tiny.example"):
with patch("urllib.request.urlopen", return_value=mock_response) as urlopen_mock:
result = app.describe_image_core("model-map", caption="diagram", prompt="model map")
assert_true(result["runtime"] == "minicpm-v4.6", "Default MiniCPM image-id path should use live response")
request = urlopen_mock.call_args.args[0]
request_body = json.loads(request.data.decode("utf-8"))
image_part = request_body["messages"][0]["content"][1]
assert_true(
image_part["image_url"]["url"].startswith("data:image/png;base64,"),
"MiniCPM default article image path should inline PNG companion assets",
)
assert_true(
"https://tiny.example" not in image_part["image_url"]["url"],
"MiniCPM default article image path should not depend on public URL fetching",
)
invalid_response = MagicMock()
invalid_response.read.return_value = json.dumps({"choices": [{"message": {"content": ""}}]}).encode("utf-8")
invalid_response.__enter__ = lambda s: s
invalid_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example"):
with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
with patch("urllib.request.urlopen", return_value=invalid_response):
result = app.describe_image_core("custom", caption="fallback caption", prompt=None, image_url="https://example.com/image.png")
assert_true(result["runtime"] == "fallback", "Invalid MiniCPM response should fall back")
assert_true(result["alt_text"] == "fallback caption", "Invalid MiniCPM response should preserve fallback text")
assert_true(
result.get("warning") is not None and "ValueError" in result["warning"],
"Invalid MiniCPM response should include validation warning",
)
models_response = MagicMock()
models_response.read.return_value = json.dumps({"data": [{"id": app.MINICPM_VISION_MODEL}]}).encode("utf-8")
models_response.__enter__ = lambda s: s
models_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
with patch("urllib.request.urlopen", return_value=models_response):
status = app._vision_runtime_status()
assert_true(status["status"] == "online", "MiniCPM /models response should mark vision online")
assert_true("secret-key" not in json.dumps(status), "Vision runtime status should not expose API key")
ready_response = MagicMock()
ready_response.read.return_value = json.dumps({"choices": [{"message": {"content": "ready"}}]}).encode("utf-8")
ready_response.__enter__ = lambda s: s
ready_response.__exit__ = MagicMock(return_value=False)
with patch.object(app, "MINICPM_VISION_BASE_URL", "https://vision.example/v1"):
with patch.object(app, "MINICPM_VISION_API_KEY", "secret-key"):
with patch("urllib.request.urlopen", side_effect=[urllib.error.HTTPError("https://vision.example/v1/models", 404, "Not Found", {}, None), ready_response]):
status = app._vision_runtime_status()
assert_true(status["status"] == "online", "MiniCPM chat completions readiness should mark vision online when /models is unavailable")
assert_true("chat completions ready" in status.get("warning", ""), "Vision status should explain chat-completions readiness fallback")
setup = app.runtime_setup_core()
vision_step = next(step for step in setup["steps"] if step["role"] == "vision")
assert_true("MiniCPM-V-4.6" in vision_step["model"], "Runtime setup should document MiniCPM-V-4.6")
assert_true("MINICPM_VISION_BASE_URL" in vision_step["env"], "Runtime setup should document MiniCPM base URL")
assert_true("secret" not in json.dumps(vision_step).lower(), "Runtime setup should not expose MiniCPM API key")
def verify_output_retention() -> None:
keep_path = app.OUTPUT_DIR / "speech-retention-keep.wav"
_ = app.speak_core("Tiny Narrator retention check.", voice="af_heart", speed=1.0)
keep_path.write_bytes(b"keep")
stale_files = []
for index in range(30):
stale_path = app.OUTPUT_DIR / f"speech-retention-stale-{index:02d}.wav"
stale_path.write_bytes(b"stale")
stale_files.append(stale_path)
app._prune_speech_outputs(keep_path, max_files=4)
remaining = list(app.OUTPUT_DIR.glob("speech*.wav"))
assert_true(keep_path.exists(), "Speech retention should keep the active output")
assert_true(len(remaining) <= 5, "Speech retention should prune stale generated audio")
keep_path.unlink(missing_ok=True)
for stale_path in stale_files:
stale_path.unlink(missing_ok=True)
def verify_routes() -> None:
client = TestClient(app.app)
home = client.get("/")
assert_true(home.status_code == 200, "Home route should return 200")
assert_true("Tiny Narrator" in home.text, "Home route should include app title")
assert_true('href="/generate">Generate' in home.text, "Home route should link to Generate route")
assert_true("readerToggle" in home.text, "Home route should include reader toggle")
assert_true("summaryButton" in home.text, "Home route should include summary control")
assert_true("imageStatus" in home.text, "Home route should include image status")
assert_true("voiceStatus" in home.text, "Home route should include voice status")
assert_true("latencyStatus" in home.text, "Home route should include latency status")
assert_true("voiceControl" in home.text, "Home route should include voice control")
assert_true("speedValue" in home.text, "Home route should include speed value output")
assert_true("autoAdvanceControl" in home.text, "Home route should include auto-advance control")
assert_true("transcriptLog" in home.text, "Home route should include transcript log")
assert_true("readerQueueList" not in home.text, "Home route should not include reader queue list")
assert_true("modelBudgetStatus" in home.text, "Home route should include model stack status")
assert_true("modelStackList" in home.text, "Home route should include model stack list")
assert_true("/evidence" not in home.text, "Home route should not link to a removed evidence page")
assert_true("copyEvidenceButton" not in home.text, "Home route should keep judge evidence off the reader sidebar")
generate_page = client.get("/generate")
assert_true(generate_page.status_code == 200, "Generate route should return 200")
assert_true("Generate a readable article" in generate_page.text, "Generate route should include generator title")
assert_true("articleGeneratorForm" in generate_page.text, "Generate route should include article generator form")
assert_true("generatedThumbnail" in generate_page.text, "Generate route should include generated thumbnail")
assert_true("readerToggle" in generate_page.text, "Generate route should include reader toggle")
assert_true("summaryButton" in generate_page.text, "Generate route should include summary control")
assert_true("transcriptLog" in generate_page.text, "Generate route should include transcript log")
assert_true("speechAudio" in generate_page.text, "Generate route should include speech playback")
health = client.get("/api/health")
assert_true(health.status_code == 200, "Health route should return 200")
payload = health.json()
assert_true(payload["ok"], "Health payload should be ok")
assert_true(payload["public_base_url"] == app.PUBLIC_BASE_URL, "Health route should expose the public command base URL")
assert_true(
payload["models"]["reader_brain"]["runtime"] == "llama.cpp",
"Health route should document llama.cpp reader-brain runtime",
)
manifest = client.get("/api/article-manifest")
assert_true(manifest.status_code == 200, "Article manifest route should return 200")
manifest_payload = manifest.json()
assert_true("Tiny Titan" in manifest_payload["bonus_targets"], "Manifest should include Tiny Titan target")
reader_controls = manifest_payload["reader_controls"]
summary_shortcut = next((item for item in reader_controls if item["key"] == "S"), None)
assert_true(summary_shortcut is not None, "Manifest should include summary shortcut")
assert_true(
summary_shortcut["action"] == "Summarize current section"
and summary_shortcut["aria_keyshortcuts"] == "S",
"Manifest summary shortcut should include action and aria-keyshortcuts value",
)
assert_true(
{item["aria_keyshortcuts"] for item in reader_controls} >= {"Space", "N", "P", "H", "I", "S", "R", "Escape"},
"Manifest should expose aria-keyshortcuts values for reader controls",
)
assert_true(
manifest_payload["models"]["speech"]["id"] == "hexgrad/Kokoro-82M",
"Manifest should document Kokoro speech model",
)
assert_true(
manifest_payload["reader_settings"]["default_voice"] == "af_heart",
"Manifest should document default Kokoro voice",
)
assert_true(
len(manifest_payload["reader_settings"]["voices"]) >= 4,
"Manifest should expose multiple Kokoro voice choices",
)
assert_true(
manifest_payload["reader_settings"]["default_auto_advance"] is False,
"Manifest should default auto-advance off",
)
assert_true(
len(manifest_payload["award_evidence"]) == 4,
"Manifest should expose four award evidence items",
)
assert_true(
manifest_payload["model_budget"]["all_models_within_limit"],
"Manifest should prove every model is within the Tiny Titan limit",
)
assert_true(
len(manifest_payload["runtime_setup"]["steps"]) == 4,
"Manifest should expose setup steps for each model role",
)
assert_true(
len(manifest_payload["demo_script"]["actions"]) >= 4,
"Manifest should expose a judge demo script",
)
assert_true(
manifest_payload["accessibility_audit"]["all_passed"],
"Manifest should expose passing accessibility audit evidence",
)
awards = client.get("/api/award-evidence")
assert_true(awards.status_code == 200, "Award evidence route should return 200")
award_payload = awards.json()
assert_true(award_payload["ok"], "Award evidence payload should be ok")
assert_true(
{item["id"] for item in award_payload["items"]} == {"tiny-titan", "llama-champion", "off-brand", "field-notes"},
"Award evidence route should cover the targeted bonuses",
)
budget = client.get("/api/model-budget")
assert_true(budget.status_code == 200, "Model budget route should return 200")
budget_payload = budget.json()
assert_true(budget_payload["ok"], "Model budget payload should be ok")
assert_true(budget_payload["limit_billion"] == 4.0, "Tiny Titan limit should be 4B")
assert_true(budget_payload["all_models_within_limit"], "All models should stay within the Tiny Titan limit")
assert_true(
all(item["params_billion"] <= budget_payload["limit_billion"] for item in budget_payload["models"]),
"Every model budget item should be at or below the limit",
)
setup = client.get("/api/runtime-setup")
assert_true(setup.status_code == 200, "Runtime setup route should return 200")
setup_payload = setup.json()
assert_true(setup_payload["ok"], "Runtime setup payload should be ok")
assert_true(
{item["role"] for item in setup_payload["steps"]}
== {"reader_brain", "speech", "vision", "image_generation"},
"Runtime setup should cover every model path",
)
assert_true(
"llama-server" in setup_payload["steps"][0]["command"],
"Runtime setup should include the llama.cpp launch command",
)
assert_true(
setup_payload["steps"][0]["modal_command"] == "modal deploy modal_workers/reader_brain.py",
"Runtime setup should include the Modal reader-brain deploy command",
)
assert_true(
"--reasoning off" in setup_payload["steps"][0]["command"],
"Runtime setup should document non-reasoning llama.cpp mode",
)
assert_true(
setup_payload["app"]["env"]["PUBLIC_BASE_URL"] == app.PUBLIC_BASE_URL,
"Runtime setup should expose the public command base URL",
)
demo = client.get("/api/demo-script")
assert_true(demo.status_code == 200, "Demo script route should return 200")
demo_payload = demo.json()
assert_true(demo_payload["ok"], "Demo script payload should be ok")
assert_true(
"Tiny Narrator judge demo" == demo_payload["title"],
"Demo script should be labeled for judging",
)
assert_true(
{item["path"] for item in demo_payload["api_checks"]} >= {"/api/model-budget", "/api/runtime-setup"},
"Demo script should include evidence API checks",
)
assert_true(
any("Tiny Titan" in action["evidence"] for action in demo_payload["actions"]),
"Demo script should point to targeted award evidence",
)
assert_true(
any(item["path"] == "/api/accessibility-audit" for item in demo_payload["api_checks"]),
"Demo script should include the accessibility audit check",
)
assert_true(
any(item["path"] == "/api/submission-readiness" for item in demo_payload["api_checks"]),
"Demo script should include the submission readiness check",
)
reader_check = next(item for item in demo_payload["api_checks"] if item["path"] == "/api/reader-brain")
speech_check = next(item for item in demo_payload["api_checks"] if item["path"] == "/api/speak")
assert_true(reader_check["sample_body"]["mode"] == "narrate", "Reader-brain demo check should include a sample body")
assert_true(
speech_check["sample_body"]["voice"] == app.READER_SETTINGS["default_voice"],
"Speech demo check should use the default reader voice",
)
assert_true(
all(item.get("sample_body") for item in demo_payload["api_checks"] if item["method"] == "POST"),
"Every POST demo check should include an executable sample body",
)
assert_true(
all(item["curl"].startswith("curl ") for item in demo_payload["api_checks"]),
"Every demo API check should include a curl command",
)
assert_true(
all(app.PUBLIC_BASE_URL in item["curl"] for item in demo_payload["api_checks"]),
"Every curl command should use the public command base URL",
)
assert_true(
all(item["powershell"].startswith("curl.exe ") for item in demo_payload["api_checks"]),
"Every demo API check should include a PowerShell-friendly curl.exe command",
)
assert_true(
all(app.PUBLIC_BASE_URL in item["powershell"] for item in demo_payload["api_checks"]),
"Every PowerShell command should use the public command base URL",
)
assert_true(
"-d '" in reader_check["curl"] and "/api/reader-brain" in reader_check["curl"],
"Reader-brain curl command should include the sample JSON body",
)
assert_true(
'\\"node_type\\"' in reader_check["powershell"] and "/api/reader-brain" in reader_check["powershell"],
"Reader-brain PowerShell command should include escaped sample JSON",
)
reader_sample = client.post(reader_check["path"], json=reader_check["sample_body"])
assert_true(reader_sample.status_code == 200, "Reader-brain sample payload should be executable")
reader_sample_payload = reader_sample.json()
assert_true(reader_sample_payload["ok"], "Reader-brain sample payload should return ok")
assert_true("narration" in reader_sample_payload, "Reader-brain sample payload should return narration")
speech_sample = client.post(speech_check["path"], json=speech_check["sample_body"])
assert_true(speech_sample.status_code == 200, "Speech sample payload should be executable")
speech_sample_payload = speech_sample.json()
assert_true(speech_sample_payload["ok"], "Speech sample payload should return ok")
assert_true(
speech_sample_payload["audio_url"].startswith("/outputs/"),
"Speech sample payload should return an output audio URL",
)
article_sample = client.post("/api/generate-article", json={"topic": "accessible classroom robotics"})
assert_true(article_sample.status_code == 200, "Article generation route should return 200")
article_sample_payload = article_sample.json()
assert_true(article_sample_payload["ok"], "Article generation payload should return ok")
assert_true(len(article_sample_payload["article"]["sections"]) == 5, "Article generation payload should include five sections")
assert_true(
article_sample_payload["thumbnail"]["generation_model"] == app.MODEL_MANIFEST["image_generation"]["id"],
"Article generation payload should include Klein thumbnail provenance",
)
audit = client.get("/api/accessibility-audit")
assert_true(audit.status_code == 200, "Accessibility audit route should return 200")
audit_payload = audit.json()
assert_true(audit_payload["ok"], "Accessibility audit payload should be ok")
assert_true(audit_payload["all_passed"], "Accessibility audit should pass")
assert_true(audit_payload["passed_checks"] == audit_payload["total_checks"], "All audit checks should pass")
assert_true(
{item["id"] for item in audit_payload["checks"]}
>= {
"semantic_queue",
"keyboard_navigation",
"reader_cursor",
"shortcut_safety",
"live_region",
"image_alt_text",
"inspectable_transcript",
},
"Accessibility audit should cover reader semantics, keyboard use, cursor state, shortcut safety, live narration, alt text, and transcript",
)
readiness = client.get("/api/submission-readiness")
assert_true(readiness.status_code == 200, "Submission readiness route should return 200")
readiness_payload = readiness.json()
assert_true(readiness_payload["ok"], "Submission readiness payload should be ok")
assert_true(readiness_payload["all_passed"], "Submission readiness checks should pass")
assert_true(
{item["id"] for item in readiness_payload["checks"]}
>= {
"tiny_titan_budget",
"award_targets",
"custom_frontend",
"runtime_setup",
"runtime_status",
"reader_accessibility",
"image_receipts",
"demo_api_checks",
"command_base_url",
},
"Submission readiness should aggregate model, award, frontend, runtime, accessibility, image, and demo evidence",
)
runtime_status_check = next(item for item in readiness_payload["checks"] if item["id"] == "runtime_status")
assert_true(runtime_status_check["status"] == "pass", "Submission readiness should pass runtime status checks")
demo_api_check = next(item for item in readiness_payload["checks"] if item["id"] == "demo_api_checks")
assert_true(demo_api_check["status"] == "pass", "Submission readiness should pass executable demo API checks")
command_base_check = next(item for item in readiness_payload["checks"] if item["id"] == "command_base_url")
assert_true(command_base_check["status"] == "pass", "Submission readiness should pass command base URL checks")
evidence = client.get("/api/evidence-bundle")
assert_true(evidence.status_code == 200, "Evidence bundle route should return 200")
evidence_payload = evidence.json()
assert_true(evidence_payload["ok"], "Evidence bundle payload should be ok")
assert_true(evidence_payload["schema_version"] == "1.0", "Evidence bundle should include schema version")
assert_true(evidence_payload["generated_at"].endswith("Z"), "Evidence bundle should include UTC timestamp")
assert_true(evidence_payload["public_base_url"] == app.PUBLIC_BASE_URL, "Evidence bundle should include public base URL")
assert_true(evidence_payload["submission_readiness"]["all_passed"], "Evidence bundle should include passing readiness")
assert_true(evidence_payload["model_budget"]["all_models_within_limit"], "Evidence bundle should include Tiny Titan proof")
assert_true(
{"runtime_status", "demo_script", "accessibility_audit", "image_descriptions"} <= set(evidence_payload),
"Evidence bundle should include runtime status, demo script, accessibility audit, and image descriptions",
)
assert_true(evidence_payload["runtime_status"]["ok"], "Evidence bundle should include ok runtime status")
assert_true(
{"reader_brain", "speech", "image_generation"} <= set(evidence_payload["runtime_status"]),
"Evidence bundle runtime status should include reader brain, speech, and image generation status",
)
assert_true(
evidence_payload["runtime_status"]["reader_brain"]["status"] in {"online", "fallback-ready"},
"Evidence bundle reader brain status should be online or fallback-ready",
)
assert_true(
evidence_payload["runtime_status"]["speech"]["status"] in {"online", "fallback-ready"},
"Evidence bundle speech status should be online or fallback-ready",
)
assert_true(
evidence_payload["runtime_status"]["image_generation"]["status"] in {"online", "fallback-ready"},
"Evidence bundle image generation status should be online or fallback-ready",
)
runtime = client.get("/api/runtime-status")
assert_true(runtime.status_code == 200, "Runtime status route should return 200")
runtime_payload = runtime.json()
assert_true(runtime_payload["ok"], "Runtime status payload should be ok")
assert_true("reader_brain" in runtime_payload, "Runtime status should include reader brain status")
assert_true("speech" in runtime_payload, "Runtime status should include speech status")
assert_true("image_generation" in runtime_payload, "Runtime status should include image generation status")
assert_true(
runtime_payload["reader_brain"]["status"] in {"online", "fallback-ready"},
"Reader brain status should be online or fallback-ready",
)
assert_true(
runtime_payload["image_generation"]["status"] in {"online", "fallback-ready"},
"Image generation status should be online or fallback-ready",
)
assert_true(
runtime_payload["image_generation"]["model"] == app.MODEL_MANIFEST["image_generation"]["id"],
"Image generation status should reference the Klein model",
)
image_descriptions = client.get("/api/image-descriptions")
assert_true(image_descriptions.status_code == 200, "Image descriptions route should return 200")
image_payload = image_descriptions.json()
assert_true(image_payload["model"] == app.MODEL_MANIFEST["vision"]["id"], "Image route should document MiniCPM-V model")
assert_true(image_payload["runtime"] == "fallback", "Image route should use fallback runtime without MiniCPM config")
assert_true(
{item["id"] for item in image_payload["descriptions"]} == {"desk-reader", "model-map"},
"Image route should describe all visible article images",
)
assert_true(
all(item["generation_model"] == app.MODEL_MANIFEST["image_generation"]["id"] for item in image_payload["descriptions"]),
"Image route should expose image-generation provenance",
)
assert_true(
all(item["generation_status"] == "fallback-ready" for item in image_payload["descriptions"]),
"Image route should label bundled image fallback status",
)
# Verify generate-image endpoint returns fallback when Modal is not configured
gen_image = client.post("/api/generate-image", json={"prompt": "test thumbnail", "seed": 7})
assert_true(gen_image.status_code == 200, "Generate image route should return 200")
gen_image_payload = gen_image.json()
assert_true(gen_image_payload["ok"], "Generate image payload should be ok")
assert_true(gen_image_payload["model"] == app.MODEL_MANIFEST["image_generation"]["id"], "Generate image should report Klein model")
assert_true(gen_image_payload["runtime"] == "fallback", "Generate image without Modal should report fallback")
assert_true(isinstance(gen_image_payload["elapsed_ms"], int), "Generate image should include elapsed_ms")
def main() -> None:
py_compile.compile(str(ROOT / "app.py"), doraise=True)
py_compile.compile(str(ROOT / "modal_workers" / "klein_image.py"), doraise=True)
py_compile.compile(str(ROOT / "modal_workers" / "reader_brain.py"), doraise=True)
verify_static_assets()
verify_space_metadata()
verify_dotenv_wiring()
verify_live_smoke_script()
verify_core_fallbacks()
verify_modal_klein_integration()
verify_minicpm_vision_integration()
verify_output_retention()
verify_routes()
print("Tiny Narrator verification passed.")
if __name__ == "__main__":
main()