Spaces:

rohitsar567
/

InsuranceBot

Sleeping

App Files Files Community

InsuranceBot / backend /main.py

rohitsar567

feat(single_brain): wire view_context → ACTIVE POLICY DIVE-IN block (KI-330)

2a58c28 about 1 month ago

Raw

History Blame Contribute Delete

227 kB

	"""FastAPI app — the backend API for the Insurance Sales Portfolio Expert.

	Run locally:
	uvicorn backend.main:app --reload --host 0.0.0.0 --port 8000

	Interactive docs at http://localhost:8000/docs
	"""

	from __future__ import annotations

	import asyncio
	import base64
	import json
	import logging
	import re
	import time
	import uuid
	from pathlib import Path
	from typing import Optional

	from fastapi import FastAPI, File, Form, Header, HTTPException, Request, UploadFile
	from fastapi.exceptions import RequestValidationError
	from fastapi.middleware.cors import CORSMiddleware
	from fastapi.responses import FileResponse, JSONResponse
	from fastapi.staticfiles import StaticFiles
	from pydantic import BaseModel, Field, field_validator

	from backend.config import settings
	from backend import nim_fallback
	from backend import brain_tools # KI-271 — SLOT_UNION-driven profile_dict in 3 endpoints
	from backend import sum_insured as _si # SI rationalisation (D1/D3) — source-quote corroboration
	from backend.providers.sarvam_stt import SarvamSTT
	from backend.providers.sarvam_tts import SarvamTTS

	# Feature flag for the single-LLM brain. It is off unless the
	# USE_SINGLE_BRAIN environment variable holds one of the truthy tokens
	# below (compared case-insensitively). When on, /api/chat runs
	# single_brain.handle_turn and can drop to
	# nim_fallback.handle_turn_fallback on SingleBrainError; when off,
	# /api/chat routes directly through nim_fallback.handle_turn_fallback.
	import os as _os  # aliased so a later plain `import os` is not stomped

	USE_SINGLE_BRAIN = (
	    _os.getenv("USE_SINGLE_BRAIN", "false").lower()
	    in {"1", "true", "yes", "on"}
	)

	# Safety net for RULE 7. If Gemini does not call mark_recommendation when
	# the user clearly commits to a policy ("I'll go with that one", "let's do
	# #2", "buy this"), the post-turn detector auto-calls mark_recommendation
	# against session.last_recommendation_ids[:1] so the closure event is
	# recorded for analytics.
	#
	# The phrases are alternatives separated by a plain `|`. An escaped `\|`
	# would match a literal pipe character and turn the whole group into one
	# long literal that no real utterance contains. The group is anchored on
	# word boundaries and matched case-insensitively.
	_CLOSER_KEYWORD_RE = re.compile(
	    r"\b(go with|i'?ll take|i will take|let'?s do|let me get|sign me up|"
	    r"purchase|buy this|i want to purchase|i'?ll go with|i want to buy)\b",
	    re.IGNORECASE,
	)

	# Process-wide provider singletons; each stays None until its accessor
	# below is called for the first time.
	_stt: Optional[SarvamSTT] = None
	_tts: Optional[SarvamTTS] = None


	def get_stt() -> SarvamSTT:
	    """Return the shared SarvamSTT instance, creating it on first use."""
	    global _stt
	    if _stt is not None:
	        return _stt
	    _stt = SarvamSTT()
	    return _stt


	def get_tts() -> SarvamTTS:
	    """Return the shared SarvamTTS instance, creating it on first use."""
	    global _tts
	    if _tts is not None:
	        return _tts
	    _tts = SarvamTTS()
	    return _tts


	# ---------- log helpers ----------

	# Turn logs live in a "logs" directory two levels above settings.CORPUS_DIR.
	LOG_DIR = settings.CORPUS_DIR.parent.parent / "logs"
	# Created at import time if absent (parent directories are not created).
	LOG_DIR.mkdir(exist_ok=True)
	# JSON-lines file that log_turn appends to.
	TURNS_LOG = LOG_DIR / "turns.jsonl"


	def log_turn(event: dict) -> None:
	    """Append `event` to TURNS_LOG as a single JSON line.

	    A UTC timestamp is stored under the `ts` key first; note that this
	    writes into the caller's dict rather than a copy.
	    """
	    event["ts"] = time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime())
	    with open(TURNS_LOG, "a") as sink:
	        sink.write(f"{json.dumps(event)}\n")


	# ---------- API schemas ----------

	# Response body of GET /api/health.
	class HealthResponse(BaseModel):
	# "ok" when settings.validate() reports nothing missing, else "degraded".
	status: str
	# Provider name -> whether its API key setting is non-empty.
	providers_ok: dict[str, bool]
	# The value returned by settings.validate() (presumably the names of the
	# missing settings — confirm against backend.config).
	missing_keys: list[str]


	# Response body of POST /api/transcribe, used for both success and failure.
	class TranscribeResponse(BaseModel):
	# Transcribed text; empty string on the failure path.
	text: str
	language_code: Optional[str] = None
	confidence: Optional[float] = None
	# Wall-clock time spent in the endpoint, in milliseconds.
	latency_ms: int
	# KI-242 — When Sarvam STT fails, the endpoint returns HTTP 200 with
	# `text=""` plus these two fields set so the frontend can render a
	# friendly message instead of parsing raw httpx error strings.
	# error_code is a closed enum: rate_limit | service_unavailable |
	# network | auth | unknown. Absent on the success path.
	error_code: Optional[str] = None
	user_message: Optional[str] = None


	# One source citation attached to a chat reply (see ChatResponse.citations).
	# NOTE(review): the code that fills these fields is outside the visible
	# part of the file; page numbering base and the meaning/range of `score`
	# should be confirmed against the retrieval code.
	class CitationOut(BaseModel):
	policy_id: str
	policy_name: str
	insurer_slug: str
	page_start: int
	page_end: int
	source_url: str
	score: float


	# Request body of POST /api/chat. Only user_text is required; a missing
	# session_id is replaced by a fresh UUID inside the chat endpoint.
	class ChatRequest(BaseModel):
	user_text: str = Field(..., description="The user's question or utterance")
	session_id: Optional[str] = Field(None, description="Stable per-session ID for logging")
	chat_history: list[dict] = Field(default_factory=list, description="[{role, content}, ...]")
	profile: dict = Field(default_factory=dict, description="User profile (age, dependents, etc.)")
	policy_filter_ids: Optional[list[str]] = Field(None, description="Restrict retrieval to these policies")
	return_audio: bool = Field(False, description="If true, also return TTS audio (base64 WAV)")
	tts_language_code: str = Field("en-IN", description="Language for TTS playback")
	# Forwarded to single_brain.handle_turn by the chat endpoint (an empty
	# dict is passed on as None).
	view_context: Optional[dict] = Field(
	None,
	description=(
	"Frontend-supplied snapshot of what the user is looking at right now: "
	"{active_view, active_policy_id, filters}. Injected into the system prompt "
	"so the bot can ground 'this policy' / 'these filters' references."
	),
	)


	# Response envelope of POST /api/chat. The RequestValidationError handler
	# in this file hand-builds a dict of the same shape for malformed chat
	# requests, so new required fields must be mirrored there.
	class ChatResponse(BaseModel):
	reply_text: str
	citations: list[CitationOut]
	# Identifier of the brain/path that produced the reply, e.g.
	# "error_fallback" or "single_brain::sticky_graceful_retry".
	brain_used: str
	intent: str
	language: str
	latency_ms: int
	session_id: str
	audio_base64: Optional[str] = None
	audio_mime: Optional[str] = None # X8 — "audio/wav" | "audio/mp4" | "audio/webm"
	# TTS voice-output failures are surfaced to the client (text reply is
	# unaffected): the frontend renders a small inline "voice unavailable"
	# notice under the bot bubble. tts_error_code is a closed enum mirroring
	# the STT path's contract so the client never parses raw httpx text:
	# rate_limit — Sarvam 429 / insufficient_quota / no credits
	# service_unavailable — Sarvam 5xx / 503
	# auth — Sarvam 401/403 / missing SARVAM_API_KEY
	# network — connect/read timeout, DNS, conn reset
	# unknown — anything else
	tts_error_code: Optional[str] = None
	tts_user_message: Optional[str] = None
	faithfulness_passed: bool = True
	faithfulness_reasons: list[str] = Field(default_factory=list)
	blocked: bool = False
	profile_updates: dict = Field(
	default_factory=dict,
	description=(
	"Any profile fields auto-extracted from the user's free-form message "
	"this turn (age, dependents, health_conditions, etc.). Frontend can "
	"flash an acknowledgment + refresh the completeness panel."
	),
	)
	# Whether the 7 required profile slots are captured. Surfaced in the
	# primary chat response so the UI can flip to 100% in the same render
	# cycle without a second roundtrip to /api/profile/completeness.
	# Computed via brain_tools._REQUIRED_FOR_READY (same slot list used by
	# retrieve_policies' profile-complete gate) so client + server never
	# disagree.
	profile_complete: bool = Field(
	False,
	description=(
	"True when every required profile slot (name, age, dependents, "
	"location_tier, income_band, primary_goal, health_conditions) is "
	"non-empty on the live session.profile at end-of-turn."
	),
	)
	# KI-Z7 (2026-05-15) — Feature B. True when single_brain.handle_turn's
	# turn-1 name heuristic matched a stored profile and hydrated the
	# session. Frontend renders a "Welcome back, <name>!" banner with the
	# last predicted-premium band when this flips True on the first turn.
	# NOTE(review): a later comment in this file says cross-session recall
	# was removed in ADR-043 — confirm whether this is still ever set True.
	returning_user_recalled: bool = Field(
	False,
	description=(
	"True iff a stored named-profile was matched + hydrated on the "
	"current turn (typically only on turn 1)."
	),
	)


	# Request body for text-to-speech synthesis.
	# NOTE(review): the endpoint consuming this model is outside the visible
	# part of the file.
	class TTSRequest(BaseModel):
	# Text to synthesise.
	text: str
	# Playback language; defaults to Indian English.
	language_code: str = "en-IN"
	# Optional voice selection; None presumably means the provider default.
	speaker: Optional[str] = None


	# One policy listed under an insurer (see InsurerCoverage.sample_policies).
	class PolicyEntry(BaseModel):
	name: str
	source_url: str = "" # PDF URL, verified at download time


	# Per-insurer entry of CoverageResponse.insurers.
	class InsurerCoverage(BaseModel):
	slug: str
	name: str
	home_url: str # insurer's main website (manually curated, verified)
	policy_count: int
	sample_policies: list[PolicyEntry]
	# KI-141 (2026-05-15) — backward-compatible default empty. Per-product
	# alias list isn't actually surfaced on the coverage card today, but the
	# field is mirrored from MarketplacePolicy so callers that union the two
	# endpoints see a consistent schema. Total aliases collapsed into this
	# insurer's parents — useful for QA + future UI surfacing.
	alias_count: int = 0


	# Corpus coverage summary: overall totals plus one entry per insurer.
	class CoverageResponse(BaseModel):
	total_chunks: int
	total_policies: int
	# KI-130 (2026-05-15) — totals reflect REAL insurers and their products
	# ONLY. The 'regulatory' slug (18 IRDAI/NHA documents) is excluded from
	# the marketplace surface entirely; those documents are still retrieved
	# and cited inside chat answers, they just don't belong in a "policy
	# marketplace" UI.
	total_insurers: int
	insurers: list[InsurerCoverage]


	# Result of a user PDF upload. Either describes the newly indexed document
	# or, when already_in_catalogue is True, points at the existing policy.
	class UploadResponse(BaseModel):
	policy_id: str
	policy_name: str
	chunks_added: int
	pages_indexed: int
	elapsed_ms: int
	# #47 (2026-05-21) — UIN net-new dedup. When the uploaded PDF's IRDAI
	# UIN already belongs to a catalogue policy, the upload is NOT indexed
	# as a new card; these fields point the caller at the existing policy.
	already_in_catalogue: bool = False
	existing_policy_id: Optional[str] = None
	existing_policy_name: Optional[str] = None


	# ---------------------------------------------------------------------------
	# #47 (2026-05-21) — UIN net-new dedup for user uploads. Before a freshly
	# uploaded PDF is indexed as a brand-new marketplace card, check whether its
	# IRDAI UIN already belongs to a catalogued policy; if so it is NOT net-new
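	# and the caller is pointed at the existing card. All imports used by the
	# helpers below are lazy (function-scope), matching the upload route, which
	# imports `re` locally; `re` is nevertheless also imported at module level
	# at the top of this file.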
	# Modern-format IRDAI UIN: 5-9 letters, 5 digits, "V", 6 digits, delimited
	# by word boundaries.
	_UIN_PATTERN = r"\b[A-Z]{5,9}\d{5}V\d{6}\b"
	# Memoised UIN -> (policy_id, policy_name) map; None until first built.
	_catalogue_uin_cache: Optional[dict] = None


	def _catalogue_uin_index() -> dict:
	    """Map every catalogue policy's IRDAI UIN -> (policy_id, policy_name).

	    Built once from 40-data/policy_facts/*.json (resolved two directories
	    above this file), then cached in `_catalogue_uin_cache`.

	    Returns:
	        dict keyed by upper-cased modern-format UIN. Files that cannot be
	        read or parsed, or that carry no modern-format UIN, are skipped.
	        When two files share a UIN the first in sorted filename order wins.
	    """
	    global _catalogue_uin_cache
	    if _catalogue_uin_cache is not None:
	        return _catalogue_uin_cache
	    import json as _json
	    import pathlib as _pl
	    import re as _re

	    # Compiled once instead of once per facts file.
	    modern_uin = _re.compile(r"[A-Z]{5,9}\d{5}V\d{6}")
	    doc_suffixes = ("__wordings", "__cis", "__brochure", "__prospectus")

	    def _find_uin(o):
	        """Depth-first search for the first "uin_code" entry in `o`."""
	        if isinstance(o, dict):
	            if "uin_code" in o:
	                v = o["uin_code"]
	                return v.get("value") if isinstance(v, dict) else v
	            children = o.values()
	        elif isinstance(o, list):
	            children = o
	        else:
	            return None
	        for x in children:
	            r = _find_uin(x)
	            if r:
	                return r
	        return None

	    idx: dict = {}
	    pf_dir = _pl.Path(__file__).resolve().parent.parent / "40-data" / "policy_facts"
	    for fp in sorted(pf_dir.glob("*.json")):
	        try:
	            # JSON is UTF-8; decoding with the locale default would make a
	            # facts file containing non-ASCII text fail here and silently
	            # drop out of the dedup index on non-UTF-8 hosts.
	            uin = _find_uin(_json.loads(fp.read_text(encoding="utf-8")))
	        except Exception:  # noqa: BLE001 — one bad facts file must not break uploads
	            continue
	        if not uin or not isinstance(uin, str):
	            continue
	        uin = uin.strip().upper()
	        # Only index modern-format IRDAI UINs — those are the only ones the
	        # uploaded-text matcher (_UIN_PATTERN) can ever extract. Legacy
	        # registration codes (e.g. "IRDAI/HLT/CTTK/...") are unmatchable,
	        # so indexing them would be dead weight.
	        if not modern_uin.fullmatch(uin):
	            continue
	        stem = fp.stem
	        # Strip document-type suffixes so the id names the policy, not the file.
	        for suf in doc_suffixes:
	            if stem.endswith(suf):
	                stem = stem[: -len(suf)]
	        nm = stem.split("__")[-1].replace("-", " ").title()
	        idx.setdefault(uin, (stem, nm))
	    _catalogue_uin_cache = idx
	    return idx


	def _match_catalogue_uin(text: str):
	    """Return (policy_id, policy_name) if `text` carries the IRDAI UIN of an
	    already-catalogued policy; else None.

	    Args:
	        text: Text extracted from the uploaded document; None or "" is
	            treated as "no UIN present".

	    Returns:
	        The catalogue entry for the first catalogued UIN in document
	        order, or None when no extracted UIN is in the catalogue.
	    """
	    import re as _re

	    idx = _catalogue_uin_index()
	    # Case-insensitive extraction — a UIN may appear in any case in the
	    # uploaded text / after PDF extraction; normalise to upper for lookup.
	    found = _re.findall(_UIN_PATTERN, text or "", _re.IGNORECASE)
	    # dict.fromkeys de-duplicates while keeping first-seen order, so a
	    # document mentioning several catalogued UINs always resolves to the
	    # same policy (iterating a set made the winner depend on hash order).
	    for u in dict.fromkeys(m.upper() for m in found):
	        if u in idx:
	            return idx[u]
	    return None


	# ---------------------------------------------------------------------------
	# Quarantine TTL auto-purge (2026-05-16)
	#
	# User-uploaded PDFs land in the SEPARATE `user_uploads_quarantine` Chroma
	# collection, scoped per session_id. They are intentionally ephemeral — NOT
	# durable corpus. Two risks if they linger forever:
	# 1. The quarantine HNSW index grows unbounded across thousands of one-off
	# uploads (a soft version of the 2026-05-14 link_lists.bin bloat).
	# 2. A user's private policy document stays queryable long after their
	# session is over.
	#
	# Mechanism (mirrors the existing in-memory ledgers in security.py /
	# session_state.py — process-local, resets on restart, v2 → Redis):
	# - `_quarantine_last_seen`: {session_id: epoch_seconds} updated on every
	# successful upload via `_quarantine_touch`.
	# - A periodic asyncio task (`_quarantine_purge_loop`) sweeps every
	# settings.QUARANTINE_PURGE_INTERVAL_SEC and deletes all quarantine
	# chunks whose session_id has had no upload for
	# settings.QUARANTINE_TTL_SECONDS (default 24h).
	# Deletion is `where={"session_id": sid}` — strictly scoped, can never touch
	# the curated `policies` collection (different collection entirely).
	# ---------------------------------------------------------------------------

	# session_id -> epoch seconds of that session's latest quarantine upload.
	# Written by _quarantine_touch; read and pruned by _purge_expired_quarantine.
	_quarantine_last_seen: dict[str, float] = {}
	# NOTE(review): nothing in the visible part of this file acquires this
	# lock — confirm it is used elsewhere before relying on it.
	_quarantine_lock = asyncio.Lock()


	def _quarantine_touch(session_id: str, policy_id: str = "") -> None:
	    """Stamp `session_id` with the current time in the quarantine ledger.

	    Falsy session ids are ignored and `policy_id` is accepted but unused.
	    Any error is swallowed: this bookkeeping must never fail an upload.
	    """
	    try:
	        if not session_id:
	            return
	        _quarantine_last_seen[session_id] = time.time()
	    except Exception:  # noqa: BLE001 — bookkeeping never breaks the upload
	        return


	def _purge_expired_quarantine(now: Optional[float] = None) -> int:
	    """Drop quarantine chunks of every session idle for at least the TTL.

	    `now` defaults to the current time and exists so callers can pin the
	    clock. Returns how many sessions were purged. Synchronous, so it can be
	    run through asyncio.to_thread; failures are logged, never raised.
	    """
	    if now is None:
	        now = time.time()
	    ttl = settings.QUARANTINE_TTL_SECONDS

	    # Iterate over a snapshot of the ledger rather than the live dict.
	    stale_sessions = []
	    for sid, last_seen in list(_quarantine_last_seen.items()):
	        if now - last_seen >= ttl:
	            stale_sessions.append(sid)
	    if not stale_sessions:
	        return 0

	    try:
	        from rag.ingest import get_quarantine_collection
	        coll = get_quarantine_collection()
	    except Exception as err:  # noqa: BLE001
	        logging.warning(
	            "quarantine TTL: could not open quarantine collection (%s: %s)",
	            type(err).__name__, err,
	        )
	        return 0

	    purged = 0
	    for sid in stale_sessions:
	        try:
	            coll.delete(where={"session_id": sid})
	            # Forget the session only after its chunks are really gone, so
	            # a failed delete is retried on the next sweep.
	            _quarantine_last_seen.pop(sid, None)
	            purged += 1
	            logging.info(
	                "quarantine TTL: purged session %s (idle > %ds)",
	                sid[:12], ttl,
	            )
	        except Exception as err:  # noqa: BLE001 — one bad delete must not abort the sweep
	            logging.warning(
	                "quarantine TTL: delete(where session=%s) failed (%s: %s)",
	                sid[:12], type(err).__name__, err,
	            )
	    return purged


	async def _quarantine_purge_loop() -> None:
	    """Run the quarantine TTL sweep forever: sleep, purge, repeat.

	    The pause is settings.QUARANTINE_PURGE_INTERVAL_SEC with a floor of 60
	    seconds. Cancellation propagates; every other error is logged and the
	    loop carries on.
	    """
	    pause_s = max(60, settings.QUARANTINE_PURGE_INTERVAL_SEC)
	    while True:
	        try:
	            await asyncio.sleep(pause_s)
	            # The sweep is blocking, so it runs on a worker thread.
	            await asyncio.to_thread(_purge_expired_quarantine)
	        except asyncio.CancelledError:
	            raise
	        except Exception as err:  # noqa: BLE001 — loop must survive any error
	            logging.warning(
	                "quarantine TTL purge loop iteration failed (%s: %s)",
	                type(err).__name__, err,
	            )


	# Single source of truth for "is this profile ready to recommend against":
	# brain_tools._profile_complete, which uses the _REQUIRED_FOR_READY tuple.
	# _compute_profile_complete below delegates to it.
	#
	# Historical note: _FEATURE_B_SLOT_LIST + _every_filled_slot_was_set_this_turn
	# were the heuristic that distinguished "first-time capture on turn 1" from
	# "stored profile recalled on turn 1" for the returning-user banner.
	# Removed in ADR-043 (2026-05-27) — no cross-session recall, so there is
	# no banner to flip.


	def _compute_profile_complete(session_id: str) -> bool:
	    """Report whether the live session profile has every required slot set.

	    Looks up the session and delegates to brain_tools._profile_complete.
	    Any failure on the way (import error, missing session, missing
	    attribute, ...) yields False, so the frontend never sees a stale `true`.
	    """
	    try:
	        from backend.session_state import get_session
	        from backend.brain_tools import _profile_complete

	        profile = get_session(session_id).profile
	        return True if _profile_complete(profile) else False
	    except Exception:  # noqa: BLE001 — never block a chat reply for this
	        return False


	# ---------- app ----------

	# The ASGI application; every route and startup hook below attaches to it.
	app = FastAPI(
	title="Insurance Sales Portfolio Expert API",
	description="Backend for the Sarvam AI take-home assignment.",
	version="0.1.0",
	)

	# NOTE(review): wildcard origins together with allow_credentials=True is the
	# combination FastAPI's CORS documentation warns against. Before a
	# production deploy, list the real frontend origins explicitly or turn
	# credentials off — confirm what the frontend needs first.
	app.add_middleware(
	CORSMiddleware,
	allow_origins=["*"], # tighten for production deploy
	allow_credentials=True,
	allow_methods=["*"],
	allow_headers=["*"],
	)


	# Bug B (2026-05-15) — /api/chat raw 422 leak. Live smoke saw the frontend
	# render `{"detail":[{"type":"missing","loc":["body","user_text"]...}]}` as
	# the bot reply because a malformed POST (missing user_text) hit FastAPI's
	# default RequestValidationError handler — that body bypasses our
	# ChatResponse envelope and the frontend has no shape-mapping for it.
	# We intercept the chat endpoint specifically and return a clean
	# ChatResponse-shaped JSON so frontend parsing never errors out. Other
	# endpoints keep FastAPI's default 422 behaviour (which their callers
	# already handle).
	@app.exception_handler(RequestValidationError)
	async def _validation_exception_handler(request: Request, exc: RequestValidationError):
	    """Turn request-validation failures into a response the caller can parse.

	    Args:
	        request: The incoming request; only its URL path is inspected.
	        exc: The validation error raised while parsing the request.

	    Returns:
	        For /api/chat: an HTTP 200 JSON body shaped like ChatResponse with
	        a generic apology, so the frontend never renders a raw 422 payload.
	        For every other path: whatever FastAPI's own handler returns.
	    """
	    if request.url.path != "/api/chat":
	        # Delegate to FastAPI's stock handler rather than re-creating it:
	        # it runs the error list through jsonable_encoder, so errors whose
	        # context holds non-JSON values still serialise to a proper 422.
	        from fastapi.exception_handlers import (
	            request_validation_exception_handler,
	        )

	        return await request_validation_exception_handler(request, exc)

	    logging.warning(
	        "chat endpoint received malformed body — returning graceful "
	        "ChatResponse-shaped 200 instead of raw 422. errors=%r",
	        exc.errors()[:3],
	    )
	    # Mirrors every ChatResponse field, including the optional TTS error
	    # fields and returning_user_recalled, so the client sees one shape.
	    return JSONResponse(
	        status_code=200,
	        content={
	            "reply_text": (
	                "Sorry, something went wrong — try again."
	            ),
	            "citations": [],
	            "brain_used": "error_fallback",
	            "intent": "qa",
	            "language": "en",
	            "latency_ms": 0,
	            "session_id": "",
	            "audio_base64": None,
	            "audio_mime": None,
	            "tts_error_code": None,
	            "tts_user_message": None,
	            "faithfulness_passed": True,
	            "faithfulness_reasons": [],
	            "blocked": False,
	            "profile_updates": {},
	            "profile_complete": False,
	            "returning_user_recalled": False,
	        },
	    )


	# ---------- Admin panel + LLM health background loop ----------
	# Mount the password-gated admin endpoints. Unauthorized callers get
	# 401 Unauthorized. Access is gated by a strong password only (no IP
	# allowlist, which would lock the operator out when switching networks
	# without adding real security).
	# Imported here, after `app` exists, and mounted straight away.
	from backend import admin as _admin_router_module
	app.include_router(_admin_router_module.router)


	@app.on_event("startup")
	async def _startup_load_admin_overrides():
	    """Re-apply any persisted chain reorderings from the previous process.

	    Reads settings.DATA_DIR / "admin_overrides.json" when it exists and,
	    for each of the roles "brain", "fast_brain" and "judge" whose value is
	    a list, replaces the matching *_CHAIN attribute on
	    backend.providers.nvidia_nim_llm. A missing file is a no-op; a broken
	    file is logged and the default chains stay in place, so boot never
	    fails here.
	    """
	    override_path = settings.DATA_DIR / "admin_overrides.json"
	    if not override_path.exists():
	        return
	    try:
	        overrides = json.loads(override_path.read_text())
	        if not isinstance(overrides, dict):
	            raise ValueError("expected a JSON object at the top level")
	        from backend.providers import nvidia_nim_llm as nim
	        name_map = {"brain": "BRAIN_CHAIN", "fast_brain": "FAST_BRAIN_CHAIN", "judge": "JUDGE_CHAIN"}
	        for role, attr in name_map.items():
	            chain = overrides.get(role)
	            if isinstance(chain, list):
	                # Copy so later edits to the parsed JSON cannot alias it.
	                setattr(nim, attr, list(chain))
	    except Exception as e:  # noqa: BLE001 — bad override file shouldn't crash boot
	        # Say so, instead of silently booting with the default chains.
	        logging.warning(
	            "admin overrides: could not apply %s (%s: %s) — "
	            "falling back to default chains",
	            override_path, type(e).__name__, e,
	        )


	@app.on_event("startup")
	async def _startup_llm_health_probe():
	    """Launch llm_health.background_probe_loop as a background task.

	    Per the original note, the loop periodically pings the NIM models and
	    marks unresponsive ones as down so the chain can skip them.
	    """
	    from backend import llm_health

	    # The event loop keeps only weak references to tasks, so a task whose
	    # handle is dropped can be garbage-collected mid-run. Parking the
	    # handle on app.state keeps it alive for the life of the process.
	    app.state.llm_health_probe_task = asyncio.create_task(
	        llm_health.background_probe_loop()
	    )


	@app.on_event("startup")
	async def _startup_quarantine_ttl_purge():
	    """Launch the periodic quarantine TTL sweep (2026-05-16).

	    Starts _quarantine_purge_loop as a background task. The loop evicts
	    user-uploaded PDF chunks whose session has been idle longer than
	    settings.QUARANTINE_TTL_SECONDS, so the quarantine index can't grow
	    unbounded and stale private docs don't linger.
	    """
	    # The event loop keeps only weak references to tasks, so a task whose
	    # handle is dropped can be garbage-collected mid-run. Parking the
	    # handle on app.state keeps it alive for the life of the process.
	    app.state.quarantine_purge_task = asyncio.create_task(
	        _quarantine_purge_loop()
	    )


	@app.on_event("startup")
	async def _startup_upload_extraction_backfill():
	    """ADR-044 (2026-05-27) — on every container boot, run LLM-assisted
	    extraction on any persisted upload that doesn't yet have a
	    `rag/extracted/<policy_id>.json` file. This upgrades old uploads
	    (persisted before the LLM-extraction pipeline was wired, OR before
	    a fix to the pipeline was deployed) to the same data depth a fresh
	    upload now gets. Idempotent: extracts that already exist are skipped.
	    Runs as a background task so it doesn't delay app readiness.
	    """
	    from backend import uploaded_docs as _udocs

	    # The event loop keeps only weak references to tasks, so a task whose
	    # handle is dropped can be garbage-collected mid-run. Parking the
	    # handle on app.state keeps it alive for the life of the process.
	    app.state.upload_backfill_task = asyncio.create_task(
	        _udocs.backfill_extractions(force=False)
	    )


	@app.on_event("startup")
	async def _startup_single_brain_warmup():
	    """Warm up the single-brain connection at boot.

	    Awaits single_brain.warmup() so the first /api/chat turn does not pay
	    the cold-start cost. Warmup is only an optimisation: any failure is
	    logged and boot continues.
	    """
	    try:
	        from backend import single_brain

	        warm_s = await single_brain.warmup()
	        # A None result is not logged as a completed warmup.
	        if warm_s is None:
	            return
	        logging.info(
	            "single_brain warmup completed at boot (%.2fs)", warm_s,
	        )
	    except Exception as err:  # noqa: BLE001
	        logging.warning(
	            "single_brain warmup raised at top level (%s: %s) — boot continues",
	            type(err).__name__, err,
	        )


	@app.on_event("startup")
	async def _startup_reingest_uploaded_docs():
	"""#52 — re-materialise persisted uploaded-policy docs after a restart.

	On the HF Space, rag/vectors is the EPHEMERAL container FS (KI-119):
	every rebuild pulls a fresh Chroma snapshot, so an uploaded doc's
	chunks indexed last boot are GONE. The PDF + curated-facts JSON + chunk
	payload were persisted to the /data disk (settings.UPLOADED_DOCS_DIR),
	so here we re-embed those chunks back into the fresh `policies`
	collection. The cards themselves reappear automatically because
	_load_curated_facts merges the persisted JSON records.

	Wrapped so a re-ingest hiccup never crashes boot — but it logs LOUDLY
	(no silent failure): an uploaded card with no retrievable chunks is a
	real degradation operators must see.
	"""
	try:
	from backend import uploaded_docs as _udocs

	# Only .get("docs" / "chunks" / "skipped") is used on the result, so it
	# is presumably a dict of counters — confirm against uploaded_docs.
	summary = await _udocs.reingest_persisted_into_policies()
	# Stay quiet when there was nothing to re-ingest and nothing skipped.
	if summary.get("docs") or summary.get("skipped"):
	logging.info(
	"#52 startup re-ingest: %d uploaded docs / %d chunks "
	"re-indexed into `policies` (%d skipped)",
	summary.get("docs", 0), summary.get("chunks", 0),
	summary.get("skipped", 0),
	)
	# Bust the #40 grade cache so the restored cards grade on first hit.
	# _MG_LOCK / _MG_CACHE are defined outside the visible part of this file;
	# any error while resetting them is deliberately ignored.
	try:
	with _MG_LOCK:
	_MG_CACHE["sig"] = None
	_MG_CACHE["index"] = None
	except Exception: # noqa: BLE001
	pass
	except Exception as e: # noqa: BLE001 — re-ingest failure must not block boot
	logging.warning(
	"#52 startup re-ingest FAILED (%s: %s) — uploaded-doc cards "
	"will show but their chunks are NOT retrievable until next "
	"successful re-ingest",
	type(e).__name__, e,
	)


	async def _startup_purge_dangling_profile_chunks():
	"""KI-117 — boot-time self-heal of dangling `doc_type='profile'` chunks.

	Background: KI-102's earliest deploy wrote a `profile_anonymous` chunk
	WITHOUT a `session_id` metadata field. That legacy row poisoned every
	subsequent retrieval whose `where` clause referenced session_id, because
	Chroma raises when a filtered row is missing the filtered key. KI-112
	added input guards so no new bad rows can be written, and the local DB
	was cleaned manually. But the HF Space carries its OWN copy of the
	Chroma DB and still contains the dangling row.

	This handler scans the collection for any `doc_type='profile'` chunks
	whose metadata lacks a non-empty `session_id` and deletes them. Runs
	idempotently — if there are no bad rows, it's a no-op. After HF rebuilds
	with this code, the boot task self-heals HF's DB on first request.

	Wrapped in try/except so a Chroma hiccup never crashes boot.
	"""
	# Synchronous worker; it is handed to asyncio.to_thread at the bottom.
	def _do_purge() -> None:
	from rag.retrieve import get_collection

	coll = get_collection()
	try:
	# Fetch metadata only, for at most 10000 profile chunks per boot.
	res = coll.get(
	where={"doc_type": "profile"},
	limit=10000,
	include=["metadatas"],
	)
	except Exception as e:
	logging.warning(
	"KI-117: profile-chunk scan failed (%s: %s) — skipping cleanup",
	type(e).__name__, e,
	)
	return

	# Missing or None result fields are treated as empty lists.
	ids = res.get("ids") or []
	metas = res.get("metadatas") or []
	bad_ids: list[str] = []
	for cid, meta in zip(ids, metas):
	# KI-118 (2026-05-15) — profile chunks are now keyed by name_slug;
	# accept EITHER a non-empty name_slug (new) OR a non-empty
	# session_id (legacy KI-102 row) as proof-of-ownership. A profile
	# chunk with neither key is the dangling-row corruption case and
	# must be purged.
	slug = (meta or {}).get("name_slug")
	sid = (meta or {}).get("session_id")
	# Non-string and whitespace-only values count as absent.
	slug_ok = isinstance(slug, str) and slug.strip()
	sid_ok = isinstance(sid, str) and sid.strip()
	if not (slug_ok or sid_ok):
	bad_ids.append(cid)

	if bad_ids:
	try:
	coll.delete(ids=bad_ids)
	# At most the first ten ids are logged, with "..." when truncated.
	logging.info(
	"KI-117: purged %d dangling profile chunks at boot (ids=%s)",
	len(bad_ids),
	bad_ids[:10] + (["..."] if len(bad_ids) > 10 else []),
	)
	except Exception as e:
	logging.warning(
	"KI-117: delete(ids=...) failed (%s: %s) — bad rows remain",
	type(e).__name__, e,
	)
	return
	else:
	logging.info("KI-117: no dangling profile chunks found (DB clean)")

	# Informational only: report the collection size after the cleanup.
	try:
	total = coll.count()
	logging.info("KI-117: total chunks after cleanup: %d", total)
	except Exception as e:
	logging.warning(
	"KI-117: post-cleanup count() failed (%s: %s)",
	type(e).__name__, e,
	)

	try:
	# Run the purge on a worker thread instead of the event loop.
	await asyncio.to_thread(_do_purge)
	except Exception as e:
	# Belt + suspenders — boot must never crash.
	logging.warning(
	"KI-117: boot cleanup raised at top level (%s: %s) — continuing boot",
	type(e).__name__, e,
	)


	@app.on_event("startup")
	async def _startup_purge_dangling_profile_chunks_handler():
	"""KI-117 — register the boot-time cleanup as a FastAPI startup hook."""
	# Thin wrapper: the undecorated coroutine stays directly callable, and
	# this hook only awaits it during application startup.
	await _startup_purge_dangling_profile_chunks()


	@app.get("/api/health", response_model=HealthResponse)
	async def health():
	    """Report configuration health.

	    Status is "ok" when settings.validate() returns nothing missing and
	    "degraded" otherwise; providers_ok says whether each provider's API
	    key is set.
	    """
	    missing = settings.validate()
	    # Post-D-019 the stack is Sarvam (voice + Indic) + NVIDIA NIM (brain +
	    # judge). GROQ + OpenRouter were retired; referencing their settings
	    # here would raise AttributeError on every call.
	    key_presence = {
	        "sarvam": bool(settings.SARVAM_API_KEY),
	        "nvidia_nim": bool(settings.NVIDIA_NIM_API_KEY),
	    }
	    overall = "degraded" if missing else "ok"
	    return HealthResponse(
	        status=overall,
	        providers_ok=key_presence,
	        missing_keys=missing,
	    )


	# KI-096 — public deploy-verification endpoint. No auth (deliberate) so any
	# caller can confirm which commit the HF Space is actually serving without
	# needing the admin password. Cached at module import so we don't spawn
	# `git` per request.
	def _compute_build_sha() -> str:
	    """Return a short (12-character) identifier of the running build.

	    The BUILD_SHA environment variable wins, then HF_SPACE_GIT_REV, then
	    `git rev-parse HEAD` run from the directory above this package. When
	    none of them yields a value the result is "unknown".
	    """
	    import os
	    import subprocess

	    for var in ("BUILD_SHA", "HF_SPACE_GIT_REV"):
	        pinned = os.environ.get(var)
	        if pinned:
	            return pinned[:12]

	    try:
	        raw_head = subprocess.check_output(
	            ["git", "rev-parse", "HEAD"],
	            cwd=Path(__file__).resolve().parent.parent,
	            stderr=subprocess.DEVNULL,
	            timeout=2,
	        )
	        sha = raw_head.decode().strip()
	    except Exception:
	        # git missing, not a checkout, timeout, undecodable output, ...
	        return "unknown"
	    return sha[:12] if sha else "unknown"


	# Resolved once at import time so no request ever spawns `git`.
	_BUILD_SHA = _compute_build_sha()
	# Epoch seconds at module import; /api/version derives uptime from it.
	_BUILD_STARTED_AT = time.time()


	@app.get("/api/version")
	async def version():
	    """Public deploy-verification endpoint — no auth required.

	    Reports the build SHA captured at import, the process start time
	    (epoch seconds) and the uptime in seconds rounded to one decimal.
	    Deploy probes and humans use it to confirm which commit the HF Space
	    is serving; the admin /api/admin/* endpoints are password-gated
	    (KI-097) and return 401, so this is the auth-free alternative.
	    """
	    uptime = time.time() - _BUILD_STARTED_AT
	    payload = {
	        "sha": _BUILD_SHA,
	        "started_at": _BUILD_STARTED_AT,
	        "uptime_s": round(uptime, 1),
	    }
	    return payload


	@app.post("/api/transcribe", response_model=TranscribeResponse)
	async def transcribe(
	    file: UploadFile = File(...),
	    language_code: Optional[str] = Form(None),
	):
	    """Speech-to-text for an uploaded audio file (WAV/MP3/etc.).

	    KI-242 — the endpoint always answers HTTP 200. On failure `text` is
	    empty and the error is reported through the closed `error_code` enum
	    plus a friendly `user_message`, so the frontend never parses raw httpx
	    text. An HTTP 429 from the provider is retried ONCE after a 2 s pause
	    before being surfaced as `error_code: "rate_limit"`.
	    """
	    import httpx as _httpx
	    from backend.providers.sarvam_stt import (
	        classify_stt_exception,
	        STT_ERROR_USER_MESSAGES,
	        STT_ERROR_RATE_LIMIT,
	    )

	    started = time.time()
	    audio_bytes = await file.read()

	    # The container format comes from the filename extension; anything
	    # unrecognised (or a missing filename) is treated as WAV.
	    known_formats = ("wav", "mp3", "flac", "ogg", "m4a", "webm", "opus", "mp4")
	    suffix = (file.filename or "audio.wav").rsplit(".", 1)[-1].lower()
	    audio_format = suffix if suffix in known_formats else "wav"

	    def _is_http_429(err) -> bool:
	        """True only for an httpx status error whose response is a 429."""
	        return (
	            isinstance(err, _httpx.HTTPStatusError)
	            and err.response is not None
	            and err.response.status_code == 429
	        )

	    async def _attempt():
	        return await get_stt().transcribe(
	            audio_bytes=audio_bytes,
	            audio_format=audio_format,
	            language_code=language_code,
	        )

	    failure: Optional[BaseException] = None
	    try:
	        result = await _attempt()
	    except Exception as first_err:  # noqa: BLE001 — classifier narrows
	        failure = first_err
	        # Retry only a positively identified rate limit; every other
	        # failure is surfaced immediately.
	        if _is_http_429(first_err):
	            await asyncio.sleep(2.0)
	            try:
	                result = await _attempt()
	                failure = None
	            except Exception as second_err:  # noqa: BLE001
	                failure = second_err

	    latency = int((time.time() - started) * 1000)

	    if failure is None:
	        return TranscribeResponse(
	            text=result.text,
	            language_code=result.language_code,
	            confidence=result.confidence,
	            latency_ms=latency,
	        )

	    code = classify_stt_exception(failure)
	    # Keep the underlying error in the server log for diagnostics, but
	    # never leak the raw httpx string into the user-facing response.
	    logging.warning(
	        "STT failed: error_code=%s exc=%s: %s",
	        code,
	        type(failure).__name__,
	        failure,
	    )
	    # Force rate_limit when the retry was exhausted on a 429 as well.
	    if _is_http_429(failure):
	        code = STT_ERROR_RATE_LIMIT
	    return TranscribeResponse(
	        text="",
	        language_code=language_code,
	        confidence=0.0,
	        latency_ms=latency,
	        error_code=code,
	        user_message=STT_ERROR_USER_MESSAGES.get(
	            code, STT_ERROR_USER_MESSAGES["unknown"]
	        ),
	    )


	# F3 confirmation auto-extract — patterns and alias table, built once at
	# import time instead of on every /api/chat request.
	#
	# The alternation uses a bare `|`: inside a raw string `\|` is a LITERAL pipe,
	# which would make the pattern match only the text "yes|correct|..." and the
	# safety net would never trigger.
	_F3_CONFIRM_RE = re.compile(
	    r"\b(yes|correct|that'?s right|all correct|looks good)\b",
	    re.IGNORECASE,
	)
	# Recap lines are markdown bullets with a bold label, e.g.
	#   * **Primary Goal:** first family policy
	# NOTE(review): the bullet/bold shape is reconstructed from the pattern's
	# structure — confirm it matches the recap format single_brain emits.
	_F3_RECAP_BULLET_RE = re.compile(r"^\s*\*\s*\*\*[^:]+:\*\*", re.MULTILINE)
	_F3_RECAP_LINE_RE = re.compile(
	    r"^\s*\*\s*\*\*([^:]+):\*\*\s*(.+?)\s*$",
	    re.MULTILINE,
	)
	# Slot label aliases -> canonical _REQUIRED_FOR_READY field names.
	# Keys are lowercased + whitespace-collapsed.
	_F3_SLOT_ALIASES: dict[str, str] = {
	    "name": "name",
	    "full name": "name",
	    "age": "age",
	    "dependents": "dependents",
	    "family": "dependents",
	    "family members": "dependents",
	    "location": "location_tier",
	    "city": "location_tier",
	    "location tier": "location_tier",
	    "city tier": "location_tier",
	    "income": "income_band",
	    "income band": "income_band",
	    "annual income": "income_band",
	    "primary goal": "primary_goal",
	    "goal": "primary_goal",
	    "objective": "primary_goal",
	    "health conditions": "health_conditions",
	    "health": "health_conditions",
	    "medical conditions": "health_conditions",
	    "pre-existing conditions": "health_conditions",
	    "medical history": "health_conditions",
	}


	def _f3_parse_recap_slots(recap_text: str) -> dict[str, str]:
	    """Return ``{canonical_slot: value}`` parsed from a recap bullet list.

	    Labels are normalised (lowercased, whitespace collapsed) and looked up in
	    ``_F3_SLOT_ALIASES``; unknown labels and empty values are ignored. When a
	    slot appears more than once, the first non-empty value wins.
	    """
	    parsed: dict[str, str] = {}
	    for label, value in _F3_RECAP_LINE_RE.findall(recap_text):
	        slot = _F3_SLOT_ALIASES.get(" ".join(label.strip().lower().split()))
	        if not slot:
	            continue
	        cleaned = (value or "").strip().rstrip(".")
	        if cleaned:
	            parsed.setdefault(slot, cleaned)
	    return parsed


	def _log_turn_best_effort(payload: dict) -> None:
	    """Write one turn-log record; a logging failure must never block a reply."""
	    try:
	        log_turn(payload)
	    except Exception:  # noqa: BLE001 — log IO must never block a reply
	        logging.debug("log_turn failed; continuing", exc_info=True)


	@app.post("/api/chat", response_model=ChatResponse)
	async def chat(req: ChatRequest, request: Request):
	    """Run one chat turn and return the reply, optionally with TTS audio.

	    Steps: negotiate the TTS codec from ``X-Preferred-Codec``; run the brain
	    (``single_brain`` when ``USE_SINGLE_BRAIN`` is on, otherwise
	    ``nim_fallback``); apply three best-effort safety nets (closer auto-mark,
	    recommendation auto-mark, F3 profile backfill); synthesise audio when
	    requested; log the turn; build the ``ChatResponse``.

	    Brain timeouts, unexpected brain errors and response-build errors are
	    converted into graceful ``ChatResponse`` payloads instead of propagating.
	    """
	    session_id = req.session_id or str(uuid.uuid4())
	    # X8 (2026-05-15) — frontend sends X-Preferred-Codec so the browser can
	    # decode the TTS payload natively (WebM/Opus on Chrome+Firefox, MP4/AAC on
	    # Safari, WAV as universal fallback). Default to WAV if the header is
	    # missing or invalid.
	    _allowed_codecs = {"audio/wav", "audio/mp4", "audio/webm"}
	    # KI-278 (2026-05-16) — the frontend sends a full MediaSource codec
	    # string, e.g. "audio/webm; codecs=opus". Strip the codec parameter +
	    # whitespace before the membership test so the negotiated container is
	    # honoured instead of being silently downgraded to wav.
	    preferred_codec = (
	        request.headers.get("X-Preferred-Codec", "audio/wav") or "audio/wav"
	    ).split(";")[0].strip().lower()
	    if preferred_codec not in _allowed_codecs:
	        preferred_codec = "audio/wav"
	    t_chat0 = time.time()
	    # Never let an inner TimeoutError / unhandled exception bubble out of
	    # handle_turn as a 500. The whole call is wrapped in an outer 45s
	    # budget so even a pathological hang inside handle_turn surfaces as a
	    # graceful reply, not a connection-reset to the user. 45s is generous
	    # but tighter than HF Space's gateway timeout, so the user always gets
	    # a response.
	    try:
	        if USE_SINGLE_BRAIN:
	            # One Gemini call per turn with native function-calling.
	            # Falls back to nim_fallback on SingleBrainError so a missing
	            # GOOGLE_API_KEY / model outage never breaks the chat.
	            from backend import single_brain
	            from backend.session_state import get_session

	            _sb_session = get_session(session_id)
	            # Once a session has had ANY successful single_brain turn, it
	            # must stay on single_brain for the rest of its lifetime.
	            # Switching brains mid-stream would discard everything
	            # single_brain captured in last_recommendation_ids /
	            # last_retrieved_chunks / slug_to_insurer. Sticky check below.
	            _sb_was_sticky = getattr(_sb_session, "single_brain_sticky", False)
	            try:
	                turn = await asyncio.wait_for(
	                    single_brain.handle_turn(
	                        session=_sb_session,
	                        user_text=req.user_text,
	                        chat_history=req.chat_history,
	                        # KI-330 (2026-05-27) — pipe view_context through so
	                        # single_brain can build an ACTIVE POLICY DIVE-IN
	                        # block when the frontend tells us the user is
	                        # focused on a specific policy.
	                        view_context=req.view_context or None,
	                    ),
	                    timeout=45.0,
	                )
	                # First successful single_brain turn stamps the flag so
	                # every subsequent turn on this session is locked in.
	                # Deliberately best-effort: failing to stamp the flag must
	                # not discard a reply that was already produced.
	                try:
	                    _sb_session.single_brain_sticky = True
	                except Exception:  # noqa: BLE001
	                    pass
	            except single_brain.SingleBrainError as _sb_err:
	                if _sb_was_sticky:
	                    # Session already had a clean single_brain turn. Do NOT
	                    # cross-fade to the fallback brain (loses turn state +
	                    # frontend sees the brain hop). Emit a graceful retry
	                    # prompt instead.
	                    logging.warning(
	                        "single_brain failed on STICKY session (session=%s); "
	                        "emitting graceful retry, NOT falling back: %s",
	                        session_id, _sb_err,
	                    )
	                    turn = single_brain.TurnResult(
	                        reply_text=(
	                            # 2026-05-27 — honest copy: the cause is an
	                            # upstream model-service failure, not the
	                            # user's phrasing, so ask for a plain resend.
	                            "My model service had a brief blip on that turn "
	                            "— please send the same message again, it should "
	                            "go through now."
	                        ),
	                        citations=[],
	                        retrieved_chunk_ids=[],
	                        brain_used="single_brain::sticky_graceful_retry",
	                        intent="qa",
	                        language="en",
	                        latency_ms=int((time.time() - t_chat0) * 1000),
	                        raw_reply=f"SingleBrainError: {_sb_err}",
	                        faithfulness_passed=True,
	                        faithfulness_reasons=[],
	                        blocked=False,
	                        profile_updates={},
	                    )
	                else:
	                    logging.warning(
	                        "single_brain failed, falling back to nim_fallback "
	                        "(session=%s): %s",
	                        session_id, _sb_err,
	                    )
	                    turn = await asyncio.wait_for(
	                        nim_fallback.handle_turn_fallback(
	                            session=_sb_session,
	                            user_text=req.user_text,
	                            chat_history=req.chat_history,
	                        ),
	                        timeout=20.0,
	                    )
	        else:
	            # When USE_SINGLE_BRAIN is off, route directly through the
	            # minimal NIM fallback so the bot still serves a reply.
	            from backend.session_state import get_session as _get_session
	            turn = await asyncio.wait_for(
	                nim_fallback.handle_turn_fallback(
	                    session=_get_session(session_id),
	                    user_text=req.user_text,
	                    chat_history=req.chat_history,
	                ),
	                timeout=20.0,
	            )
	    except asyncio.TimeoutError:
	        logging.warning(
	            "handle_turn outer TimeoutError; returning graceful reply (session=%s)",
	            session_id,
	        )
	        # Guarded: a turn-log failure here would otherwise escape the
	        # handler and turn the graceful reply into a 500.
	        _log_turn_best_effort({
	            "session_id": session_id,
	            "user_text": req.user_text,
	            "error": "asyncio.TimeoutError (outer 45s budget or inner wait_for)",
	            "graceful": True,
	        })
	        return ChatResponse(
	            reply_text=(
	                "That took longer than expected — let me try a smaller answer. "
	                "Could you ask me again, maybe more specifically?"
	            ),
	            citations=[],
	            brain_used="timeout_fallback",
	            intent="qa",
	            language="en",
	            latency_ms=int((time.time() - t_chat0) * 1000),
	            session_id=session_id,
	            audio_base64=None,
	            faithfulness_passed=True,
	            faithfulness_reasons=[],
	            blocked=False,
	            profile_updates={},
	            profile_complete=_compute_profile_complete(session_id),
	        )
	    except Exception as e:
	        logging.exception(
	            "handle_turn unhandled exception (session=%s)", session_id
	        )
	        _log_turn_best_effort({
	            "session_id": session_id,
	            "user_text": req.user_text,
	            "error": f"{type(e).__name__}: {e}",
	            "graceful": True,
	        })
	        return ChatResponse(
	            reply_text=(
	                "Hmm, something went wrong on my end. Could you try once more?"
	            ),
	            citations=[],
	            brain_used="error_fallback",
	            intent="qa",
	            language="en",
	            latency_ms=int((time.time() - t_chat0) * 1000),
	            session_id=session_id,
	            audio_base64=None,
	            faithfulness_passed=True,
	            faithfulness_reasons=[],
	            blocked=False,
	            profile_updates={},
	            profile_complete=_compute_profile_complete(session_id),
	        )

	    # Server-side closer-keyword safety net for RULE 7.
	    # If the user clearly committed to a policy this turn but the brain did
	    # NOT record mark_recommendation in turn.brain_used, auto-call
	    # mark_recommendation against session.last_recommendation_ids[:1] so the
	    # closure event is recorded for analytics regardless of whether the LLM
	    # remembered to pull the tool. Best-effort; never blocks the reply.
	    try:
	        if (
	            USE_SINGLE_BRAIN
	            and turn is not None
	            and getattr(turn, "reply_text", None)
	            and _CLOSER_KEYWORD_RE.search(req.user_text or "")
	            and "mark_recommendation" not in (turn.brain_used or "")
	        ):
	            from backend.session_state import get_session as _get_session
	            from backend import brain_tools as _brain_tools

	            _closer_session = _get_session(session_id)
	            _last_recs = list(
	                getattr(_closer_session, "last_recommendation_ids", []) or []
	            )
	            if _last_recs:
	                _result = _brain_tools.mark_recommendation(
	                    session=_closer_session,
	                    policy_ids=_last_recs[:1],
	                    is_final=True,
	                )
	                logging.info(
	                    "U1-T9 closer auto-mark (session=%s) user_text=%r "
	                    "policy_ids=%s result=%s",
	                    session_id, req.user_text, _last_recs[:1], _result,
	                )
	    except Exception as _closer_err:  # noqa: BLE001
	        # Safety-net must never break the reply.
	        logging.warning(
	            "U1-T9 closer auto-mark failed (session=%s): %s: %s",
	            session_id, type(_closer_err).__name__, _closer_err,
	        )

	    # KI-254 — auto-mark_recommendation when single_brain emits a
	    # recommendation turn (retrieve_policies fired + citations non-empty)
	    # but mark_recommendation was not called. This populates
	    # session.last_recommendation_ids so the NEXT turn's ordinal follow-up
	    # ("tell me about #2", "the second one", "first option") can resolve.
	    # Safety net mirrors the U1-T9 closer pattern: best-effort, never blocks.
	    try:
	        if (
	            USE_SINGLE_BRAIN
	            and turn is not None
	            and getattr(turn, "citations", None)
	            and "retrieve_policies" in (turn.brain_used or "")
	            and "mark_recommendation" not in (turn.brain_used or "")
	        ):
	            from backend.session_state import get_session as _get_session_r
	            from backend import brain_tools as _brain_tools_r

	            _rec_session = _get_session_r(session_id)
	            # Ordered, de-duplicated policy ids from the turn's citations
	            # (citations may be dicts or attribute-style objects).
	            _cited_ids: list[str] = []
	            _seen: set[str] = set()
	            for _c in (turn.citations or []):
	                pid = _c.get("policy_id") if isinstance(_c, dict) else getattr(_c, "policy_id", None)
	                pid = (pid or "").strip()
	                if pid and pid not in _seen:
	                    _seen.add(pid)
	                    _cited_ids.append(pid)
	            if _cited_ids:
	                # KI-278 — turn.citations is the prose-aligned
	                # recommendation set, so back-fill the FULL list (no cap)
	                # and ordinal follow-ups ("the 4th one") resolve against
	                # exactly the cards the user sees.
	                _result_r = _brain_tools_r.mark_recommendation(
	                    session=_rec_session,
	                    policy_ids=_cited_ids,
	                    is_final=False,
	                )
	                logging.info(
	                    "KI-254 auto-mark on rec turn (session=%s) "
	                    "policy_ids=%s result=%s",
	                    session_id, _cited_ids, _result_r,
	                )
	    except Exception as _rec_err:  # noqa: BLE001
	        logging.warning(
	            "KI-254 auto-mark on rec turn failed (session=%s): %s: %s",
	            session_id, type(_rec_err).__name__, _rec_err,
	        )

	    # F3 — confirmation auto-extract safety net.
	    # Symptom: the bot emits a recap bullet list from conversation context
	    # but skips one or more save_profile_field calls. User says "yes this is
	    # correct"; the profile-complete gate refuses retrieval and the bot
	    # re-asks. This block parses the bot's prior recap turn, maps slot
	    # labels -> _REQUIRED_FOR_READY field names, and backfills any slot
	    # that's STILL missing on the live profile. Best-effort; never blocks.
	    try:
	        if (
	            USE_SINGLE_BRAIN
	            and turn is not None
	            and _F3_CONFIRM_RE.search(req.user_text or "")
	            and not getattr(turn, "profile_complete", False)
	        ):
	            # Locate the most recent bot/assistant message in chat_history.
	            _prior_bot_text = ""
	            for _msg in reversed(req.chat_history or []):
	                if not isinstance(_msg, dict):
	                    continue
	                _role = (_msg.get("role") or "").lower()
	                if _role in ("assistant", "bot", "model"):
	                    _prior_bot_text = _msg.get("content") or ""
	                    break

	            if _prior_bot_text and _F3_RECAP_BULLET_RE.search(_prior_bot_text):
	                from backend.session_state import get_session as _get_session_f3
	                from backend import brain_tools as _brain_tools_f3

	                _f3_session = _get_session_f3(session_id)
	                _profile_f3 = _f3_session.profile
	                _parsed = _f3_parse_recap_slots(_prior_bot_text)

	                _backfilled: list[str] = []
	                for _slot in _brain_tools_f3._REQUIRED_FOR_READY:
	                    if _slot not in _parsed:
	                        continue
	                    # Don't override slots that already have values.
	                    _existing = getattr(_profile_f3, _slot, None)
	                    if _existing not in (None, "", []):
	                        continue
	                    try:
	                        _r = _brain_tools_f3.save_profile_field(
	                            session=_f3_session,
	                            field=_slot,
	                            value=_parsed[_slot],
	                        )
	                        if isinstance(_r, dict) and _r.get("saved"):
	                            _backfilled.append(_slot)
	                    except Exception:  # noqa: BLE001 — best-effort
	                        continue

	                if _backfilled:
	                    logging.info(
	                        "F3 confirmation auto-extract (session=%s): backfilled %s",
	                        session_id, _backfilled,
	                    )
	    except Exception as _f3_err:  # noqa: BLE001
	        # Safety-net must never break the reply.
	        logging.warning(
	            "F3 confirmation auto-extract failed (session=%s): %s: %s",
	            session_id, type(_f3_err).__name__, _f3_err,
	        )

	    audio_b64 = None
	    audio_mime: Optional[str] = None
	    # When TTS fails we propagate a STRUCTURED, user-facing notice instead
	    # of silently dropping the audio. The text reply is still returned in
	    # full; the frontend renders a small inline "voice unavailable" line
	    # under the bot bubble so the user understands why there's no voice
	    # (e.g. Sarvam 429 / no credits).
	    tts_error_code: Optional[str] = None
	    tts_user_message: Optional[str] = None
	    if req.return_audio and turn.reply_text:
	        try:
	            from backend.voice_format import tts_preprocess
	            # Send a CLEANED version of the reply to TTS — strip markdown,
	            # citations, expand acronyms, truncate. The text in the chat
	            # bubble remains the full structured reply.
	            spoken = tts_preprocess(
	                turn.reply_text,
	                language="indic" if req.tts_language_code.startswith("hi") else "en",
	                max_words=55,
	            )
	            # X8 — honor X-Preferred-Codec; on transcoding failure the provider
	            # falls back to raw WAV and reports audio_mime="audio/wav".
	            audio, audio_mime = await get_tts().synthesize_with_mime(
	                spoken,
	                language_code=req.tts_language_code,
	                preferred_codec=preferred_codec,
	            )
	            audio_b64 = base64.b64encode(audio).decode("utf-8")
	        except Exception as e:
	            # Don't fail the whole turn if TTS hiccups — but make the failure
	            # LOUD: classify it once at the boundary (closed enum, same
	            # contract as STT) so the client can render a friendly notice
	            # instead of showing a voice-less reply with no explanation.
	            from backend.providers.sarvam_tts import (
	                classify_tts_exception,
	                TTS_ERROR_USER_MESSAGES,
	                TTS_ERROR_UNKNOWN,
	            )
	            tts_error_code = classify_tts_exception(e)
	            tts_user_message = TTS_ERROR_USER_MESSAGES.get(
	                tts_error_code, TTS_ERROR_USER_MESSAGES[TTS_ERROR_UNKNOWN]
	            )
	            audio_b64 = None
	            audio_mime = None
	            # Server-side diagnostics keep the raw error; the client never
	            # sees the raw httpx string.
	            logging.warning(
	                "TTS failed (session=%s): error_code=%s exc=%s: %s",
	                session_id, tts_error_code, type(e).__name__, e,
	            )
	            # Guarded: this runs inside an except handler, so an unguarded
	            # logging failure would abort the otherwise-successful turn.
	            _log_turn_best_effort({
	                "session_id": session_id,
	                "tts_error": f"{type(e).__name__}: {e}",
	                "tts_error_code": tts_error_code,
	            })

	    # The payload is built inside the try as well, so a malformed turn
	    # attribute (e.g. citations=None) cannot block the reply either.
	    try:
	        log_turn({
	            "session_id": session_id,
	            "user_text": req.user_text,
	            "reply_text": turn.reply_text,
	            "brain_used": turn.brain_used,
	            "intent": turn.intent,
	            "language": turn.language,
	            "latency_ms": turn.latency_ms,
	            "retrieved_chunk_ids": turn.retrieved_chunk_ids,
	            "citation_count": len(turn.citations),
	            "faithfulness_passed": turn.faithfulness_passed,
	            "faithfulness_reasons": turn.faithfulness_reasons,
	            "blocked": turn.blocked,
	        })
	    except Exception:  # noqa: BLE001 — log IO must never block a reply
	        pass

	    # Cross-session profile persistence + returning-user detection removed
	    # in ADR-043 (2026-05-27). Sessions are in-memory only.
	    _returning_user_recalled = False

	    # Bug B defense — CitationOut requires page_start/page_end as ints, but
	    # single_brain.TurnResult.citations dicts don't carry those fields (its
	    # citation shape is {chunk_id, policy_id, policy_name, insurer_slug,
	    # doc_type, source_url, score}). Every citation dict is coerced to
	    # CitationOut's required fields, malformed ones are dropped, and the
	    # whole response build is wrapped so a validation error can never
	    # bypass the standard envelope.
	    try:
	        from backend.policy_identity import clean_display_policy_name
	        safe_citations: list[CitationOut] = []
	        for c in turn.citations or []:
	            if not isinstance(c, dict):
	                continue
	            try:
	                safe_citations.append(
	                    CitationOut(
	                        policy_id=str(c.get("policy_id", "") or ""),
	                        policy_name=clean_display_policy_name(
	                            str(c.get("policy_name", "") or "")
	                        ),
	                        insurer_slug=str(c.get("insurer_slug", "") or ""),
	                        page_start=int(c.get("page_start", 0) or 0),
	                        page_end=int(c.get("page_end", 0) or 0),
	                        source_url=str(c.get("source_url", "") or ""),
	                        score=float(c.get("score", 0.0) or 0.0),
	                    )
	                )
	            except Exception as _cite_err:  # noqa: BLE001
	                logging.warning(
	                    "drop malformed citation (session=%s): %s — payload=%r",
	                    session_id, _cite_err, c,
	                )

	        return ChatResponse(
	            reply_text=turn.reply_text,
	            citations=safe_citations,
	            brain_used=turn.brain_used,
	            intent=turn.intent,
	            language=turn.language,
	            latency_ms=turn.latency_ms,
	            session_id=session_id,
	            audio_base64=audio_b64,
	            audio_mime=audio_mime,
	            tts_error_code=tts_error_code,
	            tts_user_message=tts_user_message,
	            faithfulness_passed=turn.faithfulness_passed,
	            faithfulness_reasons=turn.faithfulness_reasons,
	            blocked=turn.blocked,
	            profile_updates=turn.profile_updates,
	            profile_complete=_compute_profile_complete(session_id),
	            returning_user_recalled=_returning_user_recalled,
	        )
	    except Exception as _resp_err:  # noqa: BLE001
	        # Anything else (TypeError/AttributeError/ValidationError) on the
	        # response-build path — return the standard error_fallback shape
	        # so the frontend always parses cleanly. Bug B catch-all.
	        logging.exception(
	            "chat response-build failed (session=%s): %s",
	            session_id, _resp_err,
	        )
	        return ChatResponse(
	            reply_text=(
	                "Sorry, something went wrong — try again"
	            ),
	            citations=[],
	            brain_used="error_fallback",
	            intent="qa",
	            language="en",
	            latency_ms=int((time.time() - t_chat0) * 1000),
	            session_id=session_id,
	            audio_base64=None,
	            audio_mime=None,
	            faithfulness_passed=True,
	            faithfulness_reasons=[],
	            blocked=False,
	            profile_updates={},
	            profile_complete=_compute_profile_complete(session_id),
	        )


	@app.get("/api/coverage", response_model=CoverageResponse)
	async def coverage():
	    """What policies/insurers are indexed in the corpus.

	    Drives the UI's "what's covered" panel — sets user expectations + reduces
	    over-refusals from off-corpus queries.
	    """
	    # Chunk total is informational; if the vector store is unavailable the
	    # endpoint still answers with total_chunks=0.
	    try:
	        from rag.retrieve import get_collection
	        coll = get_collection()
	        total = coll.count()
	    except Exception as _count_err:  # noqa: BLE001 — best-effort
	        logging.warning(
	            "coverage: chunk count unavailable (%s: %s)",
	            type(_count_err).__name__, _count_err,
	        )
	        total = 0

	    # Insurer metadata — names + home URLs are curated + verified
	    # (see eval/verified_urls.json + tools/verify_urls.py).
	    # KI-132 (2026-05-15) — expanded so /api/coverage also returns proper
	    # display names for every insurer slug.
	    insurer_meta = {
	        "acko": ("Acko Health Insurance", "https://www.acko.com/health-insurance/"),
	        "aditya-birla": ("Aditya Birla Health Insurance", "https://www.adityabirlacapital.com/healthinsurance"),
	        "bajaj-allianz": ("Bajaj Allianz General Insurance", "https://www.bajajallianz.com/"),
	        "care-health": ("Care Health Insurance", "https://www.careinsurance.com/"),
	        "cholamandalam": ("Cholamandalam MS General Insurance", "https://www.cholainsurance.com/"),
	        "go-digit": ("Go Digit General Insurance", "https://www.godigit.com/"),
	        "hdfc-ergo": ("HDFC ERGO General Insurance", "https://www.hdfcergo.com/"),
	        "icici-lombard": ("ICICI Lombard General Insurance", "https://www.icicilombard.com/"),
	        "iffco-tokio": ("IFFCO Tokio General Insurance", "https://www.iffcotokio.co.in/"),
	        "manipalcigna": ("ManipalCigna Health Insurance", "https://www.manipalcigna.com/"),
	        "national-insurance": ("National Insurance Company", "https://nationalinsurance.nic.co.in/"),
	        "new-india": ("New India Assurance", "https://www.newindia.co.in/"),
	        "niva-bupa": ("Niva Bupa Health Insurance", "https://www.nivabupa.com/"),
	        "indusind-general": ("IndusInd General Insurance (formerly Reliance General)", "https://www.indusind.com/general-insurance/"),
	        "oriental-insurance": ("Oriental Insurance Company", "https://orientalinsurance.org.in/"),
	        "reliance-general": ("Reliance General Insurance", "https://www.reliancegeneral.co.in/"),
	        "royal-sundaram": ("Royal Sundaram General Insurance", "https://www.royalsundaram.in/"),
	        "sbi-general": ("SBI General Insurance", "https://www.sbigeneral.in/"),
	        "star-health": ("Star Health & Allied Insurance", "https://www.starhealth.in/"),
	        "tata-aig": ("Tata AIG General Insurance", "https://www.tataaig.com/"),
	        "user-upload": ("Your uploaded policies", ""),
	    }

	    # policy -> source_url (verified at download time)
	    policy_urls: dict[tuple[str, str], str] = {}
	    by_insurer: dict[str, dict] = {}

	    # KI-135 (2026-05-15) — walk policies the SAME way /api/policies/all
	    # does (extracted/*.json + curated-facts pass-2) rather than reading
	    # Chroma metadata, which misses curated-facts policies that have no
	    # chunks yet.
	    # KI-129 + KI-130 invariants still hold (profile + regulatory excluded).
	    import json as _json
	    from backend.policy_identity import clean_display_policy_name
	    _DOCTYPE_RANK_COV = {"wordings": 0, "prospectus": 1, "cis": 2, "brochure": 3}

	    def _doctype_of_cov(stem: str) -> str:
	        """Return the ``__doctype`` suffix of a file stem, or "" if none."""
	        return stem.rsplit("__", 1)[1] if "__" in stem else ""

	    def _product_key_of_cov(pid: str) -> str:
	        """Return *pid* with its trailing ``__doctype`` suffix removed."""
	        return pid.rsplit("__", 1)[0] if "__" in pid else pid

	    def _uin_of_cov(record: dict) -> str:
	        """Return the stripped UIN of *record*, or "" when absent.

	        ``uin_code`` may be a plain string or a dict carrying it under
	        ``"value"``; anything that is not a string yields "".
	        """
	        uin = record.get("uin_code")
	        if isinstance(uin, dict):
	            uin = uin.get("value")
	        return uin.strip() if isinstance(uin, str) else ""

	    curated_facts = _load_curated_facts()
	    # Sorted by doctype rank first so that, per product, the
	    # highest-priority document (wordings) is visited first.
	    sorted_files = sorted(
	        settings.EXTRACTED_DIR.glob("*.json"),
	        key=lambda fp: (_DOCTYPE_RANK_COV.get(_doctype_of_cov(fp.stem), 99), fp.stem),
	    )
	    seen_product_keys: set[str] = set()
	    seen_policy_ids: set[str] = set()

	    # KI-141 (2026-05-15) — pre-compute the alias mapping (curated marketing
	    # renames whose source PDF maps to an extracted parent). These curated
	    # entries collapse onto the parent card; they DO NOT count separately.
	    #
	    # KI-142 (2026-05-15, REFACTORED) — UIN-primary invariant: 1 unique UIN
	    # = 1 unique marketplace card. Mirrors the /api/policies/all algorithm;
	    # see the long-form comment block in that endpoint for the rationale.
	    extracted_stems_cov = {fp.stem for fp in sorted_files}

	    # Phase A — extracted parents claim their UINs first. The parsed JSON is
	    # retained so Phase B (KI-145 material-diff check) and Pass 1 can reuse
	    # it without re-reading from disk. Unreadable files are skipped.
	    uin_to_parent_cov: dict[str, str] = {}
	    extracted_data_cov: dict[str, dict] = {}
	    for fp in sorted_files:
	        try:
	            _d = _json.loads(fp.read_text(encoding="utf-8"))
	        except Exception:
	            continue
	        extracted_data_cov[fp.stem] = _d
	        _u = _uin_of_cov(_d)
	        if _u:
	            uin_to_parent_cov.setdefault(_u, fp.stem)

	    direct_parent_cov: dict[str, str] = {}
	    curated_canonical_ids_cov: list[str] = []
	    # KI-145 — curated entries that failed the material-diffs gate (same UIN
	    # or source-PDF as a pass-1 card but >= 2 decision-critical fields
	    # disagree). These must emit as standalone pass-2 cards.
	    ki145_variant_curated_ids_cov: set[str] = set()

	    # Phase B — walk curated entries deterministically (sorted by policy_id).
	    for curated_pid, cdata in sorted(curated_facts.items()):
	        if curated_pid != cdata.get("policy_id", curated_pid):
	            continue
	        if curated_pid.endswith(("__wordings", "__brochure", "__cis", "__prospectus")):
	            continue
	        curated_canonical_ids_cov.append(curated_pid)

	        curated_uin = _uin_of_cov(cdata)

	        parent_id: str | None = None
	        if (
	            curated_uin
	            and curated_uin in uin_to_parent_cov
	            and uin_to_parent_cov[curated_uin] != curated_pid
	        ):
	            # KI-145 (2026-05-15) — same UIN ≠ same product. Compare
	            # decision-critical fields against the candidate parent; if
	            # 2+ disagree this is a VARIANT and stays as its own card.
	            # Pure RENAME (< 2 diffs) falls through to the alias-merge.
	            candidate = uin_to_parent_cov[curated_uin]
	            # Candidate may be extracted OR curated — fall back to curated
	            # facts when no extracted JSON exists, so the diff has real data.
	            cand_data = extracted_data_cov.get(candidate) or curated_facts.get(candidate, {})
	            if _ki145_material_diffs(cdata, cand_data) < 2:
	                parent_id = candidate
	            else:
	                ki145_variant_curated_ids_cov.add(curated_pid)
	        elif curated_uin:
	            # New UIN — claim it. KI-145 spec: UIN unmatched against any
	            # parent = standalone. Flag so pass-2 emits even if policy_id
	            # is a prefix of a seen extracted id.
	            uin_to_parent_cov[curated_uin] = curated_pid
	            ki145_variant_curated_ids_cov.add(curated_pid)

	        if parent_id is None and not curated_uin:
	            # KI-142 (preserved): source-PDF fallback only when curated entry
	            # has NO UIN. When UIN is present but unmatched, KI-145 spec
	            # mandates standalone — PDF coincidence cannot override.
	            fb_parent = _source_pdf_to_policy_id(cdata.get("_primary_source_pdf"))
	            if fb_parent and fb_parent in extracted_stems_cov and fb_parent != curated_pid:
	                ext_data = extracted_data_cov.get(fb_parent, {})
	                if _ki145_material_diffs(cdata, ext_data) < 2:
	                    parent_id = fb_parent
	                else:
	                    ki145_variant_curated_ids_cov.add(curated_pid)

	        if parent_id:
	            direct_parent_cov[curated_pid] = parent_id

	    # Phase C — chain-compress (see /api/policies/all for rationale).
	    aliased_curated_ids_cov: set[str] = set()
	    parent_pkey_alias_count: dict[str, int] = {}

	    def _terminal_parent_cov(start: str) -> str | None:
	        """Follow ``direct_parent_cov`` from *start* to the end of its chain.

	        Returns the last id in the chain, or None when *start* has no parent
	        or the chain loops (back to *start* or to an already-visited id).
	        """
	        seen_chain: set[str] = set()
	        cur = start
	        while True:
	            nxt = direct_parent_cov.get(cur)
	            if not nxt:
	                return cur if cur != start else None
	            if nxt in seen_chain or nxt == start:
	                return None
	            seen_chain.add(nxt)
	            cur = nxt

	    for curated_pid in curated_canonical_ids_cov:
	        if curated_pid not in direct_parent_cov:
	            continue
	        terminal = _terminal_parent_cov(curated_pid)
	        if not terminal:
	            continue
	        # Extracted parents are keyed by their doctype-stripped product key;
	        # curated parents by their full policy_id.
	        if terminal in extracted_stems_cov:
	            terminal_pkey = _product_key_of_cov(terminal)
	        else:
	            terminal_pkey = terminal
	        aliased_curated_ids_cov.add(curated_pid)
	        parent_pkey_alias_count[terminal_pkey] = parent_pkey_alias_count.get(terminal_pkey, 0) + 1

	    def _record_policy_cov(slug: str, count_key: str, pkey: str, name: str, url: str) -> None:
	        """Accumulate one policy into ``by_insurer`` / ``policy_urls``.

	        by_insurer entries:
	          products: set of product keys (*count_key*)
	          names:    display names in first-seen order (for sample display)
	          chunks:   number of policies recorded for the insurer
	          aliases:  KI-141 — curated rename entries merged into this
	                    insurer's parent cards (feeds alias_count)
	        NOTE(review): within this function only ``names`` and ``aliases``
	        are read back; the response's policy_count comes from the
	        marketplace counter further down.
	        """
	        bucket = by_insurer.setdefault(
	            slug, {"products": set(), "names": [], "chunks": 0, "aliases": 0}
	        )
	        bucket["products"].add(count_key)
	        bucket["aliases"] += parent_pkey_alias_count.get(pkey, 0)
	        if name not in bucket["names"]:
	            bucket["names"].append(name)
	        bucket["chunks"] += 1
	        # First URL seen for a (slug, display name) pair wins.
	        if url and (slug, name) not in policy_urls:
	            policy_urls[(slug, name)] = url

	    # Pass 1: extracted JSONs (KI-133 dedup by product_key — wordings wins).
	    # Reuses the payloads parsed in Phase A; stems that failed to parse
	    # there are absent from the cache and skipped here too.
	    for fp in sorted_files:
	        data = extracted_data_cov.get(fp.stem)
	        if data is None:
	            continue
	        pid = data.get("policy_id", fp.stem)
	        seen_policy_ids.add(pid)
	        slug = data.get("insurer_slug", "")
	        if slug == "regulatory":
	            continue
	        pkey = _product_key_of_cov(pid)
	        if pkey in seen_product_keys:
	            continue
	        seen_product_keys.add(pkey)
	        name = clean_display_policy_name(data.get("policy_name", "") or pid)
	        url = data.get("source_pdf_url", "")
	        _record_policy_cov(slug, pkey, pkey, name, url)

	    # Pass 2: curated-facts policies that have no extracted counterpart
	    for curated_pid, data in curated_facts.items():
	        if curated_pid != data.get("policy_id", curated_pid):
	            continue  # permutation alias
	        if curated_pid in seen_policy_ids:
	            continue
	        _is_variant = curated_pid in ki145_variant_curated_ids_cov
	        # KI-145 — bypass the startswith dedup for genuine variants (same
	        # UIN/source-PDF as a pass-1 card but materially different fields).
	        # Otherwise variant cards would be silently dropped here.
	        if not _is_variant and any(
	            eid.startswith(curated_pid + "__") for eid in seen_policy_ids
	        ):
	            continue
	        # KI-141 — skip curated entries that have already been collapsed into
	        # a parent's alias list.
	        if curated_pid in aliased_curated_ids_cov:
	            continue
	        seen_policy_ids.add(curated_pid)
	        slug = data.get("insurer_slug", "")
	        if slug == "regulatory":
	            continue
	        # Curated entries don't have a __doctype suffix, so use the full
	        # policy_id as the product_key.
	        pkey = curated_pid
	        # KI-145 — variants may share a product_key with a pass-1 sibling;
	        # let them past this dedup.
	        if pkey in seen_product_keys and not _is_variant:
	            continue
	        seen_product_keys.add(pkey)
	        name = clean_display_policy_name(
	            data.get("policy_name", "") or curated_pid
	        )
	        url = data.get("source_pdf_url", "")
	        # KI-145 — tag variant keys with a suffix in the counting set so a
	        # variant sharing its sibling's key still adds a distinct member.
	        count_key = f"{pkey}__ki145variant" if _is_variant else pkey
	        # KI-142 — alias count is looked up under the bare pkey (curated
	        # parents that claimed a new UIN, with later siblings aliasing
	        # onto them).
	        _record_policy_cov(slug, count_key, pkey, name, url)

	    # #80 — SINGLE SOURCE OF TRUTH. Derive the catalogue counts from the SAME
	    # de-duplicated marketplace the cards render from, so the header count can
	    # never drift from what the user actually sees (1 product = 1 card
	    # everywhere).
	    from collections import Counter as _Counter
	    _mp = await policies_all()
	    _pc = _Counter(p.insurer_slug for p in _mp.policies)

	    insurers_out = []
	    for slug, info in sorted(by_insurer.items()):
	        # KI-130 — regulatory is not an insurer; never a marketplace card.
	        if slug == "regulatory":
	            continue
	        product_count = _pc.get(slug, 0)
	        # Insurers with no marketplace card are left out of the panel.
	        if product_count == 0:
	            continue
	        sample_names = sorted(info["names"])[:8]
	        name, home_url = insurer_meta.get(slug, (slug, ""))
	        sample_entries = [
	            PolicyEntry(name=p, source_url=policy_urls.get((slug, p), ""))
	            for p in sample_names
	        ]
	        insurers_out.append(
	            InsurerCoverage(
	                slug=slug,
	                name=name,
	                home_url=home_url,
	                policy_count=product_count,
	                sample_policies=sample_entries,
	                alias_count=info.get("aliases", 0),
	            )
	        )

	    return CoverageResponse(
	        total_chunks=total,
	        total_policies=_mp.total,
	        total_insurers=_mp.insurers_indexed,
	        insurers=insurers_out,
	    )


	# Strong references to in-flight background extraction tasks. asyncio only
	# keeps weak references to tasks, so a fire-and-forget create_task() result
	# can be garbage-collected before it finishes; each task removes itself
	# from this set when it completes.
	_UPLOAD_BG_EXTRACTION_TASKS: set = set()


	@app.post("/api/upload-policy", response_model=UploadResponse)
	async def upload_policy(
	    request: Request,
	    file: UploadFile = File(...),
	    session_id: Optional[str] = Form(None),
	):
	    """Accept a user-uploaded PDF policy doc, chunk + embed it, and index it.

	    Pipeline, in order:
	      1. Cheap byte checks (PDF magic bytes, 25 MB ceiling).
	      2. Write the bytes to a uniquely named *staging* file so the PDF reader
	         has a path to open.
	      3. Catalogue-UIN dedup: if the document's UIN matches a catalogue
	         policy, return that card without indexing anything.
	      4. Security gates via ``check_upload``; a same-session hash-dedupe hit
	         short-circuits with the cached chunk count.
	      5. Chunk, embed, and add to the session-scoped quarantine collection;
	         only then is the staging file promoted to ``<slug>.pdf``.
	      6. Persist the upload and add the same chunks to the global
	         ``policies`` collection (#52), then bust the marketplace caches.
	      7. Kick off the background LLM extraction (ADR-044).

	    Args:
	        request: Incoming request; used only to derive the client IP.
	        file: The uploaded PDF.
	        session_id: Caller's session id; falls back to "anonymous" when
	            absent, for backwards compatibility.

	    Returns:
	        UploadResponse describing the indexed (or already-known) policy.

	    Raises:
	        HTTPException: 400 when the file is not a PDF, is rejected by the
	            security gates, or yields no text; 413 when it exceeds 25 MB;
	            500 for any other failure while indexing or persisting.
	    """
	    import re
	    import time as _time
	    from pathlib import Path as _PathLib

	    _log = logging.getLogger(__name__)

	    t0 = _time.time()
	    contents = await file.read()
	    if not contents.startswith(b"%PDF"):
	        raise HTTPException(400, "File does not look like a PDF (magic bytes wrong).")
	    if len(contents) > 25 * 1024 * 1024:
	        raise HTTPException(413, "PDF too large (>25 MB). Use a smaller file.")

	    sid = session_id or "anonymous"

	    # Slugify filename for policy_id
	    raw = file.filename or "user_upload.pdf"
	    stem = _PathLib(raw).stem
	    slug = re.sub(r"[^a-zA-Z0-9]+", "-", stem.lower()).strip("-")[:80] or "user-upload"
	    # NOTE(review): sid is caller-supplied and is embedded unsanitised; the
	    # resulting policy_id is later used as a directory name under
	    # uploaded_docs_dir() — confirm persist_upload rejects path separators.
	    policy_id = f"user-upload__{sid[:12]}__{slug}"
	    policy_name = stem.replace("_", " ").replace("-", " ").title()

	    # Save to disk so ingest can read with pdfplumber.
	    #
	    # The bytes go to a uniquely named STAGING file, not straight to
	    # out_path. out_path is keyed by filename slug only, so writing to it
	    # directly meant that a rejected upload, a UIN hit, or a dedupe
	    # short-circuit for a same-named file first overwrote and then (via the
	    # orphan guard) deleted the PDF that previously indexed chunks still
	    # reference through metadata.local_path. With staging, a previously
	    # promoted file is never touched unless this upload is itself indexed.
	    # NOTE(review): out_path is still shared by every session that uploads
	    # the same filename — confirm whether it should be session-scoped.
	    user_dir = settings.CORPUS_DIR / "user-upload"
	    user_dir.mkdir(parents=True, exist_ok=True)
	    out_path = user_dir / f"{slug}.pdf"
	    staging_path = user_dir / f"{slug}.{uuid.uuid4().hex[:12]}.staging.pdf"
	    staging_path.write_bytes(contents)

	    # Ingest just this one file
	    try:
	        from rag.ingest import (
	            _abort_if_hnsw_bloated,
	            chunk_pages,
	            get_quarantine_collection,
	            read_pdf_pages,
	        )
	        from backend.providers.local_embeddings import LocalEmbeddings as _Emb
	        from backend.security import check_upload, rate_limiter

	        pages = read_pdf_pages(staging_path)
	        # Run 8-gate security check (dedupe + mechanics + encrypted + content +
	        # page ceiling + injection + per-session + per-IP rate limit + LLM judge)
	        full_text = "\n".join(t for _, t in pages)
	        # #47 — UIN net-new dedup: if the uploaded PDF's IRDAI UIN already
	        # belongs to a catalogue policy it is NOT net-new — return the
	        # existing card instead of indexing a duplicate. The staging file
	        # is removed by the finally block.
	        _uin_hit = _match_catalogue_uin(full_text)
	        if _uin_hit:
	            return UploadResponse(
	                policy_id=_uin_hit[0],
	                policy_name=_uin_hit[1],
	                chunks_added=0,
	                pages_indexed=len(pages),
	                elapsed_ms=int((_time.time() - t0) * 1000),
	                already_in_catalogue=True,
	                existing_policy_id=_uin_hit[0],
	                existing_policy_name=_uin_hit[1],
	            )
	        client_ip = (request.client.host if request and request.client else "") or request.headers.get("X-Forwarded-For", "").split(",")[0].strip()
	        verdict = await check_upload(
	            content=contents,
	            extracted_text=full_text,
	            page_count=len(pages),
	            session_id=sid,
	            ip=client_ip,
	        )
	        if not verdict.accepted:
	            # File cleanup handled uniformly in the finally block — no
	            # explicit unlink needed here.
	            raise HTTPException(
	                400,
	                f"Upload rejected by security gates: {', '.join(verdict.reasons[:3])}",
	            )
	        # If the dedupe gate found this exact (hash, session) already indexed,
	        # skip chunking + embedding entirely and return the cached chunk count.
	        # The bytes are already represented by the previously-indexed chunks;
	        # only the redundant staging copy is removed, the earlier promoted
	        # PDF stays on disk.
	        if verdict.cached_chunks is not None:
	            return UploadResponse(
	                policy_id=policy_id,
	                policy_name=policy_name,
	                chunks_added=verdict.cached_chunks,
	                pages_indexed=len(pages),
	                elapsed_ms=int((_time.time() - t0) * 1000),
	            )
	        # Successful pass — record IP-level upload for rate-limit ledger
	        from backend.security import record_ip_upload, record_accept
	        import hashlib as _hashlib
	        record_ip_upload(client_ip)

	        chunks = list(chunk_pages(pages))
	        if not chunks:
	            raise HTTPException(400, "Could not extract any text from the PDF (scanned image-only?).")

	        # Quarantine HNSW bloat guard (2026-05-16) — fail fast BEFORE we
	        # spend an embed call if a prior ingest/upload already bloated the
	        # on-disk index. Raises RuntimeError on trip; the broad except
	        # below converts it to a clean HTTP 500 rather than letting the
	        # index grow into a disk-fill incident.
	        _abort_if_hnsw_bloated()

	        embedder = _Emb()
	        texts = [c["text"] for c in chunks]
	        vectors = await embedder.embed(texts, input_type="document")

	        ids = [f"{policy_id}::chunk{c['chunk_idx']}" for c in chunks]
	        metadatas = [
	            {
	                "policy_id": policy_id,
	                "insurer_slug": "user-upload",
	                "policy_name": policy_name,
	                "doc_type": "user_upload",
	                "source_url": "",
	                "page_start": c["page_start"],
	                "page_end": c["page_end"],
	                "chunk_idx": c["chunk_idx"],
	                # Final (post-promotion) location, not the staging path.
	                "local_path": str(out_path),
	                "session_id": sid,
	            }
	            for c in chunks
	        ]
	        collection = get_quarantine_collection()
	        # Remove any existing chunks under this policy_id (re-upload case)
	        try:
	            collection.delete(where={"policy_id": policy_id})
	        except Exception:  # noqa: BLE001 — nothing to delete on first upload
	            pass
	        collection.add(ids=ids, documents=texts, embeddings=vectors, metadatas=metadatas)
	        # Index write succeeded — promote the staging file to the path the
	        # chunk metadata references. From here on the finally block has
	        # nothing left to delete.
	        staging_path.replace(out_path)
	        # Post-add bloat guard — catch a bloat THIS upload caused (e.g. a
	        # ChromaDB version / batch-size pathology).
	        _abort_if_hnsw_bloated()
	        # TTL bookkeeping — remember when this session last touched the
	        # quarantine collection so the periodic purge task can evict its
	        # chunks after the configured idle window.
	        _quarantine_touch(sid, policy_id)
	        # Update rate-limit ledger after successful index
	        rate_limiter.record_upload(sid, len(chunks))
	        # Cache this content hash → chunk count so an identical re-upload in
	        # the same session short-circuits via the dedupe gate.
	        try:
	            sha = _hashlib.sha256(contents).hexdigest()
	            record_accept(sha, sid, len(chunks))
	        except Exception:  # noqa: BLE001 — dedupe cache is best-effort
	            _log.warning("upload dedupe-cache record failed for %s", policy_id, exc_info=True)

	        # ---- #52: PERSIST + add to THE (global) marketplace ----------------
	        # The session-scoped quarantine add above is the immediate, private
	        # path. #52 additionally requires the uploaded doc to become a REAL,
	        # GRADED, PERSISTENT marketplace card that survives a restart. So we:
	        #   (1) persist the raw PDF + a curated-facts-shaped record + the
	        #       chunk payload via uploaded_docs.persist_upload,
	        #   (2) add the SAME chunks to the GLOBAL `policies` collection so
	        #       they're retrievable for everyone — global visibility is
	        #       intentional; only the uploaded document itself is exposed,
	        #       never any session profile,
	        #   (3) invalidate the marketplace-grade cache so the new card
	        #       grades immediately.
	        # ANY failure here MUST surface (no silent failure): a 200 that
	        # didn't persist would violate the #52 contract.
	        from backend import uploaded_docs as _udocs

	        _record = _udocs.persist_upload(
	            policy_id=policy_id,
	            policy_name=policy_name,
	            pdf_bytes=contents,
	            full_text=full_text,
	            chunks=chunks,
	            session_id=sid,
	        )
	        # Global-collection ingest (idempotent — keyed by policy_id).
	        from rag.ingest import get_chroma_collection as _get_pol_coll
	        _pol = _get_pol_coll()
	        _g_ids = [f"{policy_id}::chunk{c['chunk_idx']}" for c in chunks]
	        # Use whatever insurer_slug the persisted record resolved (falling
	        # back to UPLOAD_INSURER_SLUG) so chunk metadata + scorecard reviews
	        # lookup agree.
	        _resolved_insurer_slug = _record.get("insurer_slug", _udocs.UPLOAD_INSURER_SLUG)
	        _g_meta = [
	            {
	                "policy_id": policy_id,
	                "insurer_slug": _resolved_insurer_slug,
	                "policy_name": policy_name,
	                "doc_type": _udocs.UPLOAD_DOC_TYPE,
	                "source_url": "",
	                "page_start": c["page_start"],
	                "page_end": c["page_end"],
	                "chunk_idx": c["chunk_idx"],
	                # GLOBAL by design — NO session_id on these chunks.
	            }
	            for c in chunks
	        ]
	        try:
	            _pol.delete(where={"policy_id": policy_id})
	        except Exception:  # noqa: BLE001 — nothing to delete on first upload
	            pass
	        _pol.add(ids=_g_ids, documents=texts, embeddings=vectors, metadatas=_g_meta)
	        _abort_if_hnsw_bloated()
	        # Bust the grade cache + the corpus-pdf index so the new card
	        # appears immediately with a real grade.
	        try:
	            global _CORPUS_PDF_IDX
	            _CORPUS_PDF_IDX = None
	            with _MG_LOCK:
	                _MG_CACHE["sig"] = None
	                _MG_CACHE["index"] = None
	        except Exception:  # noqa: BLE001 — cache bust is best-effort
	            _log.warning("marketplace cache bust failed after upload %s", policy_id, exc_info=True)

	        # ── Fire LLM-assisted extraction in background (ADR-044) ─────────
	        # The upload HTTP response returns now and the frontend polls
	        # /api/upload/extraction-status/{policy_id} to know when the
	        # card-bearing chat message should be pushed. A failure to start
	        # the extraction leaves the heuristic record intact and NEVER
	        # blocks or fails this request — but it is logged, not swallowed.
	        try:
	            _persisted_pdf = _udocs.uploaded_docs_dir() / policy_id / "source.pdf"
	            _detected_insurer_name = _record.get(
	                "insurer_name",
	                _udocs.detected_insurer_name(_resolved_insurer_slug)
	                if _resolved_insurer_slug != _udocs.UPLOAD_INSURER_SLUG
	                else _udocs.UPLOAD_INSURER_NAME,
	            )
	            # Pre-stamp "pending" so a frontend poll that arrives BEFORE
	            # the extraction task first runs still sees a known state.
	            await _udocs._set_extraction_status(
	                policy_id,
	                status="pending",
	                policy_name=policy_name,
	                insurer_slug=_resolved_insurer_slug,
	                started_at=None,
	                completed_at=None,
	                completeness_pct=None,
	                overall_grade=None,
	                error=None,
	            )
	            _task = asyncio.create_task(
	                _udocs.extract_one_for_upload(
	                    policy_id=policy_id,
	                    pdf_path=_persisted_pdf,
	                    policy_name=policy_name,
	                    insurer_slug=_resolved_insurer_slug,
	                    insurer_name=_detected_insurer_name,
	                )
	            )
	            # Hold a strong reference until the task finishes.
	            _UPLOAD_BG_EXTRACTION_TASKS.add(_task)
	            _task.add_done_callback(_UPLOAD_BG_EXTRACTION_TASKS.discard)
	        except Exception:  # noqa: BLE001 — extraction is async + optional
	            _log.exception("could not start background extraction for %s", policy_id)
	    except HTTPException:
	        raise
	    except Exception as e:
	        raise HTTPException(500, f"Indexing failed: {type(e).__name__}: {e}") from e
	    finally:
	        # Orphan-file guard — the staging copy must never outlive the
	        # request. After a successful promotion it no longer exists, so
	        # this is a no-op; on every other exit it removes the temp file.
	        # Best-effort: a cleanup failure must never mask the real
	        # response/exception.
	        try:
	            staging_path.unlink(missing_ok=True)
	        except Exception:  # noqa: BLE001
	            pass

	    return UploadResponse(
	        policy_id=policy_id,
	        policy_name=policy_name,
	        chunks_added=len(chunks),
	        pages_indexed=len(pages),
	        elapsed_ms=int((_time.time() - t0) * 1000),
	    )


	# ---------------------------------------------------------------------------
	# GET /api/upload/extraction-status/{policy_id} — frontend poll target
	# (ADR-044, 2026-05-27).
	#
	# After the upload endpoint returns, the chat flow needs to know when
	# the background LLM extraction completes so it can push the card-bearing
	# assistant message into chat with the FULL data (not the heuristic
	# stub). This endpoint exposes _UPLOAD_EXTRACTION_STATUS so the
	# frontend can poll every ~3s for up to ~120s.
	# ---------------------------------------------------------------------------


	# Response body for GET /api/upload/extraction-status/{policy_id}: a snapshot
	# of one upload's background LLM-extraction state. Only policy_id and status
	# are required; every other field defaults to None.
	class ExtractionStatusResponse(BaseModel):
	policy_id: str
	status: str # "pending" | "running" | "complete" | "failed" | "unknown"
	policy_name: Optional[str] = None
	insurer_slug: Optional[str] = None
	# Timestamps are carried as strings; the exact format is set by the
	# producer of the status record, which is not visible in this file section.
	started_at: Optional[str] = None
	completed_at: Optional[str] = None
	completeness_pct: Optional[float] = None
	overall_grade: Optional[str] = None
	error: Optional[str] = None
	# 2026-05-27 — provenance: which LLM landed the extraction
	# ('gemini-2.5-flash#1' / 'gemini-2.5-flash#2' / 'gemini-2.5-flash#3' /
	# 'nim-fallback' / None on heuristic-only fallback).
	llm_used: Optional[str] = None
	llm_response_chars: Optional[int] = None


	@app.post("/api/admin/upload/reextract")
	async def admin_reextract_uploads(
	    request: Request,
	    x_admin_password: Optional[str] = Header(default=None, alias="X-Admin-Password"),
	    force: bool = False,
	):
	    """Backfill LLM-assisted extraction for already-persisted uploads.

	    Admin-gated: the request and the ``X-Admin-Password`` header are handed
	    to ``backend.admin._check_admin`` before any work starts. The backfill
	    is awaited inline, so the HTTP response carries its summary.

	    Intended for uploads that were persisted before the LLM-extraction
	    pipeline was wired and need upgrading without a re-upload.

	    Args:
	        request: Incoming request, forwarded to the admin check.
	        x_admin_password: Value of the ``X-Admin-Password`` header, if any.
	        force: Forwarded to ``backfill_extractions``; per the original
	            contract ``true`` re-extracts every upload rather than only
	            those without an extracted JSON.

	    Returns:
	        Whatever summary ``uploaded_docs.backfill_extractions`` produces.
	    """
	    from backend.admin import _check_admin

	    # Authorise first; nothing below runs for a rejected caller.
	    _check_admin(request, x_admin_password)

	    from backend import uploaded_docs as _udocs

	    return await _udocs.backfill_extractions(force=force)


	@app.get(
	    "/api/upload/extraction-status/{policy_id}",
	    response_model=ExtractionStatusResponse,
	)
	async def upload_extraction_status(policy_id: str):
	    """Report where a per-upload LLM-assisted extraction currently stands.

	    When no status record exists for ``policy_id`` (stale id, or an upload
	    made on a previous container) the reply carries ``status="unknown"``
	    so the polling client has an unambiguous signal to stop.

	    Args:
	        policy_id: Identifier returned by the upload endpoint.

	    Returns:
	        ExtractionStatusResponse mirroring the stored status record.
	    """
	    from backend import uploaded_docs as _udocs

	    record = _udocs.get_extraction_status(policy_id)
	    if not record:
	        return ExtractionStatusResponse(policy_id=policy_id, status="unknown")

	    current_status = record.get("status", "unknown")
	    # Every remaining field is copied through verbatim; a key missing from
	    # the record becomes None.
	    passthrough_keys = (
	        "policy_name",
	        "insurer_slug",
	        "started_at",
	        "completed_at",
	        "completeness_pct",
	        "overall_grade",
	        "error",
	        "llm_used",
	        "llm_response_chars",
	    )
	    details = {key: record.get(key) for key in passthrough_keys}
	    return ExtractionStatusResponse(
	        policy_id=policy_id,
	        status=current_status,
	        **details,
	    )


	# One entry of ScorecardResponse.sub_scores: a single named criterion with
	# its integer score, a short summary and the list of signal strings behind it.
	class ScorecardSubScore(BaseModel):
	name: str
	score: int
	summary: str
	signals: list[str]


	class ProfileSummaryModel(BaseModel):
	"""Deterministic, profile-aware {strengths, caveat} (see
	backend.scorecard.build_profile_summary). Rendered at the TOP of every
	scorecard surface; the frontend falls back to one_liner when strengths
	is empty / insufficient. Optional with a default so every existing
	construction path (compare, insufficient-data) stays valid."""
	# Defaults to a fresh empty list per instance (default_factory).
	strengths: list[str] = Field(default_factory=list)
	# Single optional caveat line; None when there is nothing to flag.
	caveat: Optional[str] = None


	# Response model shared by POST /api/profile and
	# GET /api/profile/completeness: how much of the user's profile is known,
	# which slots are collected vs. missing, and the current profile snapshot.
	class ProfileCompletenessResponse(BaseModel):
	completeness: float # 0.0 - 1.0
	completeness_pct: int # 0 - 100
	fields_collected: list[str]
	fields_missing: list[str]
	is_personalized: bool # True if completeness >= threshold
	# Both endpoints in this file compare against a literal 0.6 when setting
	# is_personalized; this default mirrors that value.
	gate_threshold: float = 0.6
	next_question_hint: Optional[str] = None
	profile: dict = Field(default_factory=dict) # current profile state for UI to render
	session_id: Optional[str] = None


	# Request body for POST /api/profile. Only session_id is required; every
	# profile field is optional, and the endpoint skips any field left as None
	# (or sent as "" / []), so partial saves never clear stored values.
	class ProfileUpdateRequest(BaseModel):
	session_id: str
	name: Optional[str] = None # KI-077
	age: Optional[int] = None
	dependents: Optional[str] = None
	income_band: Optional[str] = None
	existing_cover_inr: Optional[int] = None
	primary_goal: Optional[str] = None
	location_tier: Optional[str] = None
	parents_to_insure: Optional[bool] = None
	parents_age_max: Optional[int] = None
	parents_has_ped: Optional[bool] = None
	health_conditions: Optional[list[str]] = None
	budget_band: Optional[str] = None
	budget_inr: Optional[int] = None # #64 — exact ₹/yr from the slider
	# Collected by the profile-builder UI; also present on the Profile
	# dataclass + chat-path save_profile_field. Whitelisted here so
	# POST /api/profile accepts them.
	desired_sum_insured_inr: Optional[int] = None
	copay_pct: Optional[int] = None
	family_medical_history: Optional[list[str]] = None
	smoker: Optional[bool] = None


	# Request body for POST /api/session/reset. With drop_profile=True the
	# endpoint answers HTTP 400 unless confirm is also True.
	class SessionResetRequest(BaseModel):
	session_id: str
	drop_profile: bool = False # True = nuke session entirely; False = clear chat only
	confirm: bool = False # KI-095 — must be True when drop_profile=True; guards accidental wipes


	# Response body for POST /api/session/reset.
	class SessionResetResponse(BaseModel):
	# The endpoint always sets ok=True on a normal return; failures surface as
	# HTTP errors instead.
	ok: bool
	session_id: Optional[str] = None # new session_id when drop_profile=True
	# Result of reset_session() when drop_profile=True, otherwise False.
	cleared_state: bool


	# Request body for POST /api/session/clear: the session whose in-memory
	# state should be wiped.
	class SessionClearRequest(BaseModel):
	session_id: str


	# Response body for POST /api/session/clear.
	class SessionClearResponse(BaseModel):
	# Result of clear_session(); False when the request carried an empty id.
	cleared: bool
	# Freshly minted id (12 hex chars of a uuid4) the frontend must adopt.
	new_session_id: str


	@app.post("/api/session/clear", response_model=SessionClearResponse)
	async def session_clear(req: SessionClearRequest):
	    """Forget a session and hand the caller a brand-new session id.

	    The in-memory state stored under ``req.session_id`` is wiped and the
	    reply ALWAYS carries a freshly generated id that the frontend must use
	    from now on.

	    Post-ADR-043 (2026-05-27) nothing is preserved across sessions — there
	    is no on-disk profile left to keep — so a clear is a complete forget.

	    Body : {session_id: str}
	    Reply: {cleared: bool, new_session_id: str}
	    """
	    from backend.session_state import clear_session

	    # An empty session_id has nothing to wipe; report cleared=False.
	    was_cleared = False
	    if req.session_id:
	        was_cleared = clear_session(req.session_id)

	    fresh_id = uuid.uuid4().hex[:12]
	    return SessionClearResponse(cleared=was_cleared, new_session_id=fresh_id)


	@app.post("/api/session/reset", response_model=SessionResetResponse)
	async def session_reset(req: SessionResetRequest):
	    """KI-020 — user-facing "clear chat" / "start fresh" switch.

	    Behaviour depends on ``req.drop_profile``:

	    * ``False`` — nothing changes server-side. The frontend wipes its own
	      visible message history and the stored profile is kept, so the next
	      message resumes with what the bot already knows.
	    * ``True`` — the server-side session is dropped via ``reset_session``
	      and the reply carries a fresh session id for the frontend to adopt.
	      Requires ``confirm=True`` (KI-095) so a misclick or replayed request
	      cannot wipe a populated session by accident.

	    Raises:
	        HTTPException: 400 when ``drop_profile`` is set without ``confirm``.
	    """
	    from backend.session_state import reset_session

	    # Light-touch mode: acknowledge and leave server state alone.
	    if not req.drop_profile:
	        return SessionResetResponse(ok=True, session_id=None, cleared_state=False)

	    if not req.confirm:
	        raise HTTPException(status_code=400, detail="confirm=true required to drop session")

	    dropped = reset_session(req.session_id)
	    replacement_id = uuid.uuid4().hex[:12]
	    return SessionResetResponse(ok=True, session_id=replacement_id, cleared_state=dropped)


	@app.post("/api/profile", response_model=ProfileCompletenessResponse)
	async def profile_update(req: ProfileUpdateRequest):
	    """Store client-supplied profile fields on the session and report completeness.

	    Every whitelisted field the client actually sent (anything other than
	    ``None``, ``""`` or ``[]``) is written onto the session's profile and
	    recorded in ``profile.asked`` so the completeness scorer counts it
	    (KI-196 / ADR-041). The reply carries the recomputed completeness so
	    the frontend can reveal personalised scores straight away.

	    Since ADR-043 (2026-05-27) the captured fields live only in the
	    in-memory session state; there is no cross-session persistence and no
	    profile-RAG upsert.

	    Returns:
	        ProfileCompletenessResponse with the updated profile snapshot.
	    """
	    from backend.scorecard import profile_completeness as _completeness
	    from backend.session_state import get_session

	    accepted_fields = (
	        "name",  # KI-077 — accept name updates from the profile-builder UI
	        "age", "dependents", "income_band", "existing_cover_inr", "primary_goal",
	        "location_tier", "parents_to_insure", "parents_age_max", "parents_has_ped",
	        "health_conditions", "budget_band", "budget_inr",
	        "desired_sum_insured_inr", "copay_pct", "family_medical_history", "smoker",
	    )
	    blank_inputs = (None, "", [])

	    sess = get_session(req.session_id)
	    for attr in accepted_fields:
	        incoming = getattr(req, attr, None)
	        # KI-095 — an empty value from the client never clobbers a filled slot.
	        if incoming in blank_inputs:
	            continue
	        setattr(sess.profile, attr, incoming)
	        # KI-196 (ADR-041) — flag the slot as explicitly answered; without it
	        # the value lands on the profile but completeness ignores it.
	        if attr not in sess.profile.asked:
	            sess.profile.asked.append(attr)

	    profile = sess.profile
	    # KI-271 — snapshot is driven by brain_tools.SLOT_UNION so every slot
	    # (copay_pct, family_medical_history, desired_sum_insured_inr, ...)
	    # reaches the response.
	    snapshot = {}
	    for slot in brain_tools.SLOT_UNION:
	        snapshot[slot] = getattr(profile, slot, None)

	    # KI-196 (ADR-041) — only answered slots count toward completeness.
	    answered_slots = set(getattr(profile, "asked", []) or [])
	    scorer_input = {}
	    fields_collected = []
	    fields_missing = []
	    for slot, value in snapshot.items():
	        was_answered = slot in answered_slots
	        scorer_input[slot] = value if was_answered else None
	        if was_answered and value not in (None, "", [], False):
	            fields_collected.append(slot)
	        if not was_answered or value in (None, "", []):
	            fields_missing.append(slot)

	    score = _completeness(scorer_input)

	    return ProfileCompletenessResponse(
	        completeness=score,
	        completeness_pct=int(score * 100),
	        fields_collected=fields_collected,
	        fields_missing=fields_missing,
	        is_personalized=score >= 0.6,
	        profile=snapshot,
	        session_id=req.session_id,
	    )


	@app.get("/api/profile/completeness", response_model=ProfileCompletenessResponse)
	async def profile_completeness_view(session_id: Optional[str] = None):
	    """Report how much of the user's profile is known for a session.

	    The frontend gates the personalised scorecard on this: below a
	    completeness of 0.6 it shows insurer-level metrics only, not the
	    per-user grade. Without a ``session_id`` an all-empty response with a
	    generic "start the chat" hint is returned.

	    Args:
	        session_id: Session to inspect; optional.

	    Returns:
	        ProfileCompletenessResponse for the session's current profile.
	    """
	    from backend.scorecard import profile_completeness as _completeness
	    from backend.session_state import get_session
	    from backend.needs_finder import next_question

	    if not session_id:
	        return ProfileCompletenessResponse(
	            completeness=0.0,
	            completeness_pct=0,
	            fields_collected=[],
	            fields_missing=[],
	            is_personalized=False,
	            next_question_hint="Start the chat and tell me about your situation",
	        )

	    profile = get_session(session_id).profile
	    # KI-271 — snapshot built from brain_tools.SLOT_UNION so every captured
	    # slot (desired_sum_insured_inr, copay_pct, family_medical_history, ...)
	    # is reported instead of a hand-rolled subset.
	    snapshot = {slot: getattr(profile, slot, None) for slot in brain_tools.SLOT_UNION}

	    # KI-196 (ADR-041) — completeness gates on Profile.asked: a slot the
	    # user never answered is scored as if it were empty.
	    answered_slots = set(getattr(profile, "asked", []) or [])
	    scorer_input = {
	        slot: (value if slot in answered_slots else None)
	        for slot, value in snapshot.items()
	    }
	    score = _completeness(scorer_input)

	    fields_collected = [
	        slot
	        for slot, value in snapshot.items()
	        if slot in answered_slots and value not in (None, "", [], False)
	    ]
	    fields_missing = [
	        slot
	        for slot, value in snapshot.items()
	        if slot not in answered_slots or value in (None, "", [])
	    ]

	    # next_question yields the field name of the next missing slot; the
	    # frontend uses it as a slot hint only. Any failure degrades to no hint.
	    try:
	        slot_hint = next_question(profile)
	    except Exception:
	        slot_hint = None

	    return ProfileCompletenessResponse(
	        completeness=score,
	        completeness_pct=int(score * 100),
	        fields_collected=fields_collected,
	        fields_missing=fields_missing,
	        is_personalized=score >= 0.6,
	        next_question_hint=slot_hint,
	        profile=snapshot,
	        session_id=session_id,
	    )


	# Graded scorecard for one policy: headline score + letter grade, the
	# per-criterion breakdown, and how complete the underlying data was.
	# Also embedded (optionally) in CompareEntry.scorecard.
	class ScorecardResponse(BaseModel):
	policy_id: str
	policy_name: str
	insurer_slug: str
	overall_score: int
	grade: str
	one_liner: str
	sub_scores: list[ScorecardSubScore]
	data_completeness_pct: float
	methodology_link: str
	# True ⇒ this policy had too little structured data to grade honestly.
	# The response is still a valid HTTP-200 ScorecardResponse (grade "—",
	# overall_score 0, empty sub_scores, an honest one_liner) so the frontend
	# renders a truthful "not enough data yet" state instead of the generic
	# Retry fallback or a fabricated grade. Optional w/ default so the
	# existing /api/policies/compare construction (no flag) stays valid.
	insufficient_data: bool = False
	# Deterministic, profile-aware {strengths, caveat} computed on the same
	# pass as the grade. Optional w/ default so every construction path
	# (compare with no summary, insufficient-data) stays valid.
	profile_summary: Optional[ProfileSummaryModel] = None


	# One policy column in a comparison response (see CompareResponse.policies).
	class CompareEntry(BaseModel):
	policy_id: str
	policy_name: str
	insurer_slug: str
	# Free-form mapping of compared values; its key/value schema is decided by
	# the code that builds it, which is not visible in this section.
	fields: dict
	# Optional: the entry may be returned without a graded scorecard.
	scorecard: Optional[ScorecardResponse] = None


	# Envelope for a policy comparison: the compared entries plus a list of
	# field names (presumably the display order for CompareEntry.fields keys —
	# confirm against the endpoint that builds it).
	class CompareResponse(BaseModel):
	policies: list[CompareEntry]
	field_order: list[str]


	class MarketplacePolicy(BaseModel):
	    # One marketplace card: identity + grade headline, followed by the
	    # filterable policy facts. All fact fields are optional; the "before"
	    # validators below coerce loosely-typed curated values and degrade an
	    # unparseable value to None (or skip it, for lists) instead of failing
	    # validation for the whole policy.
	    policy_id: str
	    policy_name: str
	    insurer_slug: str
	    insurer_name: str
	    insurer_home_url: str
	    source_pdf_url: Optional[str] = None
	    grade: str
	    overall_score: int
	    one_liner: str
	    data_completeness_pct: float
	    # Deterministic, profile-aware {strengths, caveat}. Populated from the
	    # SAME build_scorecard pass that produced `grade`. None when the catalogue
	    # was built profile-neutrally and no facts qualified.
	    profile_summary: Optional[ProfileSummaryModel] = None
	    # Headline filterable fields
	    min_entry_age: Optional[int] = None
	    max_entry_age: Optional[int] = None
	    sum_insured_options: list[int] = Field(default_factory=list)
	    # #81 — cover presented as a RANGE (min – max), never a discrete ladder
	    # or a single deterministic number.
	    # SI RATIONALISATION (D1/D3) — sum_insured_options / _min / _max are now
	    # the SOURCE-QUOTE-CORROBORATED set only (backend/sum_insured.py). Values
	    # the field's own source_quote does not genuinely state are dropped, so
	    # the marketplace never shows an SI the policy document doesn't back.
	    #   • sum_insured_is_band — True only when the corroborated set is a
	    #     genuine continuous band (range language + wide min→max). The
	    #     frontend renders "₹X – ₹Y"; otherwise it lists the discrete tiers.
	    #   • sum_insured_tiers — the corroborated discrete plan amounts
	    #     (== sum_insured_options; kept as an explicit, named field so the
	    #     display contract is unambiguous on the frontend).
	    sum_insured_min: Optional[int] = None
	    sum_insured_max: Optional[int] = None
	    sum_insured_is_band: bool = False
	    sum_insured_tiers: list[int] = Field(default_factory=list)
	    pre_existing_disease_waiting_months: Optional[int] = None
	    initial_waiting_period_days: Optional[int] = None
	    maternity_waiting_months: Optional[int] = None
	    copayment_pct: Optional[float] = None
	    network_hospital_count: Optional[int] = None
	    no_claim_bonus_pct: Optional[int] = None
	    ayush_coverage: Optional[bool] = None
	    maternity_coverage: Optional[bool] = None
	    cashless_treatment_supported: Optional[bool] = None
	    room_rent_capping: Optional[str] = None
	    # #86 — sourced insurer-level network: the official list URL + the
	    # official stated count (when the insurer publishes one). Replaces the
	    # web-backfilled per-policy network_hospital_count for display.
	    network_list_url: Optional[str] = None
	    network_count_official: Optional[int] = None
	    network_list_is_pdf: bool = False

	    # #73/#76 — the curated re-extraction legitimately writes non-numeric
	    # honest values (e.g. max_entry_age "No maximum age (Lifelong)", a
	    # fractional no_claim_bonus_pct). Previously these raised ValidationError
	    # and the ENTIRE policy was dropped from the marketplace. Coerce at the
	    # model so any construction path self-heals: keep a parseable number,
	    # else degrade that ONE field to None — never drop the policy.
	    @field_validator(
	        "min_entry_age", "max_entry_age", "pre_existing_disease_waiting_months",
	        "initial_waiting_period_days", "maternity_waiting_months",
	        "network_hospital_count", "no_claim_bonus_pct",
	        "network_count_official", mode="before",
	    )
	    @classmethod
	    def _coerce_optional_int(cls, v):
	        """Return ``v`` as an int when it parses as a number, else None."""
	        # bool is an int subclass; True/False is never a meaningful count.
	        if v is None or isinstance(v, bool):
	            return None
	        if isinstance(v, int):
	            return v
	        try:
	            return int(round(float(str(v).replace(",", "").strip())))
	        except (ValueError, TypeError, OverflowError):
	            # OverflowError: an infinite value ("inf", 1e999) parses as a
	            # float but cannot be rounded to an int. It must degrade to
	            # None like any other unparseable value instead of escaping
	            # the validator.
	            return None

	    @field_validator("copayment_pct", mode="before")
	    @classmethod
	    def _coerce_optional_float(cls, v):
	        """Return ``v`` as a finite float (``%`` and commas stripped), else None."""
	        import math

	        if v is None or isinstance(v, bool):
	            return None
	        try:
	            parsed = float(str(v).replace("%", "").replace(",", "").strip())
	        except (ValueError, TypeError):
	            return None
	        # inf / nan parse successfully but are not meaningful percentages
	        # and are not representable in standard JSON — degrade to None.
	        return parsed if math.isfinite(parsed) else None

	    @field_validator("sum_insured_options", "sum_insured_tiers", mode="before")
	    @classmethod
	    def _coerce_int_list(cls, v):
	        """Return the parseable numbers of list ``v`` as ints; [] for non-lists."""
	        if not isinstance(v, list):
	            return []
	        out = []
	        for x in v:
	            try:
	                out.append(int(round(float(str(x).replace(",", "").strip()))))
	            except (ValueError, TypeError, OverflowError):
	                # Skip just this element (incl. infinite values); the rest
	                # of the list is still usable.
	                continue
	        return out

	    @field_validator(
	        "ayush_coverage", "maternity_coverage", "cashless_treatment_supported",
	        mode="before",
	    )
	    @classmethod
	    def _coerce_optional_bool(cls, v):
	        """Map common yes/no spellings to a bool; anything else becomes None."""
	        if v is None or isinstance(v, bool):
	            return v
	        s = str(v).strip().lower()
	        if s in ("true", "yes", "covered", "y", "1"):
	            return True
	        if s in ("false", "no", "not covered", "excluded", "n", "0"):
	            return False
	        return None

	    # KI-141 (2026-05-15) — marketing-rename aliases that share the same
	    # source PDF (e.g. "Activ One" and "Activ Health" both point to the
	    # activ-health-individual__wordings.pdf parent). Default empty list so
	    # the field is backward-compatible. Frontend renders these as small
	    # "Also known as: X, Y" sub-labels under the parent card title.
	    aliases: list[str] = Field(default_factory=list)


	# Envelope for the marketplace listing: the policy cards plus two summary
	# counts. NOTE(review): the coverage endpoint reads .policies, .total and
	# .insurers_indexed off the result of policies_all(), which presumably
	# returns this model — confirm.
	class MarketplaceResponse(BaseModel):
	policies: list[MarketplacePolicy]
	total: int
	insurers_indexed: int


	@app.get("/api/scorecard/methodology")
	async def scorecard_methodology():
	    """Transparency endpoint: how the scorecard headline number is computed.

	    Returns the criterion blueprint with its weights, the count of scored
	    fields, the total number of ``HealthPolicy`` schema fields, the grade
	    bands, and a prose description of the scoring approach. The frontend
	    shows this inside PolicyDetailModal; both counts are DERIVED here and
	    must be consumed rather than hardcoded client-side.
	    """
	    from backend.scorecard import (
	        METHODOLOGY_BLUEPRINT, WEIGHTS, SCORED_FIELDS, grade_for,
	    )
	    from rag.schema import HealthPolicy

	    # Grade bands are introspected from grade_for() — the single source of
	    # truth for the cutoffs — instead of being restated here, so a future
	    # recalibration propagates automatically and the disclosed bands can
	    # never drift from how grades are actually assigned. For every grade we
	    # remember the LOWEST score (0..100) that produces it, plus the
	    # description returned at that score.
	    first_seen = {}
	    for score in range(0, 101):
	        letter, description = grade_for(score)
	        first_seen.setdefault(letter, (score, description))

	    # "F" is displayed as "below the lowest non-F threshold".
	    fail_below = min(low for letter, (low, _) in first_seen.items() if letter != "F")

	    grade_thresholds = {}
	    for letter in ("A", "B", "C", "D", "F"):
	        if letter == "F":
	            grade_thresholds[letter] = f"<{fail_below} — {first_seen[letter][1]}"
	        else:
	            grade_thresholds[letter] = f"≥{first_seen[letter][0]} — {first_seen[letter][1]}"

	    scoring_approach = (
	        "Rules-based (deterministic), no LLM-in-the-loop. Each criterion produces a "
	        "0–100 sub-score from concrete schema fields; the overall score is the weighted "
	        "average. Weights adapt to user profile when age/parents/budget are known."
	    )
	    return {
	        "weights": WEIGHTS,
	        "scored_fields_count": len(SCORED_FIELDS),
	        "total_schema_fields": len(HealthPolicy.model_fields),
	        "criteria": METHODOLOGY_BLUEPRINT,
	        "grade_thresholds": grade_thresholds,
	        "scoring_approach": scoring_approach,
	    }


	def _build_corpus_url_index() -> dict[str, str]:
	    """Parse ``corpus_urls.md`` and return ``{policy_id: source_url}``.

	    Used to backfill ``source_pdf_url`` when the LLM extraction didn't
	    capture it. The file (under ``settings.DATA_DIR``) is read as a markdown
	    table; only rows that start with ``|`` and have at least five cells are
	    considered, with cell 0 = insurer slug, cell 2 = policy name, cell 3 =
	    doc type and cell 4 = a cell containing the URL. The header row
	    (contains "insurer_slug") and separator row (contains "---") are
	    skipped.

	    Each usable row contributes up to three keys:
	      * ``<insurer>__<url-filename-slug>`` (primary, always written),
	      * ``<insurer>__<name-slug>__<doc_type>`` and ``<insurer>__<name-slug>``
	        (secondary, never overwriting an existing key).

	    Returns:
	        The lookup dict; empty when the markdown file does not exist.
	    """
	    import re as _re
	    out: dict[str, str] = {}
	    md_path = settings.DATA_DIR / "corpus_urls.md"
	    if not md_path.exists():
	        return out
	    # Explicit encoding: the platform default may not be UTF-8.
	    for line in md_path.read_text(encoding="utf-8").splitlines():
	        # The delimiter is the plain "|" character. The previous "\|" was an
	        # invalid escape that evaluates to backslash + pipe, which no table
	        # row starts with — every row was skipped and the index stayed empty.
	        if not line.startswith("|") or "insurer_slug" in line or "---" in line:
	            continue
	        parts = [p.strip() for p in line.strip("|").split("|")]
	        if len(parts) < 5:
	            continue
	        insurer_slug = parts[0]
	        policy_name = parts[2]
	        doc_type = parts[3]
	        m = _re.search(r"https?://\S+", parts[4])
	        if not (insurer_slug and m):
	            continue
	        url = m.group(0)
	        # Primary key — match rag.ingest.policy_id_for: <insurer>__<filename-stem>
	        # where filename-stem is the URL's PDF filename without extension.
	        url_stem = url.rsplit("/", 1)[-1].rsplit("?", 1)[0].rsplit(".", 1)[0]
	        url_slug = _re.sub(r"[^a-z0-9]+", "-", url_stem.lower()).strip("-")
	        out[f"{insurer_slug}__{url_slug}"] = url
	        # Secondary key — derived from policy_name + doc_type (some extracted
	        # JSONs use a name-based slug when the original URL filename differs)
	        if policy_name and doc_type:
	            name_slug = _re.sub(r"[^a-z0-9]+", "-", policy_name.lower()).strip("-")
	            out.setdefault(f"{insurer_slug}__{name_slug}__{doc_type.lower()}", url)
	            out.setdefault(f"{insurer_slug}__{name_slug}", url)
	    return out


	def _load_curated_facts() -> dict[str, dict]:
	"""Load the 40-data/policy_facts/*.json curated layer. Each file has a
	`{field: {value, source_pdf_path, source_quote}}` shape. We unwrap to a
	flat `{field: value}` dict for the marketplace endpoint, preserving the
	provenance in a `_facts_provenance` field for transparency.

	KI-141 (2026-05-15) — also computes `_primary_source_pdf`, the most-common
	`source_pdf_path` across this curated entry's fields. Used by both
	/api/policies/all and /api/coverage to alias-merge marketing-rename
	curated entries into their extracted-JSON parent card.

	KI-219 (2026-05-15) — CANONICAL PRECEDENCE. When the curated dir has BOTH
	a canonical (`<insurer>__<product>.json`) and one or more doctype-suffixed
	siblings (`<insurer>__<product>__wordings.json`, `__brochure.json`,
	`__cis.json`, `__prospectus.json`) for the same product, the canonical
	file's content is the source of truth. The suffixed-sibling keys point
	AT the canonical entry so any downstream lookup by either form resolves
	to the richer canonical data. Previously the order of `glob('*.json')`
	+ `setdefault` made the loser non-deterministic; the more complete
	canonical entry (e.g. `hdfc-ergo__optima-secure.json` says "No room rent
	cap") was getting shadowed by the suffixed sibling (`...__wordings.json`
	says "Room rent capped at 1%"), collapsing scorecards to 72/100.
	"""
	import json as _json
	from collections import Counter
	facts: dict[str, dict] = {}
	facts_dir = settings.DATA_DIR / "policy_facts"
	if not facts_dir.exists():
	return facts

	_DOCTYPE_SUFFIXES = ("__wordings", "__brochure", "__cis", "__prospectus")

	def _flatten(d: dict, fallback_id: str) -> dict:
	policy_id = d.get("policy_id") or fallback_id
	flat: dict = {}
	provenance: dict = {}
	all_source_pdfs: list[str] = []
	for k, v in d.items():
	if k.startswith("_") or k in ("policy_id", "policy_name", "insurer_slug"):
	flat[k] = v
	continue
	if isinstance(v, dict) and "value" in v:
	flat[k] = v["value"]
	if v.get("source_pdf_path") or v.get("source_quote") or v.get("source_url"):
	provenance[k] = {
	"source_pdf_path": v.get("source_pdf_path"),
	"source_quote": v.get("source_quote"),
	"source_url": v.get("source_url"),
	}
	if v.get("source_pdf_path"):
	all_source_pdfs.append(v["source_pdf_path"])
	else:
	flat[k] = v
	flat.setdefault("policy_id", policy_id)
	flat["_facts_provenance"] = provenance
	flat["_primary_source_pdf"] = (
	Counter(all_source_pdfs).most_common(1)[0][0]
	if all_source_pdfs else None
	)
	return flat

	# Pass 1 — load every curated JSON, indexed by its on-disk stem, AND
	# group siblings by their canonical product_key (stem with any trailing
	# __doctype suffix stripped).
	by_stem: dict[str, dict] = {}
	siblings: dict[str, list[tuple[str, bool]]] = {} # product_key → [(stem, is_canonical), ...]
	for f in sorted(facts_dir.glob("*.json")):
	try:
	d = _json.loads(f.read_text())
	except Exception:
	continue
	stem = f.stem
	flat = _flatten(d, stem)
	by_stem[stem] = flat
	# Determine canonical-ness by FILE STEM (not by policy_id field).
	# A stem ending in one of the four doctype tokens is a non-canonical
	# sibling; everything else is canonical.
	is_canonical = not any(stem.endswith(suf) for suf in _DOCTYPE_SUFFIXES)
	if is_canonical:
	product_key = stem
	else:
	# Strip the matching suffix to find the canonical sibling.
	for suf in _DOCTYPE_SUFFIXES:
	if stem.endswith(suf):
	product_key = stem[: -len(suf)]
	break
	else:
	product_key = stem
	siblings.setdefault(product_key, []).append((stem, is_canonical))

	# Pass 2 — for each product_key, pick the canonical entry's flat dict if
	# present; otherwise fall back to the first suffixed sibling (sorted to
	# be deterministic). Then make every sibling key (canonical stem + each
	# __doctype variant + each sibling's own stem + each sibling's
	# policy_id) point at the chosen flat dict so the source-of-truth wins
	# regardless of which key the caller looked up by.
	#
	# KI-251 (2026-05-16) — FIELD-LEVEL canonical precedence. The original
	# KI-219 logic chose ONE entry (canonical) wholesale. That silently
	# dropped real curated data whenever the canonical file had a field
	# extracted as null (`{"value": null, ... "source_quote": "not stated
	# in <pdf>"}`) while a doctype sibling had the genuine value. Concrete
	# incident: `icici-lombard__health-elite-plus.json` (canonical, every
	# field null) shadowed `icici-lombard__health-elite-plus__wordings.json`
	# whose `sum_insured_options` is a real list — so the marketplace card
	# rendered "COVER UP TO —" despite the value existing in the curated
	# layer. Affected 8 products on sum_insured_options + 3 on entry-age.
	#
	# Fix: keep canonical precedence for every field the canonical populates
	# (KI-219 preserved exactly — `hdfc-ergo__optima-secure` "No room rent
	# cap" still wins over its sibling's "1%"), but for any field the
	# canonical leaves null/empty, backfill from the highest-ranked sibling
	# that has a genuine value. Doctype rank: wordings > prospectus > cis >
	# brochure (most authoritative source first). This ONLY surfaces data
	# that already exists verbatim in 40-data/policy_facts — nothing is
	# fabricated; the per-field provenance pointer is backfilled too so the
	# UI still shows the correct source quote for the borrowed field.
	_SIB_FILL_RANK = {"__wordings": 0, "__prospectus": 1, "__cis": 2, "__brochure": 3}

	def _is_empty(val) -> bool:
	return val is None or val == "" or val == [] or val == {}

	# Fields that are pure metadata / structural and must NOT be borrowed
	# across siblings (they describe the chosen entry itself, not a fact).
	_NON_FACT_KEYS = {
	"policy_id", "policy_name", "insurer_slug",
	"_facts_provenance", "_primary_source_pdf",
	}

	for product_key, entries in siblings.items():
	canonical_entries = [s for s, c in entries if c]
	if canonical_entries:
	chosen_stem = canonical_entries[0]
	else:
	chosen_stem = sorted(s for s, _ in entries)[0]
	chosen = dict(by_stem[chosen_stem])

	# Deterministic sibling order for field-level backfill: by doctype
	# authority rank, then stem (stable tiebreak). The chosen stem is
	# excluded — it is already the base.
	def _rank(stem: str) -> tuple:
	for suf, r in _SIB_FILL_RANK.items():
	if stem.endswith(suf):
	return (r, stem)
	return (99, stem)

	fill_order = sorted(
	(s for s, _ in entries if s != chosen_stem),
	key=_rank,
	)
	if fill_order:
	chosen_prov = dict(chosen.get("_facts_provenance") or {})
	for sib_stem in fill_order:
	sib = by_stem[sib_stem]
	sib_prov = sib.get("_facts_provenance") or {}
	for k, v in sib.items():
	if k in _NON_FACT_KEYS:
	continue
	# Canonical/base value wins whenever it is populated.
	if not _is_empty(chosen.get(k)):
	continue
	if _is_empty(v):
	continue
	chosen[k] = v
	# Carry the borrowed field's provenance so the UI still
	# shows the correct verbatim source quote for it.
	if k in sib_prov:
	chosen_prov[k] = sib_prov[k]
	chosen["_facts_provenance"] = chosen_prov

	# Register the canonical product_key.
	facts[product_key] = chosen
	# Register every doctype-suffix permutation pointing at the chosen
	# flat (back-compat with code that looks up by the suffixed name).
	for suf in _DOCTYPE_SUFFIXES:
	facts.setdefault(f"{product_key}{suf}", chosen)
	# Register every sibling's actual on-disk stem AND policy_id field
	# so callers that already hold a stem-like ID still resolve to the
	# canonical content.
	for sib_stem, _is_can in entries:
	facts[sib_stem] = chosen
	sib_pid = by_stem[sib_stem].get("policy_id")
	if isinstance(sib_pid, str) and sib_pid:
	facts[sib_pid] = chosen

	# #52 — merge PERSISTED user-uploaded docs into the curated layer so each
	# surfaces as a marketplace card via the EXISTING _marketplace_catalogue
	# Pass-2 + build_scorecard path (NO grading re-implementation). Records
	# are already in the curated `{field:{value,source_*}}` shape; run them
	# through the same _flatten so per-field provenance is preserved. They
	# have unique `user-upload__*` policy_ids so they can never collide with
	# a real curated product key. A failure here must NOT break the curated
	# layer for the 200+ real policies — log + continue.
	try:
	from backend import uploaded_docs as _udocs

	for _pid, _rec in _udocs.load_persisted_records().items():
	if not isinstance(_rec, dict):
	continue
	facts[_pid] = _flatten(_rec, _pid)
	except Exception as e: # noqa: BLE001 — uploaded layer is additive
	logging.warning(
	"uploaded-docs curated merge failed (%s: %s) — "
	"marketplace falls back to corpus-only cards",
	type(e).__name__, e,
	)

	return facts


	def _source_pdf_to_policy_id(pdf_path: str \| None) -> str \| None:
	"""KI-141 — map a curated `source_pdf_path` like
	'rag/corpus/aditya-birla/activ-health-individual__wordings.pdf' to the
	extracted-JSON policy_id 'aditya-birla__activ-health-individual__wordings'.

	Returns None if the input is empty/None.
	"""
	if not pdf_path:
	return None
	s = pdf_path
	if s.startswith("rag/corpus/"):
	s = s[len("rag/corpus/"):]
	if s.endswith(".pdf"):
	s = s[: -len(".pdf")]
	return s.replace("/", "__")


	_INSURER_NET: dict \| None = None


	def _insurer_network(slug: str) -> dict:
	"""#86 — official insurer-level network source (40-data/insurer_network
	.json): the official list URL + the official stated count where the
	insurer publishes one. Sourced, not web-backfilled. Cached."""
	global _INSURER_NET
	if _INSURER_NET is None:
	p = settings.DATA_DIR / "insurer_network.json"
	try:
	_INSURER_NET = (
	json.loads(p.read_text()).get("insurers", {}) if p.exists() else {}
	)
	except Exception:
	_INSURER_NET = {}
	return _INSURER_NET.get(slug, {}) or {}


	def _recover_scorecard_facts(sc) -> dict:
	"""#48 — port of the frontend parseScorecardFacts. The detail-modal
	snapshot recovers facts (co-pay, PED wait, network, cashless, …) from
	the scorecard's signal strings when the flat policy field is null. The
	marketplace CARD only had the flat fields, so it showed "—" where the
	modal showed a real value. Recover the SAME facts server-side and
	backfill `data` so card == modal everywhere, with no extra client call."""
	import re as _re

	f: dict = {}
	sub = getattr(sc, "sub_scores", None) or []
	for s in sub:
	for raw in getattr(s, "signals", None) or []:
	sig = str(raw).strip()
	low = sig.lower()
	m = _re.search(r"(\d+(?:\.\d+)?)%\s*copay", sig, _re.I)
	if m:
	f["copayment_pct"] = float(m.group(1))
	elif _re.search(r"0% copayment", sig, _re.I):
	f["copayment_pct"] = 0
	m = _re.search(r"(\d+)\smo\sPED\s*waiting", sig, _re.I)
	if m:
	f["pre_existing_disease_waiting_months"] = int(m.group(1))
	m = _re.search(r"([\d,]+)\+?\s*network hospitals", sig, _re.I)
	if m:
	f["network_hospital_count"] = int(m.group(1).replace(",", ""))
	if _re.search(r"cashless supported", low, _re.I):
	f["cashless_treatment_supported"] = True
	elif _re.search(r"no cashless", low, _re.I):
	f["cashless_treatment_supported"] = False
	if _re.search(r"ayush covered", low, _re.I):
	f["ayush_coverage"] = True
	elif _re.search(r"no ayush", low, _re.I):
	f["ayush_coverage"] = False
	if _re.search(r"maternity covered", low, _re.I):
	f["maternity_coverage"] = True
	if _re.search(r"no room rent cap", low, _re.I):
	f["_room_no_cap"] = True
	else:
	rr = _re.search(r"room rent capped:\s*(.+)$", sig, _re.I)
	if rr:
	f["_room_cap_text"] = rr.group(1).strip()
	m = _re.search(r"entry up to\s*(\d+)", sig, _re.I)
	if m:
	f["max_entry_age"] = int(m.group(1))
	return f


	_CORPUS_PDF_IDX: dict[str, str] \| None = None


	def _corpus_pdf_index() -> dict[str, str]:
	"""Every policy in the catalogue exists ONLY because its source PDF was
	downloaded into rag/corpus to build the vectors + policy_facts. This maps
	each policy_id (full id, file stem, AND the #80 dedup-stripped id) to the
	absolute corpus PDF that physically exists on disk — so the marketplace
	can always link the real document even when no public origin URL was ever
	recorded. Wordings/policy docs win over CIS/brochure/prospectus. Built
	once and cached for the process lifetime."""
	global _CORPUS_PDF_IDX
	if _CORPUS_PDF_IDX is not None:
	return _CORPUS_PDF_IDX
	from collections import Counter

	prio = {"wordings": 0, "policy": 1, "cis": 2, "prospectus": 3, "brochure": 4}

	def _rank(path: str) -> int:
	low = path.lower()
	for k, v in prio.items():
	if k in low:
	return v
	return 9

	idx: dict[str, str] = {}
	best: dict[str, int] = {}
	root = settings.CORPUS_DIR.parent.parent
	corpus_root = str(settings.CORPUS_DIR.resolve())
	facts_dir = settings.DATA_DIR / "policy_facts"
	if facts_dir.exists():
	for fp in sorted(facts_dir.glob("*.json")):
	try:
	d = json.loads(fp.read_text())
	except Exception:
	continue
	pid = d.get("policy_id") or fp.stem
	paths = [
	v.get("source_pdf_path")
	for v in d.values()
	if isinstance(v, dict) and v.get("source_pdf_path")
	]
	if not paths:
	continue
	cand = Counter(paths).most_common(1)[0][0]
	ap = (root / cand).resolve()
	try:
	ok = ap.is_file() and str(ap).startswith(corpus_root)
	except Exception:
	ok = False
	if not ok:
	continue
	rank = _rank(cand)
	keys = {pid, fp.stem}
	for suff in ("__wordings", "__brochure", "__cis", "__prospectus", "__policy"):
	if pid.endswith(suff):
	keys.add(pid[: -len(suff)])
	break
	for k in keys:
	if k not in idx or rank < best.get(k, 9):
	idx[k] = str(ap)
	best[k] = rank

	# #52 — persisted uploaded docs keep their real PDF in the persistent
	# UPLOADED_DOCS_DIR (NOT rag/corpus). Map their policy_id → that file so
	# the marketplace card's /api/policy-pdf link resolves to the exact
	# document the user uploaded and that the card was graded from.
	try:
	for d in sorted(settings.UPLOADED_DOCS_DIR.glob("*/source.pdf")):
	meta_p = d.parent / "meta.json"
	try:
	pid = json.loads(meta_p.read_text()).get("policy_id") or d.parent.name
	except Exception: # noqa: BLE001
	pid = d.parent.name
	idx[pid] = str(d.resolve())
	except Exception: # noqa: BLE001 — uploaded-pdf index is additive
	pass

	_CORPUS_PDF_IDX = idx
	return idx


	def _is_credible_pdf_url(u: str \| None) -> bool:
	"""#87 — a recorded source_pdf_url is only trustworthy as the policy-PDF
	link if it unambiguously points at a document, not an insurer homepage
	or a generic section page (e.g. https://www.sbigeneral.in,
	https://nationalinsurance.nic.co.in/en/health-insurance). When it isn't,
	we prefer the local corpus PDF we definitively have for every policy."""
	if not u:
	return False
	from urllib.parse import urlparse

	try:
	path = (urlparse(u).path or "").lower()
	except Exception:
	return False
	if ".pdf" in path:
	return True
	return any(
	m in path
	for m in ("/documents/", "/dam/", "/download", "/sites/default/files/")
	)


	@app.get("/api/policy-pdf/{policy_id}")
	def policy_pdf(policy_id: str):
	"""Serve the local corpus PDF for a policy — the exact document the
	catalogue, vectors and facts were all built from. Guarantees every one
	of the 148 cards has a working real-PDF link even when no public origin
	URL was ever captured. Path is constrained to rag/corpus."""
	idx = _corpus_pdf_index()
	ap = idx.get(policy_id) or idx.get(policy_id.replace("/", "__"))
	if not ap:
	raise HTTPException(status_code=404, detail="No source PDF for this policy")
	p = Path(ap).resolve()
	# #52 — also allow the persistent uploaded-docs store (the uploaded PDF
	# lives there, not in rag/corpus). Both roots are server-controlled
	# directories; the index only ever maps to files inside one of them, so
	# this stays a strict allowlist (no traversal surface).
	_allowed_roots = (
	str(settings.CORPUS_DIR.resolve()),
	str(settings.UPLOADED_DOCS_DIR.resolve()),
	)
	if not (p.is_file() and any(str(p).startswith(r) for r in _allowed_roots)):
	raise HTTPException(status_code=404, detail="Source PDF not found")
	return FileResponse(
	str(p),
	media_type="application/pdf",
	headers={"Content-Disposition": f'inline; filename="{p.name}"'},
	)


	def _merge_curated(extracted: dict, curated: dict \| None) -> dict:
	"""Curated facts override LLM extraction for every field they populate.
	LLM extraction fills the long tail. Provenance pointers survive in the
	merged dict so the UI can show source quotes per field."""
	if not curated:
	return extracted
	merged = dict(extracted)
	for k, v in curated.items():
	if v is not None and v != "" and v != []:
	merged[k] = v
	return merged


	def _si_source_quote(data: dict) -> str:
	"""The verbatim source_quote backing this policy's sum_insured_options.

	Every real SI value in the catalogue comes from the curated
	40-data/policy_facts layer (extracted SI is null across the board); the
	flatten step in _load_curated_facts() stores its provenance at
	data["_facts_provenance"]["sum_insured_options"]["source_quote"], which
	_merge_curated() carries through onto the merged dict. We also accept the
	wrapped `{value, source_quote}` shape defensively in case a future
	extraction path leaves the field unflattened.
	"""
	prov = (data.get("_facts_provenance") or {}).get("sum_insured_options")
	if isinstance(prov, dict) and prov.get("source_quote"):
	return str(prov["source_quote"])
	raw = data.get("sum_insured_options")
	if isinstance(raw, dict) and raw.get("source_quote"):
	return str(raw["source_quote"])
	return ""


	def _rationalise_si(data: dict, si_values: list[int]) -> "_si.SumInsuredView":
	"""Apply the deterministic D3 source-quote corroboration filter + D1
	band-vs-tier classification to this policy's SI list. Returns a
	SumInsuredView the marketplace serializer maps onto sum_insured_*.
	"""
	return _si.rationalise(si_values, _si_source_quote(data))


	def _policy_corroborated_si(policy_id: str \| None) -> "_si.SumInsuredView":
	"""The corroborated SI view for a single policy_id (D2/D3). Resolves the
	same merged extracted+curated `data` the marketplace serializer sees,
	then runs the source-quote corroboration filter. `kind == "none"` ⇒ the
	policy publishes NO corroborated Sum Insured (drives the D2 disclosure).
	"""
	if not policy_id:
	return _si.SumInsuredView(kind="none", tiers=[], min_inr=None, max_inr=None)
	import json as _json
	try:
	curated = _load_curated_facts()
	except Exception:
	curated = {}
	data: dict = {}
	ep = settings.EXTRACTED_DIR / f"{policy_id}.json"
	if ep.exists():
	try:
	data = _json.loads(ep.read_text())
	except Exception:
	data = {}
	cur = curated.get((data.get("policy_id") if data else None) or policy_id) \
	or curated.get(policy_id)
	data = _merge_curated(data, cur) if (data or cur) else {}
	si = data.get("sum_insured_options") or []
	if isinstance(si, list):
	si = [int(x) for x in si
	if isinstance(x, (int, float)) or (isinstance(x, str) and x.isdigit())]
	else:
	si = []
	return _rationalise_si(data, si)


# Decision-critical fields that distinguish a RENAME (curated entry folds
# onto extracted parent) from a VARIANT (same UIN but materially different
# product — must stay as its own card). Same UIN ≠ same product:
# regulators file one "wordings" PDF that covers multiple marketed variants
# (e.g. ProHealth Prime vs ProHealth Protect both filed under
# MCIHLIP24011V072324; copay/PED/maternity/NCB differ).
#
# These are the field names iterated by _ki145_material_diffs(), which
# counts how many of them disagree between a curated entry and a candidate
# parent.
_KI145_DIFF_FIELDS: tuple[str, ...] = (
    "copayment_pct",
    "pre_existing_disease_waiting_months",
    "maternity_coverage",
    "maternity_waiting_months",
    "room_rent_capping",
    "restoration_benefit",
    "no_claim_bonus_pct",
    "post_hospitalization_days",
)


	def _ki145_extract_value(raw, field: str):
	"""Unwrap the value from either scalar OR nested `{value, ...}` shapes.
	For two fields the extracted-side shape is `{covered, ...}` instead of
	`{value, ...}`: maternity_coverage and restoration_benefit. We project
	those onto the boolean `covered` so a curated bool/str compares cleanly
	against the extracted dict's truthiness.
	"""
	if raw is None:
	return None
	if isinstance(raw, dict):
	if "value" in raw:
	return raw.get("value")
	if field in ("maternity_coverage", "restoration_benefit") and "covered" in raw:
	return raw.get("covered")
	# Unknown dict shape — treat as opaque non-null marker so a real
	# diff isn't accidentally suppressed.
	return raw
	return raw


	def _ki145_normalize(field: str, val):
	"""Coerce field value into a comparable form (numbers as floats, bools as
	bools, strings stripped lower-case). Returns None on null/empty/"" so it
	is consistently skipped in the diff count."""
	if val is None:
	return None
	# Numeric fields
	if field in (
	"copayment_pct",
	"pre_existing_disease_waiting_months",
	"maternity_waiting_months",
	"no_claim_bonus_pct",
	"post_hospitalization_days",
	):
	try:
	return float(val)
	except (TypeError, ValueError):
	return None
	# Boolean fields
	if field == "maternity_coverage":
	if isinstance(val, bool):
	return val
	if isinstance(val, (int, float)):
	return bool(val)
	if isinstance(val, str):
	s = val.strip().lower()
	if s in ("true", "yes", "covered"):
	return True
	if s in ("false", "no", "not covered", "excluded"):
	return False
	return None
	return None
	# Restoration may arrive as bool (extracted .covered), str (curated prose)
	# or dict (already unwrapped above). Treat presence/absence as the signal:
	# a free-text limit phrase = True, explicit False/None = False.
	if field == "restoration_benefit":
	if isinstance(val, bool):
	return val
	if isinstance(val, str):
	s = val.strip().lower()
	if not s:
	return None
	if s in ("false", "no", "none", "n/a", "not available"):
	return False
	return True
	return None
	# String fields (room_rent_capping)
	if isinstance(val, str):
	s = val.strip().lower()
	return s or None
	return val


	def _ki145_material_diffs(curated: dict, extracted: dict) -> int:
	"""Count fields where BOTH sides have non-null values that disagree.
	Null on either side = SKIP (extraction incompleteness, not a real diff).
	>= 2 diffs → VARIANT (keep separate). < 2 → RENAME (alias-merge)."""
	diffs = 0
	for f in _KI145_DIFF_FIELDS:
	cur_v = _ki145_normalize(f, _ki145_extract_value(curated.get(f), f))
	ext_v = _ki145_normalize(f, _ki145_extract_value(extracted.get(f), f))
	if cur_v is None or ext_v is None:
	continue # extraction incompleteness, not a real diff
	if cur_v != ext_v:
	diffs += 1
	return diffs


	def _profile_summary_model(sc) -> Optional[ProfileSummaryModel]:
	"""Adapt the scorecard's ProfileSummary dataclass → the API model.

	None-safe (older Scorecard objects / defensive paths may not carry one).
	"""
	ps = getattr(sc, "profile_summary", None)
	if ps is None:
	return None
	return ProfileSummaryModel(
	strengths=list(getattr(ps, "strengths", []) or []),
	caveat=getattr(ps, "caveat", None),
	)


	def _marketplace_catalogue(user_profile_dict, _collect_scorecards=None):
	"""SINGLE SOURCE OF TRUTH for the marketplace card set (#40).

	The recommendation path (brain_tools._scorecard_signal via
	marketplace_grade) and /api/policies/all BOTH derive a policy's
	grade from THIS one computation, so the cited-card grade can never
	diverge from the marketplace card grade — including marketing-rename
	alias / KI-145 variant cards. Body is the former inline endpoint
	logic, moved verbatim; fully synchronous.

	Task #31 (single-source-of-truth, option (a)): when `_collect_scorecards`
	is a dict, it is populated `{surviving_card.policy_id: Scorecard}` with
	the EXACT `Scorecard` object (full 6 sub_scores + profile_summary +
	grade) computed here for each card that survives the final dedup. The
	single /api/policies/{id}/scorecard endpoint serves that object verbatim
	so its profile_summary / grade / sub_scores are byte-identical to the
	/api/policies/all card for the same canonical id BY CONSTRUCTION — both
	flow through this one `build_scorecard` pass on the same chosen sibling's
	`(data, insurer_reviews, profile)`. (The endpoint's old doctype-rank
	sibling-reconstruction picked a DIFFERENT sibling than this catalogue's
	completeness-based `_best` dedup, emitting a different strength set.)
	"""
	import json as _json
	# Task #31 — {id(MarketplacePolicy): Scorecard}. Keyed by the card
	# OBJECT's identity (NOT its policy_id string — several pre-dedup `out`
	# entries can share the same curated-canonical policy_id, so a string
	# key would let a lower-completeness sibling's Scorecard clobber the
	# survivor's). After `_best` picks the surviving object we map each
	# survivor's policy_id / canonical `_ident` to ITS OWN Scorecard.
	_sc_by_obj: dict = {} if _collect_scorecards is not None else None
	from backend.scorecard import build_scorecard
	from backend.policy_identity import clean_display_policy_name
	corpus_url_index = _build_corpus_url_index()
	curated_facts = _load_curated_facts()

	# KI-132 (2026-05-15) — expanded insurer_meta to cover all 19 real
	# insurers. Previously only 10 had curated display-names + home URLs,
	# so 9 insurers rendered as raw slugs in the marketplace dropdown
	# (acko, cholamandalam, go-digit, iffco-tokio, national-insurance,
	# oriental-insurance, reliance-general, royal-sundaram, sbi-general).
	insurer_meta = {
	"acko": ("Acko Health Insurance", "https://www.acko.com/health-insurance/"),
	"aditya-birla": ("Aditya Birla Health Insurance", "https://www.adityabirlacapital.com/healthinsurance"),
	"bajaj-allianz": ("Bajaj Allianz General Insurance", "https://www.bajajallianz.com/"),
	"care-health": ("Care Health Insurance", "https://www.careinsurance.com/"),
	"cholamandalam": ("Cholamandalam MS General Insurance", "https://www.cholainsurance.com/"),
	"go-digit": ("Go Digit General Insurance", "https://www.godigit.com/"),
	"hdfc-ergo": ("HDFC ERGO General Insurance", "https://www.hdfcergo.com/"),
	"icici-lombard": ("ICICI Lombard General Insurance", "https://www.icicilombard.com/"),
	"iffco-tokio": ("IFFCO Tokio General Insurance", "https://www.iffcotokio.co.in/"),
	"manipalcigna": ("ManipalCigna Health Insurance", "https://www.manipalcigna.com/"),
	"national-insurance": ("National Insurance Company", "https://nationalinsurance.nic.co.in/"),
	"new-india": ("New India Assurance", "https://www.newindia.co.in/"),
	"niva-bupa": ("Niva Bupa Health Insurance", "https://www.nivabupa.com/"),
	"indusind-general": ("IndusInd General Insurance (formerly Reliance General)", "https://www.indusind.com/general-insurance/"),
	"oriental-insurance": ("Oriental Insurance Company", "https://orientalinsurance.org.in/"),
	"reliance-general": ("Reliance General Insurance", "https://www.reliancegeneral.co.in/"),
	"royal-sundaram": ("Royal Sundaram General Insurance", "https://www.royalsundaram.in/"),
	"sbi-general": ("SBI General Insurance", "https://www.sbigeneral.in/"),
	"star-health": ("Star Health & Allied Insurance", "https://www.starhealth.in/"),
	"tata-aig": ("Tata AIG General Insurance", "https://www.tataaig.com/"),
	}

	def _coerce_bool(v):
	if isinstance(v, dict) and "covered" in v: return v.get("covered")
	if isinstance(v, bool): return v
	return None

	# Build a unified policy set: every extracted JSON + every curated facts
	# JSON that doesn't have an extracted counterpart yet. This way, even
	# policies whose LLM extraction failed still surface in the marketplace
	# with their human-curated data.
	#
	# KI-133 (2026-05-15) — dedup marketplace cards to ONE per policy product
	# (not one per PDF document). Previously wordings + brochure + cis of
	# the same product created three separate cards, ballooning the
	# marketplace from 138 products to ~209 cards and confusing users who
	# see "138 POLICIES" in the badge but 209 cards below.
	#
	# Algorithm: sort source filenames so the canonical "wordings" variant
	# is encountered first for each product, then dedup by stripped
	# policy_id (everything before the trailing __<doctype>).
	# Doctype preference: wordings > prospectus > cis > brochure > anything
	# else (alphabetical fallback).
	_DOCTYPE_RANK = {"wordings": 0, "prospectus": 1, "cis": 2, "brochure": 3}
	def _doctype_of(stem: str) -> str:
	return stem.rsplit("__", 1)[1] if "__" in stem else ""
	def _product_key_of(policy_id: str) -> str:
	# Strip trailing __<doctype> so wordings/brochure/cis of the same
	# product collapse to a single key.
	return policy_id.rsplit("__", 1)[0] if "__" in policy_id else policy_id

	sorted_files = sorted(
	settings.EXTRACTED_DIR.glob("*.json"),
	key=lambda fp: (_DOCTYPE_RANK.get(_doctype_of(fp.stem), 99), fp.stem),
	)

	# KI-141 (2026-05-15) — alias-dedup pre-pass. Curated "marketing rename"
	# entries that re-describe the SAME IRDAI-filed product collapse onto a
	# single marketplace card; the marketing names surface as `aliases`.
	#
	# KI-142 (2026-05-15, REFACTORED) — UIN-primary invariant: 1 unique UIN
	# = 1 unique marketplace card. The PDF-based gate is now a fallback for
	# entries that lack a UIN.
	#
	# Algorithm (two phases so PDF-backed extracted entries always claim
	# their UIN before any curated rename does):
	# Phase A: walk extracted/*.json (sorted by doctype rank, then stem).
	# Each extracted parent claims its uin_code into `uin_to_parent`.
	# Phase B: walk curated_facts (sorted by policy_id for determinism).
	# For each canonical curated entry (skip lookup-permutation aliases
	# and entries that ARE __wordings/__brochure/__cis themselves):
	# 1. Read curated UIN (scalar OR nested .value form).
	# 2. If UIN non-empty AND already in `uin_to_parent` (claimant !=
	# self) → alias of that parent.
	# 3. Else if UIN non-empty → claim it (so subsequent curated
	# siblings with the same UIN alias onto THIS entry in pass 2).
	# 4. Else (UIN empty) OR (UIN had no prior claimant) → fall back
	# to the source_pdf gate: if `_primary_source_pdf` maps to an
	# extracted parent stem, alias under that parent.
	# 5. Otherwise the curated entry stays as a standalone card.
	#
	# Multi-variant wordings PDFs with a single filed UIN (e.g.
	# manipalcigna prohealth-insurance-all-variants.pdf — the PDF text
	# confirms only ONE UIN `MCIHLIP24011V072324` is filed for that
	# product) correctly collapse all sub-product curated entries onto one
	# card. Distinct-UIN siblings under a shared PDF would surface as
	# separate cards because their UINs claim independent parents.
	extracted_stems = {fp.stem for fp in sorted_files}

	# Phase A — extracted parents claim their UINs first. We also retain the
	# parsed extracted JSON so Phase B can run the KI-145 material-diff check
	# without re-reading from disk.
	uin_to_parent: dict[str, str] = {}
	extracted_uin: dict[str, str] = {} # kept for downstream introspection
	extracted_data: dict[str, dict] = {}
	for fp in sorted_files:
	try:
	_d = _json.loads(fp.read_text())
	except Exception:
	continue
	extracted_data[fp.stem] = _d
	_u = _d.get("uin_code")
	if isinstance(_u, dict):
	_u = _u.get("value")
	_u = (_u or "").strip() if isinstance(_u, str) else ""
	if _u:
	extracted_uin[fp.stem] = _u
	uin_to_parent.setdefault(_u, fp.stem)

	# Direct-parent map for each curated entry (built in Phase B), then
	# chain-compressed in Phase C so transitive aliases (e.g. activ-one →
	# activ-health → activ-health-individual__wordings) flatten onto the
	# ultimate extracted parent.
	direct_parent: dict[str, str] = {}
	curated_canonical_ids: list[str] = []
	# KI-145 — curated entries whose UIN matched a candidate parent but
	# failed the material-diffs gate (>= 2 decision-critical fields disagree
	# with the parent's extracted JSON). These are genuine variants that
	# must emit as standalone cards in pass 2 even when their policy_id is
	# a prefix of a seen extracted policy_id (the old startswith-skip would
	# otherwise drop them silently).
	ki145_variant_curated_ids: set[str] = set()

	# Phase B — walk curated entries deterministically (sorted by policy_id).
	for curated_policy_id, cdata in sorted(curated_facts.items()):
	# Skip the __wordings/__brochure/__cis lookup-permutation aliases
	# that _load_curated_facts adds for hit-rate (canonical policy_id is
	# stored in the JSON's "policy_id" field).
	if curated_policy_id != cdata.get("policy_id", curated_policy_id):
	continue
	# Skip curated entries that ARE their own __wordings/__brochure/__cis
	# (doctype-permutation curated files, not marketing renames; pass-2
	# dedup handles them via the seen_policy_ids prefix check).
	if any(curated_policy_id.endswith(f"__{dt}")
	for dt in ("wordings", "brochure", "cis", "prospectus")):
	continue
	curated_canonical_ids.append(curated_policy_id)

	# Read curated UIN (scalar OR nested {value, source_pdf_path, ...}).
	curated_uin = cdata.get("uin_code")
	if isinstance(curated_uin, dict):
	curated_uin = curated_uin.get("value")
	curated_uin = (curated_uin or "").strip() if isinstance(curated_uin, str) else ""

	parent_id: str \| None = None
	if curated_uin and curated_uin in uin_to_parent \
	and uin_to_parent[curated_uin] != curated_policy_id:
	# KI-145 (2026-05-15) — UIN-primary path with smart variant
	# detection. Same UIN does NOT guarantee same product: a single
	# regulator-filed PDF often covers multiple marketed variants
	# (e.g. ProHealth Prime vs ProHealth Protect both filed under
	# MCIHLIP24011V072324; activ-assure-diamond curated vs extracted
	# disagree on PED/NCB). Compare 8 decision-critical fields; if
	# 2+ disagree on non-null values, treat as a VARIANT and keep
	# this curated entry as its own card. < 2 = pure rename → merge.
	candidate = uin_to_parent[curated_uin]
	# Candidate may be an extracted stem OR a previously-claimed
	# curated entry. Look up extracted JSON first; fall back to the
	# candidate's curated facts so the diff has real data to compare.
	cand_data = extracted_data.get(candidate) or curated_facts.get(candidate, {})
	if _ki145_material_diffs(cdata, cand_data) < 2:
	parent_id = candidate
	else:
	ki145_variant_curated_ids.add(curated_policy_id)
	elif curated_uin:
	# New UIN — this curated entry becomes the claimant so any
	# later curated sibling with the same UIN aliases onto it. Per
	# KI-145 spec ("if UIN doesn't match any extracted parent →
	# treat as standalone"), also flag this entry so pass-2 emits
	# it even when its policy_id is a prefix of a seen extracted id.
	uin_to_parent[curated_uin] = curated_policy_id
	ki145_variant_curated_ids.add(curated_policy_id)

	if parent_id is None and not curated_uin:
	# KI-142 (preserved): source-PDF fallback only fires for curated
	# entries with NO UIN. When UIN is present but unmatched, the
	# KI-145 spec mandates standalone — source-PDF coincidence MUST
	# NOT override the UIN-mismatch signal.
	fb_parent = _source_pdf_to_policy_id(cdata.get("_primary_source_pdf"))
	if fb_parent and fb_parent in extracted_stems and fb_parent != curated_policy_id:
	ext_data = extracted_data.get(fb_parent, {})
	if _ki145_material_diffs(cdata, ext_data) < 2:
	parent_id = fb_parent
	else:
	ki145_variant_curated_ids.add(curated_policy_id)

	if parent_id:
	direct_parent[curated_policy_id] = parent_id

	# Phase C — chain-compress direct_parent so every curated alias points
	# at its terminal parent (an extracted stem, or a curated parent that
	# itself has no parent). Detect cycles defensively. After compression
	# we emit one alias entry per curated descendant onto the terminal
	# parent's product_key.
	parent_pkey_aliases: dict[str, list[str]] = {}
	aliased_curated_ids: set[str] = set()

	def _terminal_parent(start: str) -> str | None:
	    """Resolve ``start`` to the last id reachable through ``direct_parent``.

	    Follows parent links from ``start`` until an id with no entry in
	    ``direct_parent`` is reached and returns that id. Returns ``None``
	    when ``start`` has no parent at all, or when the chain loops back on
	    itself (defensive cycle guard).
	    """
	    visited: set[str] = set()
	    node = start
	    parent = direct_parent.get(node)
	    while parent:
	        if parent == start or parent in visited:
	            return None  # cycle — drop the alias attempt
	        visited.add(parent)
	        node = parent
	        parent = direct_parent.get(node)
	    # Chain ended: a node that never moved off ``start`` has no parent.
	    return None if node == start else node

	for curated_policy_id in curated_canonical_ids:
	if curated_policy_id not in direct_parent:
	continue
	terminal = _terminal_parent(curated_policy_id)
	if not terminal:
	continue
	# Alias-target product_key: extracted stems use _product_key_of()
	# (strips __doctype). Curated terminals use the policy_id directly.
	if terminal in extracted_stems:
	terminal_pkey = _product_key_of(terminal)
	else:
	terminal_pkey = terminal
	alias_name = clean_display_policy_name(
	curated_facts.get(curated_policy_id, {}).get("policy_name")
	or curated_policy_id
	)
	parent_pkey_aliases.setdefault(terminal_pkey, []).append(alias_name)
	aliased_curated_ids.add(curated_policy_id)

	seen_product_keys: set[str] = set()
	seen_policy_ids: set[str] = set()
	out = []

	# Pass 1: existing extracted policies (merged with curated overrides)
	for fp in sorted_files:
	try:
	data = _json.loads(fp.read_text())
	except Exception:
	continue
	policy_id_local = data.get("policy_id", fp.stem)
	curated_for_this = curated_facts.get(policy_id_local) or curated_facts.get(fp.stem)
	data = _merge_curated(data, curated_for_this)
	seen_policy_ids.add(policy_id_local)
	slug = data.get("insurer_slug", "")
	# Regulatory is not an insurer; drop entirely from the marketplace.
	# IRDAI/NHA docs are still retrieved and cited in chat answers, they
	# just don't appear as marketplace cards.
	if slug == "regulatory":
	continue
	# Dedup by product (insurer__product), so the wordings PDF wins and
	# the brochure/cis variants don't generate duplicate cards. Pass-1
	# sort order guarantees wordings comes first.
	product_key = _product_key_of(policy_id_local)
	if product_key in seen_product_keys:
	continue
	seen_product_keys.add(product_key)
	name, home = insurer_meta.get(slug, (slug, ""))
	# Get insurer reviews if available for the scorecard
	ir = None
	if slug:
	rp = settings.DATA_DIR / "reviews" / f"{slug}.json"
	if rp.exists():
	try: ir = _json.loads(rp.read_text())
	except Exception: pass
	sc = build_scorecard(data, insurer_reviews=ir, profile=user_profile_dict)
	# #48 — recover facts from the scorecard so the flat marketplace
	# fields (hence the CARD) match the detail-modal snapshot. Only
	# fill nulls; never overwrite a real extracted value.
	_rf = _recover_scorecard_facts(sc)
	for _dk in (
	"pre_existing_disease_waiting_months", "copayment_pct",
	"network_hospital_count", "cashless_treatment_supported",
	"ayush_coverage", "maternity_coverage", "max_entry_age",
	):
	if data.get(_dk) is None and _rf.get(_dk) is not None:
	data[_dk] = _rf[_dk]
	if not data.get("room_rent_capping"):
	if _rf.get("_room_no_cap"):
	data["room_rent_capping"] = "No room rent cap"
	elif _rf.get("_room_cap_text"):
	data["room_rent_capping"] = _rf["_room_cap_text"]

	si = data.get("sum_insured_options") or []
	if isinstance(si, list):
	si = [int(x) for x in si if isinstance(x, (int, float)) or (isinstance(x, str) and x.isdigit())]
	else:
	si = []
	# D3 — drop every SI value the field's own source_quote does not
	# genuinely state, then D1-classify the corroborated set as a
	# continuous band or discrete tiers. sum_insured_options/_min/_max
	# are now the CORROBORATED set (no fabrication), so the slider
	# filter + range display stay honest by construction.
	_siv = _rationalise_si(data, si)
	si = _siv.tiers

	try:
	policy_id = data.get("policy_id", fp.stem)
	# Backfill source_pdf_url from corpus_urls.md when extraction didn't
	# populate it. Try exact policy_id match first, then key permutations.
	# #87 — prefer a CREDIBLE public document URL; otherwise use the
	# local corpus PDF we definitively have for every policy (served
	# via /api/policy-pdf). A homepage/section URL is never trusted
	# over the real document. Never an empty link.
	_pidx = _corpus_pdf_index()
	_cand = (
	data.get("source_pdf_url")
	or corpus_url_index.get(policy_id)
	or corpus_url_index.get(fp.stem)
	or ""
	)
	_local = (
	f"/api/policy-pdf/{policy_id}"
	if (_pidx.get(policy_id) or _pidx.get(fp.stem))
	else ""
	)
	source_pdf_url = (
	_cand if _is_credible_pdf_url(_cand) else (_local or _cand)
	)
	_mp = MarketplacePolicy(
	policy_id=policy_id,
	policy_name=clean_display_policy_name(
	data.get("policy_name", fp.stem)
	),
	insurer_slug=slug,
	insurer_name=name,
	insurer_home_url=home,
	source_pdf_url=source_pdf_url,
	grade=sc.grade,
	overall_score=sc.overall_score,
	one_liner=sc.one_liner,
	data_completeness_pct=sc.data_completeness_pct,
	profile_summary=_profile_summary_model(sc),
	min_entry_age=data.get("min_entry_age"),
	max_entry_age=data.get("max_entry_age"),
	sum_insured_options=si,
	sum_insured_min=_siv.min_inr,
	sum_insured_max=_siv.max_inr,
	sum_insured_is_band=_siv.is_band,
	sum_insured_tiers=si,
	pre_existing_disease_waiting_months=data.get("pre_existing_disease_waiting_months"),
	initial_waiting_period_days=data.get("initial_waiting_period_days"),
	maternity_waiting_months=data.get("maternity_waiting_months"),
	copayment_pct=data.get("copayment_pct") if isinstance(data.get("copayment_pct"), (int, float)) else None,
	network_hospital_count=data.get("network_hospital_count"),
	no_claim_bonus_pct=data.get("no_claim_bonus_pct"),
	ayush_coverage=_coerce_bool(data.get("ayush_coverage")),
	maternity_coverage=_coerce_bool(data.get("maternity_coverage")),
	cashless_treatment_supported=_coerce_bool(data.get("cashless_treatment_supported")),
	room_rent_capping=data.get("room_rent_capping") if isinstance(data.get("room_rent_capping"), str) else None,
	network_list_url=_insurer_network(slug).get("network_list_url"),
	network_count_official=_insurer_network(slug).get("stated_count"),
	network_list_is_pdf=bool(_insurer_network(slug).get("is_pdf")),
	# KI-141 — merge marketing-rename curated entries onto this
	# parent card. Sorted for deterministic output.
	aliases=sorted(parent_pkey_aliases.get(product_key, [])),
	)
	out.append(_mp)
	if _sc_by_obj is not None:
	# Task #31 — bind THIS card object to the exact Scorecard
	# built above on the catalogue's chosen sibling
	# `data`/`ir`/profile. Object-keyed so it survives the
	# post-dedup mapping unambiguously.
	_sc_by_obj[id(_mp)] = sc
	except Exception as e:
	# One malformed extraction should not kill the whole feed
	print(f"[marketplace] skipping {fp.name}: {type(e).__name__}: {str(e)[:120]}")
	continue

	# Pass 2: curated policies that don't yet have an LLM extraction.
	# These come straight from 40-data/policy_facts/*.json — fully human-curated
	# with verbatim source quotes per field.
	for curated_policy_id, data in curated_facts.items():
	# Skip permutation keys (we set __wordings / __brochure / __cis aliases
	# in _load_curated_facts to maximise the lookup hit-rate in pass 1)
	if curated_policy_id != data.get("policy_id", curated_policy_id):
	continue
	if curated_policy_id in seen_policy_ids:
	continue
	# Also skip if any extracted ID matches with a suffix — UNLESS this
	# curated entry was classified as a KI-145 variant (same UIN/source-PDF
	# as a pass-1 card but materially different decision-critical fields).
	# Variants MUST surface as their own marketplace card; the legacy
	# startswith dedup would otherwise drop them silently.
	if curated_policy_id not in ki145_variant_curated_ids \
	and any(eid.startswith(curated_policy_id + "__") for eid in seen_policy_ids):
	continue
	# KI-141 — skip curated entries that have already been collapsed onto
	# a pass-1 parent card via the aliases mechanism (e.g. Activ One →
	# Activ Health Individual Wordings).
	if curated_policy_id in aliased_curated_ids:
	continue
	seen_policy_ids.add(curated_policy_id)
	slug = data.get("insurer_slug", "")
	# KI-208 (2026-05-15) — defensive symmetry with pass-1 (line 1842): any
	# curated_facts entry with insurer_slug=='regulatory' must NOT surface
	# as a marketplace card. Today no curated regulatory docs exist, but
	# adding the filter here closes a future-leak vector if an operator
	# accidentally curates an IRDAI/NHA fact-sheet under 40-data/policy_facts.
	if slug == "regulatory":
	continue
	name, home = insurer_meta.get(slug, (slug, ""))
	# Insurer reviews for scorecard
	ir = None
	if slug:
	rp = settings.DATA_DIR / "reviews" / f"{slug}.json"
	if rp.exists():
	try:
	ir = _json.loads(rp.read_text())
	except Exception:
	pass
	sc = build_scorecard(data, insurer_reviews=ir, profile=user_profile_dict)
	# #48 — recover facts from the scorecard so the flat marketplace
	# fields (hence the CARD) match the detail-modal snapshot. Only
	# fill nulls; never overwrite a real extracted value.
	_rf = _recover_scorecard_facts(sc)
	for _dk in (
	"pre_existing_disease_waiting_months", "copayment_pct",
	"network_hospital_count", "cashless_treatment_supported",
	"ayush_coverage", "maternity_coverage", "max_entry_age",
	):
	if data.get(_dk) is None and _rf.get(_dk) is not None:
	data[_dk] = _rf[_dk]
	if not data.get("room_rent_capping"):
	if _rf.get("_room_no_cap"):
	data["room_rent_capping"] = "No room rent cap"
	elif _rf.get("_room_cap_text"):
	data["room_rent_capping"] = _rf["_room_cap_text"]
	si = data.get("sum_insured_options") or []
	if isinstance(si, list):
	si = [int(x) for x in si if isinstance(x, (int, float)) or (isinstance(x, str) and x.isdigit())]
	else:
	si = []
	# D3/D1 — same source-quote corroboration + band/tier classification
	# as pass 1 (curated-only products take this branch).
	_siv = _rationalise_si(data, si)
	si = _siv.tiers
	try:
	# #87 — credible doc URL preferred, else the guaranteed-real
	# local corpus PDF; a homepage/section URL is never trusted.
	_pidx = _corpus_pdf_index()
	_cand = (
	data.get("source_pdf_url")
	or corpus_url_index.get(curated_policy_id)
	or corpus_url_index.get(f"{curated_policy_id}__wordings")
	or ""
	)
	_local = (
	f"/api/policy-pdf/{curated_policy_id}"
	if _pidx.get(curated_policy_id)
	else ""
	)
	source_pdf_url = (
	_cand if _is_credible_pdf_url(_cand) else (_local or _cand)
	)
	_mp = MarketplacePolicy(
	policy_id=curated_policy_id,
	policy_name=clean_display_policy_name(
	data.get("policy_name", curated_policy_id)
	),
	insurer_slug=slug,
	insurer_name=name,
	insurer_home_url=home,
	source_pdf_url=source_pdf_url,
	grade=sc.grade,
	overall_score=sc.overall_score,
	one_liner=sc.one_liner,
	data_completeness_pct=sc.data_completeness_pct,
	profile_summary=_profile_summary_model(sc),
	min_entry_age=data.get("min_entry_age"),
	max_entry_age=data.get("max_entry_age"),
	sum_insured_options=si,
	sum_insured_min=_siv.min_inr,
	sum_insured_max=_siv.max_inr,
	sum_insured_is_band=_siv.is_band,
	sum_insured_tiers=si,
	pre_existing_disease_waiting_months=data.get("pre_existing_disease_waiting_months"),
	initial_waiting_period_days=data.get("initial_waiting_period_days"),
	maternity_waiting_months=data.get("maternity_waiting_months"),
	copayment_pct=data.get("copayment_pct") if isinstance(data.get("copayment_pct"), (int, float)) else None,
	network_hospital_count=data.get("network_hospital_count"),
	no_claim_bonus_pct=data.get("no_claim_bonus_pct"),
	ayush_coverage=_coerce_bool(data.get("ayush_coverage")),
	maternity_coverage=_coerce_bool(data.get("maternity_coverage")),
	cashless_treatment_supported=_coerce_bool(data.get("cashless_treatment_supported")),
	room_rent_capping=data.get("room_rent_capping") if isinstance(data.get("room_rent_capping"), str) else None,
	network_list_url=_insurer_network(slug).get("network_list_url"),
	network_count_official=_insurer_network(slug).get("stated_count"),
	network_list_is_pdf=bool(_insurer_network(slug).get("is_pdf")),
	# KI-142 — curated entries can ALSO be UIN-claimants when no
	# extracted parent owns their UIN. In that case their later
	# curated siblings alias onto them and surface here.
	aliases=sorted(parent_pkey_aliases.get(curated_policy_id, [])),
	)
	out.append(_mp)
	if _sc_by_obj is not None:
	# Task #31 — exact Scorecard for this curated-only card,
	# bound to the card object (see Pass-1 rationale).
	_sc_by_obj[id(_mp)] = sc
	except Exception as e:
	print(f"[marketplace] skipping curated {curated_policy_id}: {type(e).__name__}: {str(e)[:120]}")
	continue

	# #80 — final safety dedup. The UIN/PDF gate above can still leak the
	# SAME logical product as both `insurer__product` and a doctype sibling
	# (`insurer__product__wordings\|brochure\|cis\|prospectus\|policy`). Collapse
	# to ONE card per product identity (richer entry wins; aliases merged) so
	# the marketplace never shows a plan twice — 1 product = 1 card.
	_DOCT = ("wordings", "brochure", "cis", "prospectus", "policy")

	def _ident(pid: str) -> str:
	    """Return ``pid`` without its trailing ``__<doctype>`` suffix, if any.

	    Doctypes are tried in ``_DOCT`` order and only one suffix is removed;
	    an id with no matching suffix is returned unchanged.
	    """
	    matched = next((dt for dt in _DOCT if pid.endswith(f"__{dt}")), None)
	    if matched is None:
	        return pid
	    # Drop the doctype plus its two-character "__" separator.
	    return pid[: len(pid) - len(matched) - 2]

	_best: dict[str, MarketplacePolicy] = {}
	for p in out:
	k = _ident(p.policy_id)
	prev = _best.get(k)
	if prev is None:
	_best[k] = p
	continue
	s = (p.data_completeness_pct, len(p.sum_insured_options),
	1 if p.policy_id == k else 0)
	ps = (prev.data_completeness_pct, len(prev.sum_insured_options),
	1 if prev.policy_id == k else 0)
	if s > ps:
	p.aliases = sorted(set(p.aliases) \| set(prev.aliases))
	_best[k] = p
	else:
	prev.aliases = sorted(set(prev.aliases) \| set(p.aliases))
	deduped = list(_best.values())

	if _collect_scorecards is not None:
	# Task #31 — publish ONLY the post-dedup survivors' Scorecards,
	# each survivor mapped (by OBJECT identity) to ITS OWN Scorecard,
	# keyed by the survivor's policy_id AND its canonical
	# `_ident(policy_id)` so /api/policies/{id}/scorecard resolves a
	# doctype-suffixed / curated-canonical id onto the SAME card the
	# catalogue serves — the exact `Scorecard` object built here on the
	# catalogue's chosen sibling. Parity holds by construction (one
	# build_scorecard pass feeds both surfaces). Exact policy_id wins
	# over the canonical-ident fallback (setdefault) so a precise id is
	# never shadowed by a sibling sharing its _ident.
	for p in deduped:
	sc = _sc_by_obj.get(id(p))
	if sc is None:
	continue
	_collect_scorecards[p.policy_id] = sc
	_collect_scorecards.setdefault(_ident(p.policy_id), sc)
	return deduped

	@app.get("/api/policies/all", response_model=MarketplaceResponse)
	async def policies_all(session_id: Optional[str] = None):
	    """The marketplace data feed — every extracted policy + scorecard + filterable fields.

	    When session_id is provided AND the session has a profile populated to
	    ≥0.6 completeness, every policy is scored against THAT profile (dynamic
	    per-user grade). Otherwise we score with the generic baseline weights.

	    If the session cannot be loaded or its profile cannot be snapshotted,
	    the feed also falls back to the generic baseline weights (the same
	    degradation /api/policies/{policy_id}/scorecard applies) instead of
	    failing the whole request.
	    """
	    from backend.scorecard import profile_completeness as _completeness
	    from backend.session_state import get_session as _get_sess

	    # Pull user profile if we have one. KI-271 — drive the profile dict off
	    # brain_tools.SLOT_UNION (via union_snapshot) so every captured slot —
	    # including copay_pct, desired_sum_insured_inr, family_medical_history,
	    # health_conditions, age — flows into build_scorecard's profile-aware
	    # {strengths, caveat} generator (task #31). union_snapshot already drops
	    # empty/None/[] slots, so presence == captured.
	    user_profile_dict: Optional[dict] = None
	    if session_id:
	        try:
	            p = _get_sess(session_id).profile
	            profile_dict = brain_tools.union_snapshot(p)
	            # parents_* are NOT in SLOT_UNION's snapshot if False/None but
	            # the weight-tuner reads parents_to_insure/parents_age_max/
	            # parents_has_ped explicitly — carry them through (None-safe)
	            # without overwriting a snapshot value.
	            for _pf in ("parents_to_insure", "parents_age_max", "parents_has_ped"):
	                if _pf not in profile_dict:
	                    _v = getattr(p, _pf, None)
	                    if _v is not None:
	                        profile_dict[_pf] = _v
	            if _completeness(profile_dict) >= 0.6:
	                user_profile_dict = profile_dict
	        except Exception:  # noqa: BLE001 — bad/expired session ⇒ baseline weights
	            # Keep the failure visible in logs, but still serve the feed.
	            logging.getLogger(__name__).warning(
	                "policies_all: could not resolve profile for session %r; "
	                "scoring with baseline weights",
	                session_id,
	                exc_info=True,
	            )
	            user_profile_dict = None

	    deduped = _marketplace_catalogue(user_profile_dict)
	    return MarketplaceResponse(
	        policies=deduped,
	        total=len(deduped),
	        insurers_indexed=len({p.insurer_slug for p in deduped}),
	    )


	# Needed at definition time: the `policy_ids` annotation below must resolve
	# `Annotated` and `Query` from module globals.
	from typing import Annotated

	from fastapi import Query


	@app.get("/api/policies/compare", response_model=CompareResponse)
	async def compare_policies(
	    policy_ids: Annotated[Optional[list[str]], Query()] = None,
	):
	    """Side-by-side comparison of 2-4 policies with their scorecards + field diffs.

	    `policy_ids` is read from repeated query parameters
	    (`?policy_ids=a&policy_ids=b`). Responds 400 when fewer than 2 or more
	    than 4 ids are given or an id contains a path separator, and 404 when
	    an id resolves in neither the extracted nor the curated layer.
	    """
	    import json as _json
	    from backend.scorecard import build_scorecard
	    from backend.policy_identity import clean_display_policy_name

	    if not policy_ids:
	        raise HTTPException(400, "Provide policy_ids as repeated query params")
	    if len(policy_ids) < 2 or len(policy_ids) > 4:
	        raise HTTPException(400, "compare requires 2 to 4 policy_ids")

	    entries = []
	    # KI: apply the SAME curated-override as /api/policies/all so COMPARE ALL
	    # reflects the corrected/verbatim 40-data/policy_facts, not stale extract.
	    _curated = _load_curated_facts()
	    for pid in policy_ids:
	        # The id is interpolated into a filesystem path below; refuse
	        # anything that could step outside EXTRACTED_DIR.
	        if "/" in pid or "\\" in pid:
	            raise HTTPException(400, f"Invalid policy_id: {pid}")
	        ep = settings.EXTRACTED_DIR / f"{pid}.json"
	        data: Optional[dict] = None
	        if ep.exists():
	            try:
	                data = _json.loads(ep.read_text())
	            except Exception:
	                # Unreadable extraction — fall through to the curated layer.
	                data = None
	            if data is not None:
	                data = _merge_curated(
	                    data,
	                    _curated.get(data.get("policy_id", pid)) or _curated.get(pid),
	                )
	        if data is None:
	            # #75 (2026-05-18) — curated-only catalogued products (e.g.
	            # star-health__star-comprehensive, UIN SHAHLIP26044V092526) have
	            # NO rag/extracted/<pid>.json. The marketplace, single
	            # /api/scorecard, and bulk scorecard endpoints all resolve these
	            # from the curated layer; mirror the same curated fallback
	            # (curated dict also carries doctype-suffixed alias keys)
	            # before giving up with a 404.
	            data = (
	                _curated.get(pid)
	                or _curated.get(f"{pid}__wordings")
	                or _curated.get(f"{pid}__cis")
	                or _curated.get(f"{pid}__brochure")
	                or _curated.get(f"{pid}__prospectus")
	            )
	            if not data:
	                raise HTTPException(404, f"No data for {pid}")
	        # Insurer reviews for scorecard (optional: a missing or unreadable
	        # reviews file just means the scorecard is built without them).
	        slug = data.get("insurer_slug")
	        ir = None
	        if slug:
	            rp = settings.DATA_DIR / "reviews" / f"{slug}.json"
	            if rp.exists():
	                try:
	                    ir = _json.loads(rp.read_text())
	                except Exception:
	                    pass
	        sc = build_scorecard(data, insurer_reviews=ir)
	        entries.append(CompareEntry(
	            policy_id=pid,
	            policy_name=clean_display_policy_name(
	                data.get("policy_name", pid)
	            ),
	            insurer_slug=slug or "?",
	            fields=data,
	            scorecard=ScorecardResponse(
	                policy_id=sc.policy_id, policy_name=sc.policy_name, insurer_slug=sc.insurer_slug,
	                overall_score=sc.overall_score, grade=sc.grade, one_liner=sc.one_liner,
	                sub_scores=[ScorecardSubScore(**s.__dict__) for s in sc.sub_scores],
	                data_completeness_pct=sc.data_completeness_pct,
	                methodology_link=sc.methodology_link,
	                profile_summary=_profile_summary_model(sc),
	            ),
	        ))

	    # Comparison-critical fields, in order
	    field_order = [
	        "policy_type", "uin_code",
	        "min_entry_age", "max_entry_age",
	        "sum_insured_options",
	        "initial_waiting_period_days", "pre_existing_disease_waiting_months",
	        "maternity_waiting_months",
	        "pre_hospitalization_days", "post_hospitalization_days",
	        "day_care_treatments_count", "ayush_coverage", "maternity_coverage",
	        "newborn_coverage", "organ_donor_expenses",
	        "no_claim_bonus_pct", "restoration_benefit",
	        "room_rent_capping", "copayment_pct", "deductible_amount",
	        "network_hospital_count", "cashless_treatment_supported",
	        "claim_settlement_ratio", "tat_cashless_authorization_hours",
	    ]
	    return CompareResponse(policies=entries, field_order=field_order)


	@app.get("/api/policies/{policy_id}/scorecard", response_model=ScorecardResponse)
	async def policy_scorecard(
	policy_id: str,
	age: Optional[int] = None,
	parents_to_insure: Optional[bool] = None,
	budget_band: Optional[str] = None,
	session_id: Optional[str] = None,
	):
	"""Compute the 6-sub-score A-F scorecard for an extracted or curated-only policy.

	Now also pulls insurer-level reviews (IRDAI claim ratio + complaints) into
	the Claim Experience sub-score. See 70-docs/scorecard-methodology.md.

	§4c (task #31) — when `session_id` is supplied AND that session's profile
	is populated to ≥0.6 completeness, the policy is scored against THAT full
	profile (resolved the SAME way /api/policies/all does, via
	brain_tools.union_snapshot) so this endpoint's grade + profile_summary
	are byte-identical to the marketplace card for the same canonical id. The
	standalone `age` / `parents_to_insure` / `budget_band` query params remain
	a back-compat fallback when no session profile is available.

	Responds 500 when the bare `<policy_id>.json` extraction exists but cannot
	be parsed, and 404 when the id resolves in neither the extracted nor the
	curated layer.
	"""
	import json as _json

	from backend.scorecard import build_scorecard
	from backend.scorecard import profile_completeness as _completeness
	from backend.session_state import get_session as _get_sess

	# ROOT-CAUSE FIX (scorecard 404 for catalogued curated-only products):
	# /api/policies/all catalogues a card for every extracted JSON AND every
	# curated-facts product (40-data/policy_facts/<insurer>__<product>.json).
	# Curated-only products (e.g. Tata AIG MediCare Lite → policy_id
	# `tata-aig__medicare-lite`) have NO `rag/extracted/<policy_id>.json` —
	# only doctype-suffixed extractions like `...__cis.json` — so the old
	# `extracted_path.exists() → 404` made the scorecard hard-fail for ~77 of
	# 170 catalogued policies, surfacing as the frontend's generic Retry
	# fallback. The marketplace builds those cards' grades straight from the
	# curated dict (policies_all Pass-2 `build_scorecard(data, ...)`); the
	# scorecard endpoint must resolve the SAME way. A catalogued policy_id
	# therefore resolves from extracted-with-curated-override OR, when no
	# extracted file exists, from the curated layer alone — never a 404 for a
	# catalogued product, never a fabricated grade.
	_curated = _load_curated_facts()
	extracted_path = settings.EXTRACTED_DIR / f"{policy_id}.json"

	# Resolution order: bare extraction → doctype-suffixed extraction →
	# curated facts → 404.
	if extracted_path.exists():
	try:
	policy = _json.loads(extracted_path.read_text())
	except Exception as e:
	raise HTTPException(500, f"Could not load extracted policy: {e}")
	# KI: same curated-override as /api/policies/all so the standalone
	# scorecard reflects the corrected/verbatim 40-data/policy_facts.
	policy = _merge_curated(
	policy,
	_curated.get(policy.get("policy_id", policy_id)) or _curated.get(policy_id),
	)
	else:
	# No bare `<policy_id>.json` extraction. Task #31 PARITY FIX: the
	# marketplace card for a doctype-suffixed extracted-only product
	# (e.g. star-health__star-cardiac-care, whose only extraction is
	# `...__wordings.json`) is built by /api/policies/all Pass-1 from
	# that doctype-suffixed EXTRACTED file (preferred over curated via
	# _DOCTYPE_RANK). The standalone endpoint previously skipped straight
	# to the curated layer, so its grade + profile_summary diverged from
	# the card for the SAME canonical id. Mirror the catalogue's doctype
	# preference (wordings > prospectus > cis > brochure) on the
	# EXTRACTED layer first, with the same curated-override, before
	# falling back to a curated-only product.
	policy = None
	for _dt in ("wordings", "prospectus", "cis", "brochure"):
	_ep = settings.EXTRACTED_DIR / f"{policy_id}__{_dt}.json"
	if _ep.exists():
	try:
	policy = _json.loads(_ep.read_text())
	except Exception:
	# Unreadable sibling — try the next doctype instead of failing.
	policy = None
	continue
	policy = _merge_curated(
	policy,
	_curated.get(policy.get("policy_id", policy_id))
	or _curated.get(f"{policy_id}__{_dt}")
	or _curated.get(policy_id),
	)
	break
	if policy is None:
	# No extraction in ANY doctype — fall back to the human-curated
	# facts layer (mirrors /api/policies/all Pass 2). The curated
	# dict also carries doctype-suffixed alias keys, so try the
	# canonical id and the raw lookup keys.
	policy = _curated.get(policy_id) or _curated.get(f"{policy_id}__cis") \
	or _curated.get(f"{policy_id}__wordings") \
	or _curated.get(f"{policy_id}__brochure") \
	or _curated.get(f"{policy_id}__prospectus")
	if not policy:
	# Genuinely not in EITHER layer ⇒ this id is not a catalogued
	# product at all (bad/typo id). 404 is the correct, honest
	# response here — it is NOT a catalogued policy.
	raise HTTPException(404, f"No data for policy_id={policy_id}")
	# Shallow-copy first so the setdefault below writes the id into the copy,
	# not into the mapping that was resolved above.
	policy = dict(policy)
	policy.setdefault("policy_id", policy_id)

	# Load insurer reviews if present so the Claim Experience sub-score
	# uses authoritative IRDAI data, not just the (mostly-null) per-policy fields.
	insurer_reviews = None
	slug = policy.get("insurer_slug")
	if slug:
	rp = settings.DATA_DIR / "reviews" / f"{slug}.json"
	if rp.exists():
	try:
	insurer_reviews = _json.loads(rp.read_text())
	except Exception:
	# Best-effort: an unreadable reviews file leaves insurer_reviews as None.
	pass

	# §4c — resolve the session profile the SAME way /api/policies/all does
	# (brain_tools.union_snapshot full dict + parents_* carry-through) so this
	# endpoint's grade + profile_summary match the marketplace card for the
	# same canonical id by construction. Only when ≥0.6 complete.
	#
	# `catalogue_profile` is EXACTLY what /api/policies/all would pass to
	# _marketplace_catalogue for this session (the ≥0.6 SLOT_UNION snapshot,
	# else None) — used below for the catalogue-card parity override. The
	# back-compat query-param path is a separate, profile-NEUTRAL-vs-catalogue
	# fallback (the catalogue is never built from loose query params).
	catalogue_profile: Optional[dict] = None
	profile: dict = {}
	if session_id:
	try:
	_p = _get_sess(session_id).profile
	_pd = brain_tools.union_snapshot(_p)
	for _pf in ("parents_to_insure", "parents_age_max", "parents_has_ped"):
	if _pf not in _pd:
	_v = getattr(_p, _pf, None)
	if _v is not None:
	_pd[_pf] = _v
	if _completeness(_pd) >= 0.6:
	profile = _pd
	catalogue_profile = _pd
	except Exception: # noqa: BLE001 — bad/expired session ⇒ back-compat path
	profile = {}
	catalogue_profile = None
	if not profile:
	# Back-compat: standalone query params when no usable session profile.
	if age is not None: profile["age"] = age
	if parents_to_insure is not None: profile["parents_to_insure"] = parents_to_insure
	if budget_band is not None: profile["budget_band"] = budget_band

	# TASK #31 — SINGLE SOURCE OF TRUTH (option (a)). When this id IS a
	# marketplace card, serve the EXACT `Scorecard` object the
	# /api/policies/all catalogue built for that canonical card under THIS
	# session's profile — full sub_scores + profile_summary + grade +
	# data_completeness + one_liner, all from the catalogue's ONE
	# build_scorecard pass on the catalogue's chosen sibling
	# `(data, insurer_reviews, profile)`. Parity is byte-identical BY
	# CONSTRUCTION: the same object feeds both surfaces, so the endpoint can
	# no longer pick a different doctype sibling than the catalogue's
	# completeness-based `_best` dedup (the prior bug — the old endpoint
	# reconstructed `policy` via its own doctype-rank loop and emitted a
	# different strength set / caveat for the same canonical id).
	#
	# `_catalogue_scorecard` returns None ONLY when the id is not a
	# catalogued product at all — then we fall through to the locally-built
	# scorecard so the curated-only / back-compat query-param / never-404
	# behaviour the resolution block above guarantees is fully preserved.
	cat_sc = None
	try:
	cat_sc = _catalogue_scorecard(policy_id, catalogue_profile)
	except Exception: # noqa: BLE001 — never let the SSOT resolver 500 a card
	cat_sc = None

	# NOTE(review): when the catalogue returns a scorecard, the `profile`
	# assembled from the age / parents_to_insure / budget_band query params is
	# not used (only `catalogue_profile` reaches `_catalogue_scorecard`) —
	# confirm that is intended for catalogued ids.
	sc = cat_sc if cat_sc is not None else build_scorecard(
	policy, insurer_reviews=insurer_reviews, profile=profile or None
	)

	return ScorecardResponse(
	policy_id=sc.policy_id,
	policy_name=sc.policy_name,
	insurer_slug=sc.insurer_slug,
	overall_score=sc.overall_score,
	grade=sc.grade,
	one_liner=sc.one_liner,
	sub_scores=[ScorecardSubScore(**s.__dict__) for s in sc.sub_scores],
	data_completeness_pct=sc.data_completeness_pct,
	methodology_link=sc.methodology_link,
	insufficient_data=sc.insufficient_data,
	profile_summary=_profile_summary_model(sc),
	)


	# ----------------------------------------------------------------------------
	# Bulk scorecard endpoint — powers the PolicyCompareModal scorecard widget.
	# ----------------------------------------------------------------------------
	# Why bulk: the compare modal renders 2-4 scorecards in parallel and each is
	# profile-tuned. Doing N sequential GETs from the client wastes the per-policy
	# JSON I/O cost (we re-load every reviews file even for the same insurer) and
	# fans out N renders. One POST with the full profile + id list lets us:
	# - load each reviews file once per slug (memoized in the loop)
	# - return missing policies as N/A so the client renders a clean placeholder
	# - share one profile dict — no copy-paste of every field in N query strings
	class BulkScorecardRequest(BaseModel):
	# Request payload for the bulk scorecard endpoint: the ids to score plus
	# one optional profile dict shared by all of them.
	policy_ids: list[str]
	# Free-form profile mapping; None means no profile was supplied.
	profile: Optional[dict] = None


	class BulkScorecardEntry(BaseModel):
	# One policy's scorecard as returned inside BulkScorecardResponse.per_policy.
	policy_id: str
	policy_name: str
	insurer_slug: str
	overall_grade: str # "A" / "B+" / etc — letter only for missing
	overall_score: int # 0-100
	# Keys are presumably produced by _slugify_subscore — confirm against the endpoint.
	sub_scores: dict[str, int] # {coverage_breadth: 82, cost_predictability: 64, ...}
	profile_rationale: list[str] # bullets explaining WHY this score for this user
	data_completeness_pct: float
	one_liner: str = ""
	# raw signals per sub-score so the widget can pop-out a tooltip with detail
	signals: dict[str, list[str]] = Field(default_factory=dict)
	# Deterministic, profile-aware {strengths, caveat} — the structured
	# replacement for the generic one_liner the widget now renders at top.
	profile_summary: Optional[ProfileSummaryModel] = None


	class BulkScorecardResponse(BaseModel):
	    # Response body for POST /api/scorecard/bulk: one entry per requested
	    # policy id, keyed by that id.
	    per_policy: dict[str, BulkScorecardEntry]


	def _slugify_subscore(name: str) -> str:
	"""'Coverage Breadth' -> 'coverage_breadth' (stable key for the widget)."""
	return name.lower().replace("-", "_").replace("&", "and").replace(" ", "_").replace("__", "_")


	def _profile_rationale_for(policy: dict, profile: Optional[dict], sub_scores) -> list[str]:
	"""Turn raw signals + profile facts into 2-5 plain-English bullets.

	Each bullet is shaped as 'Strong fit:' or 'Weak fit:' so the buyer can scan
	pros and cons at a glance. We anchor each bullet to a concrete profile
	attribute (you mentioned X) so the user trusts the personalization is real.
	"""
	if not profile:
	return []
	bullets: list[str] = []
	conditions = profile.get("health_conditions") or []
	cond_str = " ".join(str(c).lower() for c in conditions) if isinstance(conditions, list) else ""
	age = profile.get("age") if isinstance(profile.get("age"), int) else None
	deps = (profile.get("dependents") or "").lower()
	loc = profile.get("location_tier")
	goal = (profile.get("primary_goal") or "").lower()
	existing = profile.get("existing_cover_inr")

	# Pre-existing disease handling
	if cond_str and any(c in cond_str for c in ("diab", "bp", "hyper", "thyroid", "heart")):
	ped = policy.get("pre_existing_disease_waiting_months")
	try:
	ped_n = int(ped) if ped is not None else None
	except (TypeError, ValueError):
	ped_n = None
	if ped_n is not None:
	if ped_n <= 24:
	bullets.append(f"Strong fit: PED waiting is only {ped_n} months — short for your {cond_str.strip()}.")
	elif ped_n >= 48:
	bullets.append(f"Weak fit: {ped_n}-month PED waiting is long for your {cond_str.strip()} — alternatives offer 24-36 months.")
	else:
	bullets.append(f"Fair fit: {ped_n}-month PED waiting is standard for your {cond_str.strip()}.")

	# Senior + claim reliability
	if age and age >= 60:
	nh = policy.get("network_hospital_count")
	try:
	nh_n = int(nh) if nh is not None else None
	except (TypeError, ValueError):
	nh_n = None
	if nh_n is not None and nh_n >= 7000:
	bullets.append(f"Strong fit: {nh_n:,}+ cashless hospitals matters at age {age} when access speed counts.")
	elif nh_n is not None and nh_n < 3000:
	bullets.append(f"Weak fit: only {nh_n} cashless hospitals — thin network for age {age}.")
	# max_renewal_age removed: lifelong renewability is the IRDAI norm for
	# every health-indemnity policy (universal → not a differentiator, and
	# the old `>= 99` check fired on the fabricated 999 sentinel).

	# Family + room-rent / maternity
	if any(k in deps for k in ("spouse", "wife", "husband", "partner", "kid", "child", "family")):
	rrc = policy.get("room_rent_capping")
	rrc_text = rrc if isinstance(rrc, str) else (rrc.get("limit_text") if isinstance(rrc, dict) else None)
	if rrc_text and "no cap" in rrc_text.lower():
	bullets.append("Strong fit: no room-rent cap — works for any hospital your family chooses.")
	elif rrc_text and ("1%" in rrc_text or "%" in rrc_text):
	metro_qual = " in a metro" if loc == "metro" else ""
	bullets.append(f"Weak fit: room rent capped ({rrc_text[:40].strip()}) may be tight for hospitals{metro_qual}.")
	if any(k in deps for k in ("spouse", "wife", "husband", "partner")):
	mc = policy.get("maternity_coverage")
	covered = mc.get("covered") if isinstance(mc, dict) else mc
	if covered is True:
	mw = policy.get("maternity_waiting_months")
	bullets.append(
	f"Strong fit: maternity covered with {mw}-month wait — relevant to your spouse."
	if mw else
	"Strong fit: maternity covered — relevant to your spouse."
	)
	elif covered is False:
	bullets.append("Weak fit: no maternity coverage — you'd need a separate rider.")

	# First-time buyer — simplicity / premium predictability
	if existing == 0:
	copay = policy.get("copayment_pct")
	try:
	copay_n = float(copay) if copay is not None else None
	except (TypeError, ValueError):
	copay_n = None
	if copay_n is not None and copay_n == 0:
	bullets.append("Strong fit: zero co-pay — simpler to budget for as a first-time buyer.")
	elif copay_n is not None and copay_n >= 20:
	bullets.append(f"Weak fit: {copay_n:.0f}% co-pay adds a surprise out-of-pocket — hard to plan as a first-time buyer.")

	# Tax-saving goal anchor
	if "tax" in goal:
	bullets.append("Note: premium qualifies for Section 80D deduction — aligned with your tax-saving goal.")

	# If we still have <2 bullets, fall back to top sub-score deltas vs neutral
	if len(bullets) < 2:
	ranked = sorted(sub_scores, key=lambda s: s.score, reverse=True)
	if ranked:
	top = ranked[0]
	bullets.append(f"Strongest area: {top.name} ({top.score}/100) — {top.summary.lower()}.")
	if len(ranked) > 1:
	bot = ranked[-1]
	if bot.score < 60:
	bullets.append(f"Watch out: {bot.name} ({bot.score}/100) — {bot.summary.lower()}.")

	return bullets[:5]


	def _letter_grade_with_plus(score: int) -> str:
	"""Convert 0-100 to A / A- / B+ / B / B- / C+ / C / C- / D / F.

	The base grade_for() returns flat letters (A/B/C/D/F). For the compare
	widget the buyer wants finer distinction between e.g. an 84 (top of B) and
	a 71 (bottom of B). Thresholds:
	90+ A, 85-89 A-, 80-84 B+, 75-79 B, 70-74 B-,
	65-69 C+, 60-64 C, 55-59 C-, 40-54 D, <40 F.
	"""
	if score >= 90: return "A"
	if score >= 85: return "A-"
	if score >= 80: return "B+"
	if score >= 75: return "B"
	if score >= 70: return "B-"
	if score >= 65: return "C+"
	if score >= 60: return "C"
	if score >= 55: return "C-"
	if score >= 40: return "D"
	return "F"


	@app.post("/api/scorecard/bulk", response_model=BulkScorecardResponse)
	async def scorecard_bulk(req: BulkScorecardRequest):
	    """Compute profile-tuned scorecards for N policies in one round-trip.

	    Body: { policy_ids: [...], profile: {...} }
	    Returns: { per_policy: { <policy_id>: { overall_grade, overall_score,
	                                            sub_scores, profile_rationale,
	                                            data_completeness_pct } } }

	    Missing policy_ids get overall_grade="N/A" + rationale=["Data not indexed"].
	    An id that contains a path separator is never looked up on disk and is
	    reported the same way. An extraction file that cannot be parsed, or that
	    does not hold a JSON object, gets an "N/A" entry whose rationale starts
	    with "Data unreadable".

	    Raises:
	        HTTPException(400): when policy_ids is empty or holds more than 8 ids.
	    """
	    import json as _json
	    from backend.scorecard import build_scorecard

	    if not req.policy_ids:
	        raise HTTPException(400, "policy_ids must be a non-empty list")
	    if len(req.policy_ids) > 8:
	        raise HTTPException(400, "bulk scorecard caps at 8 policies per call")

	    def _placeholder(pid: str, rationale: str, one_liner: str) -> BulkScorecardEntry:
	        # The "no usable data" card: N/A grade, zero score, a single bullet.
	        return BulkScorecardEntry(
	            policy_id=pid,
	            policy_name=pid,
	            insurer_slug="?",
	            overall_grade="N/A",
	            overall_score=0,
	            sub_scores={},
	            profile_rationale=[rationale],
	            data_completeness_pct=0.0,
	            one_liner=one_liner,
	            signals={},
	        )

	    profile = req.profile or None
	    insurer_cache: dict[str, Optional[dict]] = {}
	    out: dict[str, BulkScorecardEntry] = {}
	    # KI: same curated-override as /api/policies/all so the bulk scorecard
	    # badges reflect the corrected/verbatim 40-data/policy_facts.
	    _curated = _load_curated_facts()

	    for pid in req.policy_ids:
	        # pid comes straight from the request body and is used as a file stem
	        # below. Refuse anything carrying a path separator (or NUL) so a
	        # caller cannot point the read outside EXTRACTED_DIR.
	        if any(ch in pid for ch in ("/", "\\", "\x00")):
	            out[pid] = _placeholder(
	                pid, "Data not indexed", "No extraction available for this policy."
	            )
	            continue

	        extracted_path = settings.EXTRACTED_DIR / f"{pid}.json"
	        policy = None
	        if extracted_path.exists():
	            try:
	                policy = _json.loads(extracted_path.read_text(encoding="utf-8"))
	            except Exception as e:
	                out[pid] = _placeholder(
	                    pid, f"Data unreadable: {e}", "Extraction file is corrupted."
	                )
	                continue
	            if not isinstance(policy, dict):
	                # Valid JSON but not an object (list, null, ...): nothing to
	                # score, and the .get() calls below would otherwise fail the
	                # whole batch.
	                out[pid] = _placeholder(
	                    pid,
	                    "Data unreadable: extraction is not a JSON object",
	                    "Extraction file is corrupted.",
	                )
	                continue
	            policy = _merge_curated(
	                policy, _curated.get(policy.get("policy_id", pid)) or _curated.get(pid)
	            )
	        else:
	            # ROOT-CAUSE FIX #60 (2026-05-18): curated-only catalogued
	            # products (e.g. star-health__star-comprehensive, UIN
	            # SHAHLIP26044V092526) have NO rag/extracted/<pid>.json — only
	            # doctype-suffixed extractions. The marketplace + the single
	            # /api/scorecard endpoint already resolve these from the curated
	            # layer (policies_all Pass-2 / lines ~3617). The BULK endpoint
	            # did not, so it emitted the N/A "No extraction available" /
	            # "Data not indexed" sentinel — the broken-card defect the user
	            # saw for Star Comprehensive. Mirror that curated fallback here;
	            # the curated dict also carries doctype-suffixed alias keys.
	            policy = (
	                _curated.get(pid)
	                or _curated.get(f"{pid}__wordings")
	                or _curated.get(f"{pid}__cis")
	                or _curated.get(f"{pid}__brochure")
	                or _curated.get(f"{pid}__prospectus")
	            )
	            if not policy:
	                # Genuinely absent from BOTH layers ⇒ not a catalogued product.
	                out[pid] = _placeholder(
	                    pid, "Data not indexed", "No extraction available for this policy."
	                )
	                continue

	        # Load each insurer's reviews file at most once per request.
	        slug = policy.get("insurer_slug") or "?"
	        if slug not in insurer_cache:
	            insurer_cache[slug] = None
	            rp = settings.DATA_DIR / "reviews" / f"{slug}.json"
	            if rp.exists():
	                try:
	                    insurer_cache[slug] = _json.loads(rp.read_text(encoding="utf-8"))
	                except Exception:
	                    # Unreadable reviews: score the policy without them.
	                    insurer_cache[slug] = None

	        sc = build_scorecard(policy, insurer_reviews=insurer_cache[slug], profile=profile)

	        sub_map = {_slugify_subscore(s.name): s.score for s in sc.sub_scores}
	        signal_map = {_slugify_subscore(s.name): s.signals for s in sc.sub_scores}
	        psm = _profile_summary_model(sc)

	        # Bridge the legacy profile_rationale list off the deterministic
	        # profile_summary so the old field stays populated AND consistent
	        # with the new structured data (strengths + [caveat]). Only fall
	        # back to the heuristic _profile_rationale_for when the deterministic
	        # summary produced too little to be useful (insufficient-data /
	        # profile-neutral with <3 facts) so no surface goes blank.
	        if psm and psm.strengths:
	            rationale = list(psm.strengths)
	            if psm.caveat:
	                rationale.append(psm.caveat)
	        else:
	            rationale = _profile_rationale_for(policy, profile, sc.sub_scores)

	        out[pid] = BulkScorecardEntry(
	            policy_id=sc.policy_id or pid,
	            policy_name=sc.policy_name or pid,
	            insurer_slug=sc.insurer_slug or slug,
	            overall_grade=_letter_grade_with_plus(sc.overall_score),
	            overall_score=sc.overall_score,
	            sub_scores=sub_map,
	            profile_rationale=rationale,
	            data_completeness_pct=sc.data_completeness_pct,
	            one_liner=sc.one_liner,
	            signals=signal_map,
	            profile_summary=psm,
	        )

	    return BulkScorecardResponse(per_policy=out)


	class ReviewsResponse(BaseModel):
	    # Response body for GET /api/insurers/{insurer_slug}/reviews. Only the
	    # two identity fields are required; every other field has an empty
	    # default.
	    insurer_slug: str
	    insurer_name: str
	    # #76 — these structured sub-objects are NOT present in every review
	    # file (e.g. acko.json has none); requiring them 500'd the endpoint and
	    # blanked the whole reputation panel even though real data existed.
	    # Default-empty so the endpoint always returns 200 with whatever real
	    # data the file does have (InsurerReviewsBlock already renders each
	    # sub-object conditionally).
	    aggregate_score: dict = Field(default_factory=dict)
	    claim_metrics: dict = Field(default_factory=dict)
	    aggregator_ratings: dict = Field(default_factory=dict)
	    reddit_sentiment: dict = Field(default_factory=dict)
	    youtube_coverage: dict = Field(default_factory=dict)
	    in_news: list = Field(default_factory=list)
	    last_updated: str = ""


	@app.get("/api/insurers/{insurer_slug}/reviews", response_model=ReviewsResponse)
	async def get_reviews(insurer_slug: str):
	    """Aggregated reviews + claim metrics for an insurer.

	    Data sourced from IRDAI annual report + PolicyBazaar/InsuranceDekho +
	    Reddit r/IndianFinance + YouTube finance creators (Ditto et al) +
	    news mentions. Per-insurer JSON at 40-data/reviews/<slug>.json — see
	    40-data/reviews/INDEX.md for leaderboard.

	    Raises:
	        HTTPException(404): no reviews file exists for ``insurer_slug``.
	        HTTPException(500): the file exists but cannot be read, parsed or
	            validated; the original error is kept as the exception cause.
	    """
	    import json
	    p = settings.DATA_DIR / "reviews" / f"{insurer_slug}.json"
	    if not p.exists():
	        raise HTTPException(404, f"No reviews for insurer={insurer_slug}")
	    try:
	        # Read as UTF-8 explicitly rather than the platform default.
	        d = json.loads(p.read_text(encoding="utf-8"))
	        return ReviewsResponse(**d)
	    except Exception as e:
	        # Chain the cause so server logs show the real failure behind the 500.
	        raise HTTPException(500, f"Failed to load reviews: {e}") from e


	class PremiumEstimateRequest(BaseModel):
	    # Request body for POST /api/premium/estimate.
	    age: int = Field(..., ge=0, le=120)
	    sum_insured_inr: int = Field(..., ge=100000, le=100000000)
	    # Raw string with an unescaped "|": an escaped bar is a literal pipe in
	    # a regex, which would make the pattern reject "metro", "tier1" and
	    # "tier2" and accept only the text "metro|tier1|tier2".
	    city_tier: str = Field("metro", pattern=r"^(metro|tier1|tier2)$")
	    smoker: bool = False
	    # family_size: 0 is the slider "self-only" sentinel (treated identical to 1)
	    family_size: int = Field(1, ge=0, le=8)
	    policy_id: Optional[str] = None
	    # Pre-existing condition flag — controls PED premium load. Allowed values
	    # mirror the FALLBACK_PED keys in backend/premium_calculator.py
	    pre_existing_conditions: str = Field(
	        "none",
	        pattern=r"^(none|diabetes_or_hypertension|heart_disease|multiple)$",
	    )
	    # Voluntary co-payment % — reduces premium ~7% per 10pp of co-pay
	    copayment_pct: float = Field(0.0, ge=0, le=40)
	    # Family medical history tokens (cancer / diabetes / heart_disease / …).
	    # Applies the same family_history_loading (1.0×–1.10×) the header band and
	    # bulk path use, so the per-policy panel reflects family history too (#52).
	    family_medical_history: Optional[list[str]] = None
	    # B2 widget parity (KI-bugfix, 2026-05-15) — optional slider overrides so
	    # PolicyPremiumWidget (compare modal) can use the same curated-anchored
	    # estimate() pipeline as PremiumCalculatorPanel instead of the divergent
	    # bulk_estimate() flat-base path. Applied as straight multipliers on top
	    # of the estimate() result using premium_calculator.BULK_TENURE_MULT /
	    # BULK_DEDUCTIBLE_DISCOUNT constants — leaves estimate() math untouched.
	    tenure_years: Optional[int] = Field(None, ge=1, le=3)
	    deductible_inr: Optional[int] = Field(None, ge=0, le=200_000)


	class PremiumEstimateResponse(BaseModel):
	    # Response body for POST /api/premium/estimate: a point estimate with a
	    # low/high range, plus the metadata the premium widgets render with it.
	    policy_id: str
	    point_estimate_inr: int
	    low_inr: int
	    high_inr: int
	    methodology: str
	    sources: list[str]
	    is_illustrative: bool = True
	    disclaimer: str = (
	        "Illustrative range only — actual premium depends on underwriting + "
	        "medical history + risk factors. Confirm with the insurer before purchase."
	    )
	    # Echo back the effective tenure / deductible so the widget can render a
	    # consistent breakdown line without re-deriving them. Optional for legacy
	    # callers (PremiumCalculatorPanel ignores both).
	    tenure_years: Optional[int] = None
	    deductible_inr: Optional[int] = None
	    # BUG #29 — whether THIS policy genuinely offers a user-selectable
	    # voluntary deductible (curated deductible_amount > 0 AND not a
	    # top-up). Only ~2 of 148 do. The widget hides the deductible selector
	    # entirely when False; allowed_deductibles is the exact pill set.
	    supports_voluntary_deductible: bool = False
	    allowed_deductibles: list[int] = [0]
	    # True when the underlying estimate() anchored to a curated quote sample.
	    # PolicyPremiumWidget uses this (instead of bulk_estimate's `assumed` flag)
	    # to decide whether to show its "Estimate" badge.
	    base_sample_used: bool = False
	    # D2 (2026-05-16) — non-null ONLY when the policy publishes no
	    # corroborated Sum Insured, so this estimate was priced against a
	    # fallback cover. The frontend renders it verbatim under the estimate:
	    # "Estimate shown for ₹X cover — this policy's sum insured isn't published."
	    sum_insured_disclosure: Optional[str] = None


	@app.post("/api/premium/estimate", response_model=PremiumEstimateResponse)
	async def premium_estimate(req: PremiumEstimateRequest):
	    """Illustrative premium calculator — rules-based estimate from curated public data.

	    Runs the per-policy estimate, then applies the optional tenure and
	    voluntary-deductible multipliers to the point / low / high figures,
	    rounding to whole rupees after each step. The effective tenure and
	    deductible are echoed back in the response.
	    """
	    from backend.premium_calculator import (
	        BULK_DEDUCTIBLE_DISCOUNT,
	        BULK_TENURE_MULT,
	        estimate as _estimate,
	        policy_deductible_support,
	    )

	    quote = _estimate(
	        age=req.age,
	        sum_insured_inr=req.sum_insured_inr,
	        city_tier=req.city_tier,
	        smoker=req.smoker,
	        family_size=req.family_size,
	        policy_id=req.policy_id,
	        pre_existing_conditions=req.pre_existing_conditions,
	        copayment_pct=req.copayment_pct,
	        family_medical_history=req.family_medical_history,
	    )

	    # (point, low, high), rescaled in place by each adjustment below.
	    figures = [quote.point_estimate_inr, quote.low_inr, quote.high_inr]
	    effective_tenure = None
	    effective_ded = None

	    # Tenure: a value with no multiplier of its own is priced as 1 year.
	    if req.tenure_years is not None:
	        effective_tenure = req.tenure_years if req.tenure_years in BULK_TENURE_MULT else 1
	        tenure_mult = BULK_TENURE_MULT.get(effective_tenure, 1.0)
	        figures = [int(round(amount * tenure_mult)) for amount in figures]

	    # BUG #29 — only a policy that genuinely supports a voluntary deductible
	    # may be discounted for one; for every other policy a caller-supplied
	    # deductible must NOT move the premium.
	    _supports, _allowed = policy_deductible_support(req.policy_id)
	    if req.deductible_inr is not None:
	        wanted = req.deductible_inr
	        if not _supports or wanted not in _allowed:
	            # Unsupported policy, or a value outside its allowed set: echo 0
	            # honestly instead of granting a phantom discount.
	            effective_ded = 0
	        elif wanted in BULK_DEDUCTIBLE_DISCOUNT:
	            effective_ded = wanted
	        else:
	            # Snap to the closest bucket that has a discount defined.
	            effective_ded = min(
	                BULK_DEDUCTIBLE_DISCOUNT.keys(),
	                key=lambda bucket: abs(bucket - wanted),
	            )
	        ded_mult = BULK_DEDUCTIBLE_DISCOUNT.get(effective_ded, 1.0)
	        figures = [int(round(amount * ded_mult)) for amount in figures]

	    # D2 — a policy with NO corroborated Sum Insured was necessarily priced
	    # against the cover the caller sent; attach the disclosure so the user
	    # knows that cover is assumed. Best effort: any failure just omits it.
	    si_disclosure = None
	    if req.policy_id:
	        try:
	            if _policy_corroborated_si(req.policy_id).kind == "none":
	                from backend.premium_calculator import unpublished_si_disclosure
	                si_disclosure = unpublished_si_disclosure(req.sum_insured_inr)
	        except Exception:
	            si_disclosure = None

	    point, low, high = figures
	    return PremiumEstimateResponse(
	        policy_id=quote.policy_id,
	        point_estimate_inr=point,
	        low_inr=low,
	        high_inr=high,
	        methodology=quote.methodology,
	        sources=quote.sources or [],
	        tenure_years=effective_tenure,
	        deductible_inr=effective_ded,
	        supports_voluntary_deductible=_supports,
	        allowed_deductibles=_allowed,
	        base_sample_used=quote.base_sample_used is not None,
	        sum_insured_disclosure=si_disclosure,
	    )


	# ---------------------------------------------------------------------------
	# /api/premium/bulk — multi-policy slider-driven premium calculator
	# Powers the PolicyPremiumWidget inside PolicyCompareModal.
	# ---------------------------------------------------------------------------

	class PremiumBulkProfile(BaseModel):
	    # Buyer profile slice accepted by POST /api/premium/bulk. Every field is
	    # optional; the handler forwards only the non-None ones to the estimator.
	    age: Optional[int] = Field(None, ge=0, le=120)
	    dependents: Optional[str] = None
	    location_tier: Optional[str] = None
	    family_size: Optional[int] = Field(None, ge=0, le=10)
	    smoker: Optional[bool] = False
	    pre_existing_conditions: Optional[str] = "none"


	class PremiumBulkOverride(BaseModel):
	    # Per-policy slider overrides for POST /api/premium/bulk; a field left
	    # as None is dropped before the overrides reach the estimator.
	    sum_insured_inr: Optional[int] = Field(None, ge=100_000, le=100_000_000)
	    tenure_years: Optional[int] = Field(None, ge=1, le=3)
	    deductible_inr: Optional[int] = Field(None, ge=0, le=200_000)


	class PremiumBulkRequest(BaseModel):
	    # Request body for POST /api/premium/bulk.
	    # Between 1 and 20 policy ids per call.
	    policy_ids: list[str] = Field(..., min_length=1, max_length=20)
	    # Defaults to an all-default PremiumBulkProfile when omitted.
	    profile: PremiumBulkProfile = Field(default_factory=PremiumBulkProfile)
	    # Optional overrides keyed by policy id.
	    overrides: Optional[dict[str, PremiumBulkOverride]] = None


	class PremiumBulkRow(BaseModel):
	    # One policy's result in the bulk premium response; the handler copies
	    # each field from the matching attribute of the estimator's row.
	    policy_id: str
	    premium_inr_annual: int
	    breakdown: dict
	    sum_insured_inr: int
	    tenure_years: int
	    deductible_inr: int
	    assumed: bool
	    notes: list[str] = []


	class PremiumBulkResponse(BaseModel):
	    # Response body for POST /api/premium/bulk.
	    # Rows keyed by policy id.
	    per_policy: dict[str, PremiumBulkRow]
	    # The request's profile, echoed back unchanged by the handler.
	    profile_used: PremiumBulkProfile
	    disclaimer: str = (
	        "Illustrative estimates only — actual premiums depend on underwriting, "
	        "medical history, and quote-time risk factors. Confirm with the insurer."
	    )


	@app.post("/api/premium/bulk", response_model=PremiumBulkResponse)
	async def premium_bulk(req: PremiumBulkRequest):
	    """Bulk slider-driven premium estimator for the PolicyCompareModal widget.

	    Forwards the policy ids, the non-None profile fields and the per-policy
	    overrides to ``bulk_estimate`` and repackages each returned row as a
	    ``PremiumBulkRow`` keyed by policy id.
	    """
	    from backend.premium_calculator import bulk_estimate as _bulk

	    # Plain dicts per policy, with unset override fields left out.
	    overrides = {}
	    for policy_id, override in (req.overrides or {}).items():
	        overrides[policy_id] = override.model_dump(exclude_none=True) if override else {}

	    rows = _bulk(
	        policy_ids=req.policy_ids,
	        profile=req.profile.model_dump(exclude_none=True),
	        overrides=overrides,
	    )

	    per_policy = {}
	    for policy_id, row in rows.items():
	        per_policy[policy_id] = PremiumBulkRow(
	            policy_id=row.policy_id,
	            premium_inr_annual=row.premium_inr_annual,
	            breakdown=row.breakdown,
	            sum_insured_inr=row.sum_insured_inr,
	            tenure_years=row.tenure_years,
	            deductible_inr=row.deductible_inr,
	            assumed=row.assumed,
	            notes=row.notes,
	        )

	    return PremiumBulkResponse(per_policy=per_policy, profile_used=req.profile)


	@app.post("/api/tts")
	async def tts(req: TTSRequest):
	    """Standalone TTS endpoint — returns base64 WAV.

	    Raises:
	        HTTPException(500): synthesis failed; the provider error is kept as
	            the exception cause.
	    """
	    try:
	        audio = await get_tts().synthesize(
	            text=req.text,
	            language_code=req.language_code,
	            speaker=req.speaker,
	        )
	    except Exception as e:
	        # Chain the cause so the provider traceback survives next to the 500.
	        raise HTTPException(500, f"TTS failed: {type(e).__name__}: {e}") from e
	    return JSONResponse({"audio_base64": base64.b64encode(audio).decode("utf-8")})


	@app.get("/api")
	async def api_root():
	    """Service banner: name, version, and the docs / health-check paths."""
	    banner = dict(
	        service="Insurance Sales Portfolio Expert API",
	        version="0.1.0",
	        docs="/docs",
	        health="/api/health",
	    )
	    return banner


	# ---------------------------------------------------------------------------
	# Profile-level predicted-premium BAND — feeds the chat-UI chip that sits
	# next to the "X% DONE" profile-completeness pill. Updates reactively as the
	# profile fills in (frontend refetches whenever completeness_pct changes).
	# ---------------------------------------------------------------------------
	class PredictedPremiumBandResponse(BaseModel):
	    # Response body for GET /api/profile/predicted-premium-band. The handler
	    # returns an all-zero band with assumed=True when no session id is sent.
	    min_inr: int
	    median_inr: int
	    max_inr: int
	    sample_size: int
	    assumed: bool
	    # #63 — the SI the band was priced at. estimate_premium_band's KI-278
	    # contract already returns this; the model dropped it, so the pill
	    # couldn't tell the user the band is the TYPICAL cohort range at this
	    # cover (vs the per-plan LIVE PREMIUM, which is one specific plan and
	    # may sit outside the typical band — expected, not a contradiction).
	    sum_insured_used: int = 0


	@app.get(
	    "/api/profile/predicted-premium-band",
	    response_model=PredictedPremiumBandResponse,
	)
	async def predicted_premium_band(session_id: Optional[str] = None):
	    """Estimated premium band for the session's profile.

	    The band is aggregated across a representative basket of marketplace
	    policies and uses the same slot shape as /api/profile/completeness, so
	    the chip and the bar share triggers. Without a session id the response
	    is an all-zero band flagged as assumed.
	    """
	    from backend.premium_calculator import estimate_premium_band
	    from backend.session_state import get_session

	    if not session_id:
	        return PredictedPremiumBandResponse(
	            min_inr=0, median_inr=0, max_inr=0, sample_size=0, assumed=True,
	            sum_insured_used=0,
	        )

	    p = get_session(session_id).profile
	    # KI-271 — read every SLOT_UNION slot so copay_pct and
	    # family_medical_history (D2/KI-269) can shift the band; the earlier
	    # hand-rolled 12-key dict silently left both out.
	    slot_values = [
	        (slot, getattr(p, slot, None)) for slot in brain_tools.SLOT_UNION
	    ]
	    # Answered-only gate, as in profile_completeness_view (KI-196 / ADR-041):
	    # a slot the user has not answered is passed as None, so pre-populated
	    # defaults cannot move the band.
	    answered = set(getattr(p, "asked", []) or [])
	    gated_profile = {}
	    for slot, value in slot_values:
	        gated_profile[slot] = value if slot in answered else None

	    return PredictedPremiumBandResponse(**estimate_premium_band(gated_profile))


	# /api/profile/recall-by-name was REMOVED in ADR-043 (2026-05-27).
	# Cross-session profile recall is gone — sessions are in-memory only, so
	# there is nothing to "recall" off a bare name. The frontend api.ts caller
	# that wrapped this endpoint has also been removed. Old clients still
	# pinging the path get a 404, which is the correct degraded behaviour.


	# ---- Static frontend (served alongside /api on the same port for HF Spaces) ----
	# The Next.js frontend is statically exported during the Docker build to
	# /app/frontend/out. In local dev, this directory may not exist — we still
	# want the backend to start cleanly.
	import os
	from pathlib import Path as _Path

	# Two directory levels above this file, then frontend/out.
	_FRONTEND_DIR = _Path(__file__).resolve().parent.parent / "frontend" / "out"
	if _FRONTEND_DIR.exists():
	    # Serve the built site as the catch-all. /api/* routes registered above
	    # take precedence because they are matched first.
	    app.mount("/", StaticFiles(directory=str(_FRONTEND_DIR), html=True), name="static")
	else:
	    # No static export on disk: answer "/" with a JSON banner that tells
	    # the developer how to build the frontend.
	    @app.get("/")
	    async def root():
	        return {
	            "service": "Insurance Sales Portfolio Expert API",
	            "version": "0.1.0",
	            "frontend": "not built — run `cd frontend && npm run build`",
	            "docs": "/docs",
	            "health": "/api/health",
	        }


	# ---- #40 SSOT grade resolver ------------------------------------------------
	# marketplace_grade(policy_id) returns the SAME (grade, overall) the
	# marketplace card for that policy's canonical identity shows. The
	# recommendation path calls this instead of re-deriving a scorecard, so
	# rec-card grade == marketplace grade for ALL 148 by construction.

	import threading as _mg_threading

	# Held by _mg_index while it checks and, if needed, rebuilds _MG_CACHE.
	_MG_LOCK = _mg_threading.Lock()
	# "sig" is the data signature the cached "index" was built for; both stay
	# None until the first build.
	_MG_CACHE: dict = {"sig": None, "index": None}


	def _mg_data_signature() -> tuple:
	    """Cheap fingerprint that changes when any grading input changes
	    (so an uploaded-PDF card or a curated edit invalidates the cache).

	    Each entry is (name, mtime in nanoseconds, size) for one JSON file under
	    the extracted / policy_facts / reviews directories, plus one entry per
	    uploaded-doc record.json. Nanosecond mtimes are used because a
	    whole-second timestamp misses a same-size rewrite made within the same
	    second. The value is only ever compared for equality.
	    """
	    sig = []
	    for d in (settings.EXTRACTED_DIR, settings.DATA_DIR / "policy_facts",
	              settings.DATA_DIR / "reviews"):
	        try:
	            for fp in sorted(d.glob("*.json")):
	                st = fp.stat()
	                sig.append((fp.name, st.st_mtime_ns, st.st_size))
	        except Exception:  # noqa: BLE001 — missing dir → empty contribution
	            continue
	    # #52 — PERSISTED uploaded-doc records are ALSO grading inputs
	    # (_load_curated_facts merges them). Walk the persistent UPLOADED_DOCS_DIR
	    # so a brand-new upload — or a restart that re-materialised the dir —
	    # invalidates the #40 grade cache and the new card grades immediately.
	    try:
	        for fp in sorted(settings.UPLOADED_DOCS_DIR.glob("*/record.json")):
	            st = fp.stat()
	            sig.append((str(fp.relative_to(settings.UPLOADED_DOCS_DIR)),
	                        st.st_mtime_ns, st.st_size))
	    except Exception:  # noqa: BLE001 — missing dir → empty contribution
	        pass
	    return tuple(sig)


	def _mg_norm_uin(raw) -> str:
	try:
	from backend.policy_identity import normalize_uin
	return normalize_uin(raw)
	except Exception: # noqa: BLE001
	return ""


	def _mg_build_index() -> dict:
	    """Build {lookup_key -> (grade, overall_score)} over every marketplace card.

	    Each card is registered under up to three keys: "id:<policy_id>",
	    "pk:<product_key>" and "uin:<normalised UIN>", so a variant / alias id
	    resolves to its canonical card's grade. The first card to claim a key
	    keeps it.
	    """
	    cards = _marketplace_catalogue(None)
	    curated = _load_curated_facts()
	    index: dict = {}

	    for card in cards:
	        graded = (card.grade, card.overall_score)
	        pid = card.policy_id or ""
	        index.setdefault(f"id:{pid}", graded)

	        try:
	            from backend.policy_identity import product_key as _pk
	            index.setdefault(f"pk:{_pk(pid)}", graded)
	        except Exception:  # noqa: BLE001
	            pass

	        # UIN of the card's underlying data (curated wins, like the catalogue)
	        facts = curated.get(pid) or {}
	        uin = _mg_norm_uin(facts.get("uin_code") or facts.get("uin"))
	        if not uin:
	            # Nothing curated: fall back to the extraction file, if present.
	            try:
	                extracted = settings.EXTRACTED_DIR / f"{pid}.json"
	                if extracted.exists():
	                    import json as _j
	                    uin = _mg_norm_uin(_j.loads(extracted.read_text()).get("uin_code"))
	            except Exception:  # noqa: BLE001
	                uin = ""
	        if uin:
	            index.setdefault(f"uin:{uin}", graded)

	    return index


	def _mg_index() -> dict:
	    """The grade index, rebuilt under the lock whenever the data signature changes."""
	    current_sig = _mg_data_signature()
	    with _MG_LOCK:
	        stale = _MG_CACHE["index"] is None or _MG_CACHE["sig"] != current_sig
	        if stale:
	            _MG_CACHE["index"] = _mg_build_index()
	            _MG_CACHE["sig"] = current_sig
	        return _MG_CACHE["index"]


	# Task #31 — profile-keyed {policy_id -> MarketplacePolicy} index so the
	# single /api/policies/{id}/scorecard endpoint can serve the EXACT card the
	# /api/policies/all catalogue produced for that id. This is the only way to
	# guarantee byte-identical profile_summary (and grade / overall_score) for
	# every card id — including doctype-suffixed stems the catalogue's pre-
	# existing #133/#145 dedup picks as the canonical card-id while computing
	# the scorecard from a different-doctype sibling. We do NOT re-architect
	# that dedup (out of scope, protected by test_full_id_universe_parity);
	# instead the endpoint defers to the catalogue, the single source of truth.
	# Held by _catalogue_indices while it reads or rebuilds a cache entry.
	_CAT_CARD_LOCK = _mg_threading.Lock()
	# One entry per distinct profile key; _catalogue_indices trims the dict
	# back to 16 entries after an insert.
	_CAT_CARD_CACHE: dict = {} # profile_key -> (sig, card_idx, sc_idx)


	def _profile_cache_key(profile: Optional[dict]) -> str:
	if not profile:
	return "∅"
	import json as _j

	return _j.dumps(
	{k: profile[k] for k in sorted(profile)},
	sort_keys=True, default=str,
	)


	def _catalogue_indices(profile: Optional[dict]) -> tuple[dict, dict]:
	    """Return the catalogue's card index and scorecard index for `profile`.

	    The first dict maps policy_id to its MarketplacePolicy card. The second
	    is the dict `_marketplace_catalogue` fills through `_collect_scorecards`
	    (Task #31): the Scorecard built for each surviving card, which
	    `/api/policies/{id}/scorecard` serves verbatim.

	    Results are cached per profile key and reused while the data signature
	    is unchanged, so repeated single-scorecard calls in one render do not
	    rebuild the catalogue per request.
	    """
	    current_sig = _mg_data_signature()
	    pkey = _profile_cache_key(profile)
	    with _CAT_CARD_LOCK:
	        cached = _CAT_CARD_CACHE.get(pkey)
	        if cached is not None and cached[0] == current_sig:
	            return cached[1], cached[2]

	        scorecards: dict = {}
	        cards = _marketplace_catalogue(profile, _collect_scorecards=scorecards)
	        cards_by_id = {card.policy_id: card for card in cards}
	        _CAT_CARD_CACHE[pkey] = (current_sig, cards_by_id, scorecards)
	        # Bound the cache so distinct profiles don't grow it unbounded:
	        # keep only the 16 most recently inserted keys.
	        if len(_CAT_CARD_CACHE) > 16:
	            for old_key in list(_CAT_CARD_CACHE.keys())[:-16]:
	                _CAT_CARD_CACHE.pop(old_key, None)
	        rebuilt = _CAT_CARD_CACHE[pkey]
	    return rebuilt[1], rebuilt[2]


	def _catalogue_card_index(profile: Optional[dict]) -> dict:
	    """Back-compat shim: only the {policy_id -> MarketplacePolicy} half of
	    `_catalogue_indices(profile)`."""
	    card_idx, _scorecards = _catalogue_indices(profile)
	    return card_idx


	# Doctype suffixes used to canonicalise a requested policy_id onto the
	# catalogue's surviving card id (mirrors _marketplace_catalogue._ident).
	_SCORECARD_DOCT = ("wordings", "brochure", "cis", "prospectus", "policy")


	def _canonical_ident(pid: str) -> str:
	for dt in _SCORECARD_DOCT:
	if pid.endswith(f"__{dt}"):
	return pid[: -(len(dt) + 2)]
	return pid


	def _catalogue_scorecard(policy_id: str, profile: Optional[dict]):
	    """Look up the catalogue's own `Scorecard` for `policy_id` under `profile`.

	    Resolution order: the stripped id itself, then its doctype-stripped
	    canonical id, then any catalogue card whose `aliases` holds either the
	    id or its cleaned display name. Returns None (never raises a 404) when
	    nothing matches, so the caller keeps its own fallback for ids that are
	    not catalogue cards.
	    """
	    if not policy_id:
	        return None

	    card_idx, sc_idx = _catalogue_indices(profile)
	    pid = policy_id.strip()

	    direct = sc_idx.get(pid) or sc_idx.get(_canonical_ident(pid))
	    if direct is not None:
	        return direct

	    # Alias path: a marketing-rename id maps onto its canonical card.
	    try:
	        from backend.policy_identity import clean_display_policy_name
	        want = clean_display_policy_name(pid)
	    except Exception:  # noqa: BLE001
	        want = pid

	    for card in card_idx.values():
	        aliases = card.aliases or []
	        if pid not in aliases and want not in aliases:
	            continue
	        via_alias = sc_idx.get(card.policy_id) or sc_idx.get(
	            _canonical_ident(card.policy_id)
	        )
	        if via_alias is not None:
	            return via_alias
	    return None


	def marketplace_grade(policy_id: str) -> dict:
	    """Grade and overall score of `policy_id`'s marketplace card.

	    Returns {"_grade": ..., "_overall_score": ...} taken from the grade
	    index. Lookup keys are tried in order: exact id, product key, then UIN
	    (so a marketing-rename / variant id maps onto its canonical card).
	    Returns {} when `policy_id` is empty or none of the keys is indexed.
	    """
	    if not policy_id:
	        return {}

	    idx = _mg_index()
	    from backend.policy_identity import product_key as _pk
	    curated = _load_curated_facts()
	    pid = policy_id.strip()
	    pkey = _pk(pid)
	    lookup_keys = [f"id:{pid}", f"pk:{pkey}"]

	    # UIN: curated facts first, then the extraction files for either id.
	    facts = curated.get(pid) or curated.get(pkey) or {}
	    uin = _mg_norm_uin(facts.get("uin_code") or facts.get("uin"))
	    if not uin:
	        try:
	            import json as _j
	            for stem in (pid, pkey):
	                extracted = settings.EXTRACTED_DIR / f"{stem}.json"
	                if not extracted.exists():
	                    continue
	                uin = _mg_norm_uin(_j.loads(extracted.read_text()).get("uin_code"))
	                if uin:
	                    break
	        except Exception:  # noqa: BLE001
	            uin = ""
	    if uin:
	        lookup_keys.append(f"uin:{uin}")

	    for key in lookup_keys:
	        if key in idx:
	            grade, overall = idx[key]
	            return {"_grade": grade, "_overall_score": overall}
	    return {}