Spaces:

rohitsar567
/

InsuranceBot

Sleeping

App Files Files Community

InsuranceBot / backend /brain_tools.py

rohitsar567

feat!: remove cross-session profile recall (ADR-043) — net −3700 LOC

6d5684e about 1 month ago

Raw

History Blame Contribute Delete

93.7 kB

	"""Tool functions for single_brain.py (Path B — single-LLM architecture).

	The Gemini Flash model exposed in `backend/single_brain.py` calls these
	three tools to (a) persist captured profile fields, (b) retrieve policy
	chunks from Chroma, and (c) mark which policies it has recommended on
	the current turn so follow-ups like "tell me more about #2" can resolve.

	Each function:
	* Takes plain JSON-serialisable inputs (str / int / list[str]).
	* Returns a plain JSON-serialisable dict that gets fed back to the LLM
	on the next iteration of the function-calling loop.
	* Never raises — failures are surfaced via {"ok": False, "error": "..."}
	so the LLM can decide whether to retry or recover.

	The Gemini function-calling DSL (JSON Schema-flavoured) for these three
	tools is generated by `single_brain.TOOL_SCHEMAS` from this module's
	metadata.

	═══════════════════════════════════════════════════════════════════════════
	SLOT_UNION — SINGLE SOURCE OF TRUTH FOR CAPTURED FIELDS (B6, 2026-05-15)
	═══════════════════════════════════════════════════════════════════════════
	SLOT_UNION enumerates every captured field that influences EITHER the
	recommendation pipeline (retrieval query + scorecard) OR the pricing
	pipeline (premium_calculator.estimate / bulk_estimate). It is the contract
	between brain_tools (capture surface), single_brain (LLM tool calls),
	premium_calculator (pricing inputs) and scorecard (match scoring).

	Slot → consumer matrix:

	RECOMMENDATION SLOTS (in _REQUIRED_FOR_READY — hard gate)
	name → profile identity (no pricing influence)
	age → retrieval query + scorecard + pricing (age band)
	dependents → retrieval query + scorecard + pricing (family loading)
	location_tier → retrieval query + scorecard + pricing (location loading)
	income_band → retrieval query + scorecard
	primary_goal → retrieval query + scorecard
	health_conditions → retrieval query + scorecard + pricing (health loading)

	PRICING-ONLY SLOTS (B5 + B6 additions — SOFT capture, post-recap)
	budget_band → pricing band match
	desired_sum_insured_inr → pricing SI override (per-policy estimate)
	existing_cover_inr → pricing (existing-cover discount loading)

	FAMILY-DETAIL SLOTS (used by pricing if dependents includes parents)
	parents_to_insure → triggers parents_loading branch
	parents_age_max → pricing (parents age loading 1.0× / 1.4× / 1.8×)
	parents_has_ped → pricing (PED loading inflation for parents)

	D2 ADDITIONS (2026-05-15 — copay + family medical history)
	copay_pct → pricing (copay discount 1.0× / 0.95× / 0.88× / 0.80×)
	family_medical_history → pricing (family-history loading) + retrieval boost

	KI-275 (2026-05-15 — smoker / tobacco)
	smoker → pricing (smoker_loading 1.0× / 1.40×, +30-50%)

	Total: 17 slots — the 16 listed above plus `budget_inr`, the exact ₹/yr
	companion to budget_band. `gender` is tolerated by save_profile_field for
	forward compat but is NOT on the Profile dataclass today; it does not
	appear in SLOT_UNION because no consumer reads it.
	"""

	from __future__ import annotations

	import json as _json
	import logging
	import time
	from pathlib import Path
	from typing import Any, Optional

	from backend.config import settings
	from backend.policy_identity import clean_display_policy_name

	_log = logging.getLogger(__name__)


	# ───────────────────────────────────────────────────────────────────────────
	# KI-278 (2026-05-16) — policy-fact enrichment for the eligibility/ranking
	# filter. The Chroma chunk only carries citation metadata; the structural
	# facts the eligibility filter needs (top-up signal, sum-insured options,
	# mandatory co-pay) live in 40-data/policy_facts/*.json.
	#
	# IMPORTANT: this code only READS those JSON files and only reads STABLE
	# SCHEMA KEYS (policy_type_indemnity_or_fixed / deductible_amount /
	# co_payment_pct / sum_insured_options). The concurrent scorecard-repair
	# process rewrites the values; the field names are the contract and do
	# not change. We never write to policy_facts/*.json.
	#
	# A short in-process cache keeps this off the hot path (the catalog is ~250
	# files; we only ever touch the ≤8 retrieved per turn, and memoise stems).
	# ───────────────────────────────────────────────────────────────────────────

	# Directory of curated per-policy facts files (`<stem>.json`). This module
	# only ever reads from it.
	_FACTS_DIR = settings.DATA_DIR / "policy_facts"
	# Doctype suffixes a policy_id stem may end with. Stripping one gives the
	# canonical `insurer__product` stem; appending each gives the sibling stems
	# (see _candidate_stems).
	_DOCTYPE_SUFFIXES = ("__wordings", "__brochure", "__cis", "__prospectus")
	# Width of the Chroma candidate pool pulled before eligibility +
	# scorecard-aware ranking — wide enough that a strong policy ranked only
	# mid-cosine for a generic query still enters contention. The LLM still
	# only sees the top-k best-fit survivors.
	_RECALL_POOL = 40
	# The only keys _load_policy_facts copies out of a facts file; each value is
	# passed through _unwrap before being returned.
	_FACT_KEYS = (
	    "policy_type_indemnity_or_fixed",
	    # Raw catalog type key — some curated files carry the product type
	    # only under `policy_type` (e.g. "hospital_cash") with no
	    # `policy_type_indemnity_or_fixed`; the fixed-benefit gate needs it.
	    "policy_type",
	    "deductible_amount",
	    "co_payment_pct",
	    "sum_insured_options",
	    # Eligibility-gate keys (read-only):
	    #   uin_code           → canonical dedup identity (1 UIN = 1 product;
	    #                        collapses doctype-sibling/rename duplicates).
	    #   max_entry_age      → hard eligibility for the insured person; the
	    #                        curated value is authoritative and overrides
	    #                        a missing/None Chroma chunk field.
	    #   maternity_coverage → required-feature gate: an explicit maternity /
	    #   newborn_coverage     newborn need ranks confirmed plans first.
	    "uin_code",
	    "max_entry_age",
	    "maternity_coverage",
	    "newborn_coverage",
	)

	# Bug #44 (2026-05-19) — DECISION-CRITICAL coverage fields that MUST be
	# resolved from the SAME canonical curated entry the marketplace
	# scorecard / #31 profile-summary path uses, so a verbal answer (or a
	# comparison TABLE the LLM builds from get_policy_facts) can never
	# contradict the scorecard card for the same policy.
	#
	# Root cause: each product has a base 40-data/policy_facts/<id>.json AND
	# doctype siblings (__wordings/__cis/__brochure/__prospectus). The
	# scorecard path resolves via main._load_curated_facts() (KI-219/KI-251
	# canonical precedence). get_policy_facts previously surfaced facts via
	# _load_policy_facts() — a DIFFERENT _candidate_stems resolver whose
	# 7-key _FACT_KEYS doesn't even include PED — so the two paths could
	# read different files and disagree on PED waiting (a live audit found
	# the comparison table said 24mo while the #31 card said "0 months").
	#
	# Fix: these specific fields are taken from the canonical curated entry
	# (`_curated_facts_all()[pid]`, the EXACT dict main._load_curated_facts()
	# feeds build_scorecard) so both surfaces agree BY CONSTRUCTION. This
	# mirrors the existing _scorecard_signal → marketplace_grade single-
	# source pattern (#40 / KI-219). The guard
	# tests/test_policy_facts_source_consistency.py asserts catalogue-wide
	# agreement.
	# Keys that canonical_decision_facts() copies from the canonical curated
	# entry. Note the spelling `copayment_pct` here differs from the
	# `co_payment_pct` key listed in _FACT_KEYS.
	_DECISION_CRITICAL_FACT_KEYS = (
	    "pre_existing_disease_waiting_months",
	    "initial_waiting_period_days",
	    "copayment_pct",
	    "room_rent_capping",
	    "claim_settlement_ratio",
	)


	def canonical_decision_facts(policy_id: str) -> dict:
	    """Return the decision-critical coverage facts for `policy_id`.

	    The facts come from the canonical curated layer (_curated_facts_all),
	    which is the same entry the marketplace scorecard path reads, so the
	    scorecard and get_policy_facts cannot disagree on these fields
	    (Bug #44).

	    Args:
	        policy_id: canonical or doctype-suffixed policy id; None / blank
	            is tolerated.

	    Returns:
	        A dict limited to the _DECISION_CRITICAL_FACT_KEYS whose value is
	        not None / "" / []. An empty dict is returned for a blank id, an
	        unknown policy, a non-dict entry, or when the curated layer cannot
	        be loaded. Read-only.
	    """
	    wanted_id = (policy_id or "").strip()
	    if not wanted_id:
	        return {}

	    try:
	        curated = _curated_facts_all() or {}
	    except Exception:  # noqa: BLE001 — curated layer optional
	        return {}

	    record = curated.get(wanted_id)
	    if record is None:
	        # The curated layer is expected to register every suffixed id, but
	        # fall back to the doctype-stripped form for a caller holding a
	        # suffixed id that is not registered. Only the first matching
	        # suffix is tried.
	        matched_suffix = next(
	            (suffix for suffix in _DOCTYPE_SUFFIXES if wanted_id.endswith(suffix)),
	            None,
	        )
	        if matched_suffix is not None:
	            record = curated.get(wanted_id[: -len(matched_suffix)])
	    if not isinstance(record, dict):
	        return {}

	    facts: dict = {}
	    for key in _DECISION_CRITICAL_FACT_KEYS:
	        value = record.get(key)
	        # Values normally arrive as scalars; tolerate the wrapped
	        # {value, source_*} shape as well.
	        if isinstance(value, dict) and "value" in value:
	            value = value.get("value")
	        if value in (None, "", []):
	            continue
	        facts[key] = value
	    return facts


	# In-process memo for _load_policy_facts: policy_id -> {fact_key: value}.
	# An empty dict is stored for a policy with no usable facts (negative cache).
	_facts_cache: dict[str, dict] = {}


	def _unwrap(v: Any) -> Any:
	"""policy_facts values are `{value, source_pdf_path, source_quote}`
	wrappers OR bare scalars. Return the underlying value either way."""
	if isinstance(v, dict) and "value" in v:
	return v["value"]
	return v


	def _candidate_stems(policy_id: str) -> list[str]:
	"""A retrieved chunk's policy_id may be the canonical stem
	(`insurer__product`) OR a doctype-suffixed stem
	(`insurer__product__cis`). Try the exact id first, then the canonical
	form, then every doctype sibling — first existing file wins.
	"""
	pid = (policy_id or "").strip()
	if not pid:
	return []
	stems = [pid]
	base = pid
	for suf in _DOCTYPE_SUFFIXES:
	if base.endswith(suf):
	base = base[: -len(suf)]
	break
	if base != pid:
	stems.append(base)
	for suf in _DOCTYPE_SUFFIXES:
	cand = base + suf
	if cand not in stems:
	stems.append(cand)
	return stems


	# In-process memo for _has_extraction: stripped policy_id -> bool. Negative
	# (False) results are cached as well.
	_extraction_cache: dict = {}


	def _has_extraction(policy_id: str) -> bool:
	"""True iff this policy has an LLM-extracted corpus file — the EXACT
	renderability rule the marketplace uses (main builds its card set from
	settings.EXTRACTED_DIR/*.json). A policy with curated facts but no
	extracted file renders as a BROKEN card: raw policy_id as the title,
	grade "N/A", "No extraction available for this policy.", "Data not
	indexed" (/api/bulk-scorecard). Such a policy must NEVER be quality-
	seeded or cited. Canonical-stem aware (doctype siblings count); cached
	incl. negatives."""
	pid = (policy_id or "").strip()
	if not pid:
	return False
	if pid in _extraction_cache:
	return _extraction_cache[pid]
	ok = False
	try:
	for stem in _candidate_stems(pid):
	if (settings.EXTRACTED_DIR / f"{stem}.json").exists():
	ok = True
	break
	except Exception: # noqa: BLE001 — predicate must never break retrieval
	ok = False
	_extraction_cache[pid] = ok
	return ok


	def _load_policy_facts(policy_id: str) -> dict:
	    """Return {fact_key: value} for `policy_id`, or {} when nothing is usable.

	    Each stem from _candidate_stems is probed under _FACTS_DIR. The first
	    file that supplies a given _FACT_KEYS key wins for that key, and every
	    value is passed through _unwrap. Probing stops early once the
	    decision-critical signals are all present.

	    Results are cached per policy_id, including the empty result for a
	    policy that has no facts file. A result is NOT cached when a facts
	    file existed but could not be parsed: the files are rewritten by a
	    concurrent repair process, so that failure is assumed transient and
	    the next call retries.

	    Never raises: any unexpected error is logged and yields {}.
	    """
	    if policy_id in _facts_cache:
	        return _facts_cache[policy_id]
	    out: dict = {}
	    # Flipped when a present file is unreadable, so a half-written file does
	    # not poison the cache for the life of the process.
	    cacheable = True
	    try:
	        for stem in _candidate_stems(policy_id):
	            fp = _FACTS_DIR / f"{stem}.json"
	            if not fp.exists():
	                continue
	            try:
	                # Explicit UTF-8: the locale default would mis-decode
	                # non-ASCII text on a non-UTF-8 host.
	                d = _json.loads(fp.read_text(encoding="utf-8"))
	            except Exception:  # noqa: BLE001 — corrupt mid-repair → skip
	                cacheable = False
	                continue
	            if not isinstance(d, dict):
	                # A non-object payload carries no fact keys; skipping it keeps
	                # facts already gathered from earlier stems.
	                continue
	            for k in _FACT_KEYS:
	                if k in d and k not in out:
	                    out[k] = _unwrap(d[k])
	            # Stop once we have the decision-critical signals. KI-279: a
	            # type signal is "have it" if EITHER the canonical key OR the
	            # raw `policy_type` key is present (some files only carry the
	            # latter), so the fixed-benefit gate is never starved.
	            # KI-280: also require the unified-gate signals (uin_code +
	            # max_entry_age) before breaking, so the eligibility/dedup
	            # rules are not starved when a sibling doctype file carries
	            # them. The candidate-stem list is short (≤5), so iterating it
	            # fully is cheap.
	            _have_type = (
	                "policy_type_indemnity_or_fixed" in out
	                or "policy_type" in out
	            )
	            if (
	                _have_type
	                and "sum_insured_options" in out
	                and "uin_code" in out
	                and "max_entry_age" in out
	            ):
	                break
	    except Exception as e:  # noqa: BLE001 — enrichment must never break retrieval
	        _log.warning("KI-278 _load_policy_facts(%s) failed: %s", policy_id, e)
	        out = {}
	    if cacheable:
	        _facts_cache[policy_id] = out
	    return out


	# Single-slot cache for the full curated layer: _curated_facts_all stores
	# the loaded dict under the key "d".
	_curated_all_cache: dict = {}  # single-slot cache for the full curated layer
	# Memo for _insurer_reviews: insurer slug -> parsed reviews JSON, or None
	# when the file is missing or unreadable.
	_reviews_cache: dict = {}


	def _curated_facts_all() -> dict:
	    """Return the full curated-facts layer, loading it on first use.

	    This is the same source the marketplace scores from
	    (main._load_curated_facts, KI-219/251 canonical precedence), so a
	    policy's recommendation grade matches its marketplace grade.
	    `_load_policy_facts` feeds the eligibility/dedup gate, not grading.

	    backend.main is imported lazily because it is loaded at request time;
	    a module-level import would create an import cycle. The loaded layer
	    is kept in the single-slot `_curated_all_cache`.
	    """
	    try:
	        return _curated_all_cache["d"]
	    except KeyError:
	        from backend.main import _load_curated_facts  # lazy: avoids cycle
	        layer = _load_curated_facts()
	        _curated_all_cache["d"] = layer
	        return layer


	def _insurer_reviews(slug: str) -> Optional[dict]:
	"""Insurer reviews (40-data/reviews/<slug>.json) passed to
	build_scorecard — drives the claim-experience sub-score; the same
	source the marketplace uses."""
	if not slug:
	return None
	if slug in _reviews_cache:
	return _reviews_cache[slug]
	ir = None
	try:
	rp = settings.DATA_DIR / "reviews" / f"{slug}.json"
	if rp.exists():
	ir = _json.loads(rp.read_text())
	except Exception: # noqa: BLE001 — reviews optional
	ir = None
	_reviews_cache[slug] = ir
	return ir


	def _scorecard_signal(policy_id: str, profile=None) -> dict:
	"""{_grade, _overall_score} for policy_id — the SAME grade its
	marketplace card shows (#40 SINGLE SOURCE OF TRUTH, 2026-05-18).

	Delegates to backend.main.marketplace_grade, which derives the grade
	from the ONE marketplace catalogue computation
	(backend.main._marketplace_catalogue) using UIN-canonical resolution:
	a marketing-rename / KI-145 variant id resolves onto its canonical
	card. There is no longer a parallel doctype-rank/_merge
	re-implementation here, so the cited-card grade cannot drift from the
	marketplace card grade — for ALL 148 by construction, asserted by
	tests/test_scorecard_parity.py.

	`profile` is accepted for call-site compatibility. The parity-relevant
	grade LETTER (what _recommendation_fit gates on) is the profile-neutral
	marketplace grade, identical to the /api/policies/all catalogue view.
	Read-only; returns {} only when the policy is unknown to the
	marketplace (ranking still works off co-pay + SI headroom + cosine)."""
	try:
	from backend.main import marketplace_grade # lazy: avoids cycle
	sig = marketplace_grade(policy_id)
	if sig and sig.get("_grade"):
	return {
	"_grade": sig.get("_grade"),
	"_overall_score": sig.get("_overall_score"),
	}
	return {}
	except Exception: # noqa: BLE001 — scorecard optional; ranking degrades gracefully
	return {}


	# ---- accepted fields for save_profile_field --------------------------------

	# Mirrors the slot list in sales_brain._REQUIRED_FOR_READY plus the
	# nice-to-have fields the LLM may capture opportunistically. `gender`
	# is listed in the spec but is NOT a Profile dataclass field today —
	# we silently no-op on it rather than rejecting (forward-compat).
	# Whitelist checked by save_profile_field after the incoming field name is
	# stripped and lower-cased; anything else is rejected as `unknown_field`.
	_ACCEPTED_FIELDS = {
	    "name",
	    "age",
	    "dependents",
	    "location_tier",
	    "income_band",
	    "primary_goal",
	    "health_conditions",
	    "existing_cover_inr",
	    "budget_band",
	    "budget_inr",  # #64 — exact ₹/yr; set as a side-effect of budget_band
	    "desired_sum_insured_inr",  # SOFT capture (pricing input, post-recap)
	    # Family-detail pricing inputs (B6) — already on the Profile dataclass
	    # via needs_finder.Profile (parents_to_insure / parents_age_max /
	    # parents_has_ped). Listed here so save_profile_field can persist them
	    # when Gemini extracts them post-recap.
	    "parents_to_insure",
	    "parents_age_max",
	    "parents_has_ped",
	    # D2 (2026-05-15) — coupled additions: co-pay tolerance + family medical history
	    "copay_pct",
	    "family_medical_history",
	    # KI-275 (2026-05-15) — smoker / tobacco use, +30-50% premium loading.
	    "smoker",
	    "gender",  # tolerated; not persisted unless Profile gains the field
	}

	# These are the slots the brain MUST capture before recommending — same
	# list as sales_brain._REQUIRED_FOR_READY. Kept inline (not imported)
	# to avoid coupling single_brain to sales_brain.
	# _profile_complete() returns True only when every slot listed here is
	# non-empty (not None / "" / []) on the profile.
	_REQUIRED_FOR_READY = (
	    "name",
	    "age",
	    "dependents",
	    "location_tier",
	    "income_band",
	    "primary_goal",
	    "health_conditions",
	)


	# ───────────────────────────────────────────────────────────────────────────
	# Bug #108 + #110 (2026-05-16) — POST-RECAP pricing & family-history bundle.
	#
	# Bug #108: the RULE 2.5 bundle (SI / budget / co-pay / family history /
	# smoker) is asked in ONE prompt. When the user answers SOME but
	# not all, the LLM treated the bundle as fully satisfied (it's
	# SOFT capture) and recommended with the unanswered slot blank —
	# e.g. asked SI/budget/co-pay/smoker, user gave SI/budget/co-pay,
	# smoker never re-asked, bot recommended.
	# Bug #110: family_medical_history (item 5 of the bundle) was the slot most
	# often silently dropped — the fact-find effectively NEVER asked it.
	#
	# FIX: a deterministic ONE-SHOT re-ask gate. After the hard 7-slot gate
	# passes, on a recommendation retrieve_policies call, if any UNRESOLVED
	# bundle slot remains we return a directive `pricing_inputs_incomplete`
	# response (re-ask exactly the unresolved ones, verbatim) — but ONLY once
	# per session, and ONLY when the user has not explicitly skipped. After the
	# single re-ask we proceed (SOFT-capture semantics preserved: the user can
	# still skip; we never hard-loop).
	#
	# A bundle slot is RESOLVED when it is either captured on the profile OR the
	# user explicitly declined/skipped it (session.pricing_bundle_skipped — set
	# by single_brain when the user says "just show me options" / "skip" / "you
	# decide"). parents_age_max is conditional: only part of the bundle when the
	# user is covering parents and it isn't captured yet.
	# Unconditional members of the post-recap bundle. _unresolved_pricing_bundle
	# appends "parents_age_max" to a copy of this tuple when
	# _profile_has_parents() is true.
	_PRICING_BUNDLE_CORE: tuple[str, ...] = (
	    "desired_sum_insured_inr",
	    "budget_band",
	    "existing_cover_inr",
	    "copay_pct",
	    "family_medical_history",  # Bug #110 — must be asked, same skip handling
	    "smoker",
	)

	# Exact verbatim re-ask phrasing per bundle slot (mirrors RULE 2.5 wording so
	# the re-ask reads identically to the first ask). family_medical_history is
	# first so a forgotten Bug #110 slot leads the re-ask.
	# Maps each bundle slot (the core slots plus the conditional
	# parents_age_max) to the question text used when re-asking it.
	# NOTE(review): the consumer of this dict is outside this view — confirm
	# that it relies on the insertion order described above.
	_PRICING_BUNDLE_QUESTIONS: dict[str, str] = {
	    "family_medical_history": (
	        "Any major conditions running in your blood family "
	        "(parents/siblings) — cancer / diabetes / heart disease / "
	        "hypertension? (say 'none' if not)"
	    ),
	    "desired_sum_insured_inr": (
	        "How much sum insured would you like? (e.g., ₹5L / ₹10L / "
	        "₹25L / ₹1Cr)"
	    ),
	    "budget_band": (
	        "What's your annual premium budget? (e.g., ₹10-15K/year, or "
	        "₹50K+ for premium covers)"
	    ),
	    "existing_cover_inr": (
	        "Any existing health cover from work or otherwise? "
	        "(e.g., '5L through employer', or 'no')"
	    ),
	    "copay_pct": (
	        "Are you OK with a co-pay — sharing 10-30% of every claim — to "
	        "lower the premium? Or do you want zero co-pay?"
	    ),
	    "smoker": "Do you smoke or use tobacco products? (yes / no)",
	    "parents_age_max": (
	        "Roughly what's the age of the eldest parent you'd cover?"
	    ),
	}


	def _profile_has_parents(profile) -> bool:
	"""True when the captured dependents indicate parents are covered (so
	parents_age_max becomes part of the post-recap bundle)."""
	dep = getattr(profile, "dependents", None)
	if isinstance(dep, str) and "parent" in dep.lower():
	return True
	return bool(getattr(profile, "parents_to_insure", None))


	def _unresolved_pricing_bundle(profile, session) -> list[str]:
	"""Return the bundle slots that are NEITHER captured on the profile NOR
	explicitly skipped by the user this session. Empty list ⇒ nothing left
	to re-ask (recommend may proceed)."""
	if session is not None and bool(
	getattr(session, "pricing_bundle_skipped", False)
	):
	# User explicitly said "just show me options / you decide / skip".
	return []
	bundle = list(_PRICING_BUNDLE_CORE)
	if _profile_has_parents(profile):
	bundle.append("parents_age_max")
	# #41 (2026-05-21) — a slot the user has ANSWERED is resolved even if
	# the answer coerces to an empty value (family_medical_history="none"
	# → []). profile.asked records answered slots, so an empty-but-asked
	# slot is NOT re-asked.
	asked = set(getattr(profile, "asked", None) or [])
	unresolved: list[str] = []
	for slot in bundle:
	if getattr(profile, slot, None) in (None, "", []) and slot not in asked:
	unresolved.append(slot)
	return unresolved


	# ───────────────────────────────────────────────────────────────────────────
	# SLOT_UNION (B6, 2026-05-15)
	# ───────────────────────────────────────────────────────────────────────────
	# Single source of truth for every captured field that drives EITHER the
	# profile (recommendation match + scorecard) OR the pricing pipeline
	# (premium_calculator.estimate / bulk_estimate). See module docstring above
	# for the full slot→consumer matrix.
	#
	# Ordering convention (do not re-order without auditing union_snapshot
	# callers): required slots first, then pricing-only slots, then
	# family-detail slots, then the D2 (co-pay / family history) and KI-275
	# (smoker) additions. Total = 17.
	# union_snapshot() iterates this tuple in order, so the snapshot's key
	# order follows the order below.
	SLOT_UNION: tuple[str, ...] = (
	    # Recommendation slots (in _REQUIRED_FOR_READY)
	    "name",
	    "age",
	    "dependents",
	    "location_tier",
	    "income_band",
	    "primary_goal",
	    "health_conditions",
	    # Pricing slots (B5 + B6 additions)
	    "budget_band",
	    "budget_inr",  # #64 — exact ₹/yr (lossless companion to budget_band)
	    "desired_sum_insured_inr",
	    "existing_cover_inr",
	    # Family-detail slots (used by pricing if applicable)
	    "parents_to_insure",
	    "parents_age_max",
	    "parents_has_ped",
	    # D2 additions (2026-05-15)
	    "copay_pct",
	    "family_medical_history",
	    # KI-275 (2026-05-15) — smoker / tobacco use, +30-50% premium loading.
	    "smoker",
	)

	# Invariant: every SLOT_UNION field must be accepted by save_profile_field
	# (otherwise the LLM can never capture it). Validated at import time so a
	# future delete here is loud, not silent. An explicit raise is used because
	# a bare `assert` is stripped under `python -O`, which would silence the
	# check; AssertionError is kept so the failure type is unchanged.
	_slots_not_accepted = [_s for _s in SLOT_UNION if _s not in _ACCEPTED_FIELDS]
	if _slots_not_accepted:
	    raise AssertionError(
	        "SLOT_UNION contains a field not in _ACCEPTED_FIELDS: "
	        f"{_slots_not_accepted}"
	    )


	def union_snapshot(profile) -> dict:
	    """Collect every SLOT_UNION field that is currently captured on `profile`.

	    Slots whose value is None / "" / [] are left out, so the pricing
	    pipeline can treat key presence as "captured" (KI-091 null-overwrite
	    rule — never pass None where 0 is meaningful). Values such as 0 and
	    False are kept. A slot whose attribute access raises is treated as
	    not captured.

	    Used by premium_calculator.estimate / bulk_estimate to read pricing
	    inputs without repeating the field-name list on each side.
	    """
	    captured: dict = {}
	    for slot in SLOT_UNION:
	        try:
	            value = getattr(profile, slot, None)
	        except Exception:  # noqa: BLE001
	            continue
	        if value not in (None, "", []):
	            captured[slot] = value
	    return captured


	def _profile_complete(profile) -> bool:
	    """Report whether every _REQUIRED_FOR_READY slot is filled on `profile`.

	    A slot counts as filled when its value is not None, "" or []; a
	    missing attribute counts as empty.
	    """
	    return all(
	        getattr(profile, slot, None) not in (None, "", [])
	        for slot in _REQUIRED_FOR_READY
	    )


	# ---- save_profile_field ----------------------------------------------------

	def _strip_per_annum_qualifier(text: str) -> str:
	    """Replace per-annum qualifiers in `text` with a space.

	    Covers "per year", "per annum", "p.a.", "/yr", "/year", "/annum",
	    "a year", "annually" and "yearly" (case-insensitive), so the amount
	    parser is not confused by the word "year".
	    """
	    import re as _re2

	    # Alternatives are separated by a real `|`. An escaped `\|` would match
	    # a literal pipe character and the qualifier would never be stripped.
	    return _re2.sub(
	        r"(?:\bper\s+(?:year|annum)|\bp\.?\s*a\.?|/\s*(?:yr|year|annum)"
	        r"|\ba\s+year|\bannually|\byearly)\b",
	        " ",
	        text,
	        flags=_re2.IGNORECASE,
	    )


	def _record_exact_budget_inr(profile, value: Any) -> None:
	    """Best-effort capture of the exact ₹/yr budget alongside budget_band (#64).

	    The band stays the pricing contract; budget_inr preserves what the
	    user actually said ("₹15,000") for display. Nothing is written when
	    the amount cannot be determined, is not positive, or the profile has
	    no `budget_inr` attribute. Never raises.
	    """
	    try:
	        if isinstance(value, bool):
	            # bool is an int subclass; True/False is not an amount.
	            exact = None
	        elif isinstance(value, (int, float)):
	            exact = int(value)
	        else:
	            from backend.needs_finder import _parse_inr_amount as _pinr

	            raw = str(value)
	            # Strip per-annum qualifiers FIRST (same KI-161 guard as
	            # _coerce_budget_band); fall back to the raw text.
	            exact = _pinr(_strip_per_annum_qualifier(raw)) or _pinr(raw)
	        if exact and exact > 0 and hasattr(profile, "budget_inr"):
	            profile.budget_inr = int(exact)
	            if "budget_inr" not in getattr(profile, "asked", []):
	                profile.asked.append("budget_inr")
	    except Exception as e:  # noqa: BLE001 — exact ₹ is best-effort; band still saved
	        _log.debug("budget_inr capture skipped: %s", e)


	def save_profile_field(session, field: str, value: Any) -> dict:
	    """Validate, normalise and persist one captured field on session.profile.

	    Args:
	        session: object exposing the live `profile`.
	        field: slot name; stripped and lower-cased, then checked against
	            _ACCEPTED_FIELDS.
	        value: raw value as emitted by the LLM.

	    Normalisation by field:
	        - age, parents_age_max: _coerce_age
	        - dependents: _coerce_dependents
	        - health_conditions: _coerce_health_conditions
	        - existing_cover_inr: _coerce_existing_cover
	        - desired_sum_insured_inr: _coerce_desired_sum_insured
	        - parents_to_insure, parents_has_ped: _coerce_bool
	        - copay_pct: _coerce_copay_pct
	        - family_medical_history: _coerce_family_medical_history
	        - smoker: _coerce_smoker
	        - budget_band: _coerce_budget_band; the exact ₹ amount is also
	          stored on profile.budget_inr when it can be parsed
	        - gender: never persisted (Profile has no such field today)
	        - everything else: stripped string, empty → None

	    Returns:
	        On success: {"saved": True, "field", "value", "profile_complete"}.
	        On failure: {"saved": False, "error": ...} where error is one of
	        "missing_field_name", "unknown_field:<field>",
	        "normalize_failed:<type>:<msg>", "normalized_empty" or
	        "field_not_on_profile_dataclass". All failures except the first two
	        also carry "field", "value" and "profile_complete".

	        An explicit negative family_medical_history answer ("none", "no",
	        ...) returns saved=True with value [] and is recorded in
	        profile.asked, without overwriting the stored value.

	    TypeError / ValueError raised by a coercer are reported as
	    normalize_failed rather than propagated.
	    """
	    if not isinstance(field, str) or not field:
	        return {"saved": False, "error": "missing_field_name"}

	    fld = field.strip().lower()
	    if fld not in _ACCEPTED_FIELDS:
	        return {"saved": False, "error": f"unknown_field:{field}"}

	    profile = session.profile
	    normalized: Any = value

	    try:
	        if fld == "age":
	            normalized = _coerce_age(value)
	        elif fld == "dependents":
	            normalized = _coerce_dependents(value)
	        elif fld == "health_conditions":
	            normalized = _coerce_health_conditions(value)
	        elif fld == "existing_cover_inr":
	            normalized = _coerce_existing_cover(value)
	        elif fld == "desired_sum_insured_inr":
	            normalized = _coerce_desired_sum_insured(value)
	        elif fld in ("parents_to_insure", "parents_has_ped"):
	            normalized = _coerce_bool(value)
	        elif fld == "parents_age_max":
	            normalized = _coerce_age(value)
	        elif fld == "copay_pct":
	            normalized = _coerce_copay_pct(value)
	        elif fld == "family_medical_history":
	            normalized = _coerce_family_medical_history(value)
	        elif fld == "smoker":
	            normalized = _coerce_smoker(value)
	        elif fld == "budget_band":
	            normalized = _coerce_budget_band(value)
	        elif fld == "name":
	            normalized = (str(value).strip() if value is not None else None) or None
	        elif fld == "gender":
	            # Profile dataclass has no gender field today. Report it as not
	            # persisted without treating the field as unknown, so the LLM
	            # doesn't loop trying to save it. Forward-compat: when Profile
	            # gains gender, this branch just becomes
	            # `normalized = str(value).strip()`.
	            return {
	                "saved": False,
	                "field": fld,
	                "value": value,
	                "error": "field_not_on_profile_dataclass",
	                "profile_complete": _profile_complete(profile),
	            }
	        else:
	            # location_tier / income_band / primary_goal — pass through
	            # (budget_band is normalised above via _coerce_budget_band).
	            # NOTE(review): a direct save of `budget_inr` also lands here
	            # and is stored as a stripped string, not an int — confirm
	            # whether direct saves are expected.
	            normalized = (str(value).strip() if value is not None else None) or None
	    except (TypeError, ValueError) as e:
	        return {
	            "saved": False,
	            "field": fld,
	            "value": value,
	            "error": f"normalize_failed:{type(e).__name__}:{e}",
	            # Included so this failure has the same shape as the others.
	            "profile_complete": _profile_complete(profile),
	        }

	    # Drop None/empty so we don't overwrite a previously-captured slot
	    # with a Gemini turn that "didn't extract anything". Universal rule
	    # from KI-091/094 (extractor null overwrite).
	    if normalized in (None, "", []):
	        # #41 (2026-05-21) — an explicit NEGATIVE family-history answer
	        # ("none") legitimately coerces to []. Do NOT silently drop it as
	        # "extracted nothing": record the field on profile.asked so the
	        # post-recap pricing-bundle gate (_unresolved_pricing_bundle)
	        # treats it RESOLVED and never re-asks a slot the user answered.
	        if fld == "family_medical_history" and value is not None and str(value).strip().lower() in (
	            "none", "no", "nil", "nothing", "n/a", "na", "none.",
	            "no family history", "no family medical history",
	            "no family medical history.", "no family history.",
	        ):
	            try:
	                if fld not in profile.asked:
	                    profile.asked.append(fld)
	            except Exception:  # noqa: BLE001
	                pass
	            return {
	                "saved": True,
	                "field": fld,
	                "value": [],
	                "profile_complete": _profile_complete(profile),
	            }
	        return {
	            "saved": False,
	            "field": fld,
	            "value": value,
	            "error": "normalized_empty",
	            "profile_complete": _profile_complete(profile),
	        }

	    if not hasattr(profile, fld):
	        return {
	            "saved": False,
	            "field": fld,
	            "value": value,
	            "error": "field_not_on_profile_dataclass",
	            "profile_complete": _profile_complete(profile),
	        }

	    setattr(profile, fld, normalized)
	    # #64 — when the user states a budget, ALSO preserve the EXACT ₹ amount
	    # losslessly (not just the band) so the slider shows what they actually
	    # said ("₹15,000"), never a band representative ("₹12k").
	    if fld == "budget_band":
	        _record_exact_budget_inr(profile, value)
	    # Track that the brain has "asked" this field so the rest of the
	    # codebase's helpers (which inspect profile.asked) stay in sync.
	    try:
	        if fld not in getattr(profile, "asked", []):
	            profile.asked.append(fld)
	    except Exception:  # noqa: BLE001 — best-effort bookkeeping
	        pass

	    return {
	        "saved": True,
	        "field": fld,
	        "value": normalized,
	        "profile_complete": _profile_complete(profile),
	    }


	# Memo for _quality_seed_candidates: cache key -> full list of seed chunk
	# dicts, stored before the per-call `limit` slice is applied.
	_qseed_cache: dict = {}  # (profile_sig) -> [seed chunk dicts]
	# BUG #30 (B1-c) — per-signature count of TRAILING existing-cover top-up
	# seeds in `_qseed_cache[sig]`. They sit AFTER the primary window and must
	# survive the final `[:limit]` slice so a relevant super-top-up is never
	# truncated out of contention for a user who already holds base cover.
	# Read by _qseed_slice; a missing key is treated as 0.
	_qseed_topup_n: dict = {}


	def _qseed_slice(rows: list[dict], sig: str, limit: int) -> list[dict]:
	    """Cut a cached seed list down to `limit` without losing top-up seeds.

	    The last `_qseed_topup_n[sig]` rows are existing-cover top-up seeds.
	    They are always returned in full; only the primary rows before them
	    are limited. With no top-up seeds recorded for `sig` this is simply
	    `rows[:limit]`.
	    """
	    trailing = _qseed_topup_n.get(sig, 0)
	    if trailing <= 0:
	        return rows[:limit]
	    # When the recorded count covers the whole list there are no primaries.
	    head = [] if trailing >= len(rows) else rows[:-trailing]
	    tail = rows[-trailing:]
	    return head[:limit] + tail


	def _quality_seed_candidates(profile, limit: int = 25) -> list[dict]:
	    """Seed the candidate pool with the catalogue's top-scoring policies.

	    A strong policy that isn't cosine-similar to a generic query still
	    enters contention this way. Seeding only ADDS candidates:
	    filter_pipeline still applies eligibility and profile-fit ranking on
	    the union, so nothing here bypasses eligibility or fabricates a
	    recommendation.

	    Args:
	        profile: captured profile, or None.
	        limit: maximum number of primary seeds returned. Existing-cover
	            top-up seeds (at most 3) are returned in addition to this.

	    Returns:
	        Seed chunk dicts with `score` 0.0 and empty `chunk_text`, enriched
	        with _load_policy_facts and the scorecard signal. Policies without
	        an extraction file or without an overall score are skipped.

	    Results are cached per (primary window, profile signature). The window
	    is part of the key because the cached list is sized by
	    `max(limit, 25)`: keyed by signature alone, a call with a larger
	    `limit` would be served a list built for a smaller one.

	    Never raises: on any failure the error is logged and whatever was
	    built so far is returned, cut to `limit`.
	    """
	    out: list[dict] = []
	    try:
	        prof_sig = repr(sorted(
	            (s, getattr(profile, s, None))
	            for s in (
	                "age", "income_band", "primary_goal", "existing_cover_inr",
	                "copay_pct", "dependents", "health_conditions",
	                "budget_band", "location_tier", "parents_to_insure",
	                "parents_age_max",
	            )
	        )) if profile is not None else "none"
	        window = max(limit, 25)
	        # Every limit ≤ 25 shares one entry; a wider request gets its own.
	        cache_key = f"{window}|{prof_sig}"
	        if cache_key in _qseed_cache:
	            return _qseed_slice(_qseed_cache[cache_key], cache_key, limit)
	        cur = _curated_facts_all()
	        scored: list[tuple[float, str, dict, dict]] = []
	        seen: set[str] = set()
	        for key, data in cur.items():
	            if not isinstance(data, dict):
	                continue
	            pid = (data.get("policy_id") or key or "").strip()
	            if not pid or pid in seen:
	                continue
	            seen.add(pid)
	            if not _has_extraction(pid):
	                # Curated-graded but no extracted corpus → its card would
	                # render as N/A / "No extraction available for this policy"
	                # / "Data not indexed". Never seed a non-renderable policy.
	                continue
	            sig = _scorecard_signal(pid, profile=profile)
	            ov = sig.get("_overall_score")
	            if ov is None:
	                continue
	            try:
	                ovf = float(ov)
	            except (TypeError, ValueError):
	                continue
	            scored.append((ovf, pid, data, sig))
	        # Highest overall score first; ties keep catalogue order.
	        scored.sort(key=lambda t: -t[0])
	        # BUG #30 (B1-c) — when the user already holds ANY base cover, also
	        # union-in the top-N top-up / super-top-up policies even if they
	        # fall outside the primary window, so a directly relevant
	        # super-top-up is seeded into contention. Deterministic: drawn from
	        # the already-sorted `scored` list, no RNG.
	        _existing = getattr(profile, "existing_cover_inr", None) \
	            if profile is not None else None
	        try:
	            _existing_int = int(str(_existing).replace(",", "").strip()) \
	                if _existing not in (None, "") else 0
	        except (TypeError, ValueError):
	            # An unparseable amount is treated as "no existing cover".
	            _existing_int = 0
	        primary_rows = scored[:window]
	        extra: list[tuple[float, str, dict, dict]] = []
	        if _existing_int > 0:
	            from backend.retrieval_filters import _is_top_up as _rf_is_top_up
	            in_window = {pid for _, pid, _, _ in primary_rows}
	            _TOPUP_SEED_MAX = 3  # bounded extra seeds; keeps pool deterministic
	            for ovf, pid, data, sig in scored[window:]:
	                if pid in in_window:
	                    continue
	                probe = {
	                    "policy_name": data.get("policy_name", pid),
	                    **_load_policy_facts(pid),
	                }
	                if _rf_is_top_up(probe):
	                    extra.append((ovf, pid, data, sig))
	                    if len(extra) >= _TOPUP_SEED_MAX:
	                        break
	        # The top-up seeds trail the primary rows; their count is recorded
	        # below so _qseed_slice can keep them past the `limit` cut.
	        for ovf, pid, data, sig in primary_rows + extra:
	            ch = {
	                "chunk_id": f"{pid}__qseed",
	                "policy_id": pid,
	                "policy_name": clean_display_policy_name(
	                    data.get("policy_name", pid)
	                ),
	                "insurer_slug": data.get("insurer_slug")
	                or (pid.split("__", 1)[0] if "__" in pid else ""),
	                "doc_type": "policy",
	                "source_url": data.get("_primary_source_pdf") or "",
	                # No cosine text — filter_pipeline ranks the union by
	                # _fit_score (scorecard grade + profile fit), not cosine,
	                # so a 0.0 cosine score does not bury a seeded A-policy.
	                "chunk_text": "",
	                "score": 0.0,
	            }
	            ch.update(_load_policy_facts(pid))
	            ch.update(sig)
	            out.append(ch)
	        _qseed_cache[cache_key] = out
	        _qseed_topup_n[cache_key] = len(extra)
	        return _qseed_slice(out, cache_key, limit)
	    except Exception as e:  # noqa: BLE001 — seeding must never break retrieval
	        _log.warning("quality-seed failed: %s", e)
	        return out[:limit]


	# ---- uploaded-doc (quarantine) bypass helpers ------------------------------


	def _session_has_quarantine_docs(session_id: str) -> bool:
	"""True iff this session has at least one chunk in the SEPARATE
	`user_uploads_quarantine` Chroma collection.

	Strictly session-scoped (where={"session_id": session_id}); cheap
	metadata-only `.get(limit=1)`. Never raises — a Chroma hiccup just
	means "treat as no upload" so the normal profile-gate path runs.
	"""
	if not session_id:
	return False
	try:
	from rag.ingest import get_quarantine_collection

	q = get_quarantine_collection().get(
	where={"session_id": session_id},
	limit=1,
	include=[],
	)
	return bool(q and q.get("ids"))
	except Exception as e: # noqa: BLE001 — best-effort probe
	_log.warning(
	"quarantine presence probe failed (sid=%s): %s: %s",
	session_id, type(e).__name__, str(e)[:160],
	)
	return False


	async def _retrieve_uploaded_only(
	    query: str, session_id: str, top_k: int
	) -> dict:
	    """Retrieve ONLY the chunks this session uploaded itself.

	    Delegates to `rag.retrieve.retrieve(session_id=...)` and then keeps
	    nothing but results whose ``doc_type`` is ``"user_upload"``, so the
	    response used to bypass the recommendation profile-gate can never
	    carry general-corpus policy chunks. At least 3 results are requested
	    (8 when ``top_k`` is falsy).

	    Returns the same dict shape as `retrieve_policies`:
	    * retrieval failure → ``{"chunks": [], "count": 0, "error": <exc type>}``
	    * nothing uploaded matched → ``{"chunks": [], "count": 0}``
	    * otherwise → chunks + count + query + ``source`` marker + an LLM
	      ``note`` telling it to answer about the uploaded document.
	    """
	    try:
	        from rag.retrieve import retrieve as _retrieve

	        wanted = int(top_k) if top_k else 8
	        hits = await _retrieve(
	            query=query,
	            top_k=max(wanted, 3),
	            session_id=session_id,
	        )
	    except Exception as e:  # noqa: BLE001 — graceful empty
	        _log.warning(
	            "uploaded-only retrieve failed (sid=%s): %s: %s",
	            session_id, type(e).__name__, str(e)[:160],
	        )
	        return {"chunks": [], "count": 0, "error": f"{type(e).__name__}"}

	    uploaded = []
	    for hit in hits or []:
	        kind = getattr(hit, "doc_type", "") or ""
	        if kind.lower() != "user_upload":
	            continue
	        # Belt + suspenders on top of the retriever's own session filter:
	        # a chunk that names an owner must name THIS session. Chunks with
	        # no owner recorded (None / "") are let through.
	        owner = getattr(hit, "session_id", None)
	        if owner and owner != session_id:
	            continue
	        body = getattr(hit, "text", "") or ""
	        relevance = getattr(hit, "score", 0.0) or 0.0
	        uploaded.append({
	            "chunk_id": getattr(hit, "chunk_id", ""),
	            "policy_id": getattr(hit, "policy_id", ""),
	            "policy_name": clean_display_policy_name(
	                getattr(hit, "policy_name", "")
	            ),
	            "insurer_slug": getattr(hit, "insurer_slug", "") or "user-upload",
	            "doc_type": "user_upload",
	            "source_url": getattr(hit, "source_url", ""),
	            "chunk_text": body[:1200],
	            "score": float(relevance),
	        })

	    if uploaded:
	        return {
	            "chunks": uploaded,
	            "count": len(uploaded),
	            "query": query,
	            "source": "uploaded_doc_quarantine",
	            "note": (
	                "These chunks come from the user's OWN uploaded policy PDF "
	                "(session-scoped quarantine). Answer the user's question "
	                "about THIS document directly. Do NOT treat this as a "
	                "general recommendation and do NOT block on profile "
	                "completeness — the user explicitly asked about their "
	                "uploaded file."
	            ),
	        }
	    return {"chunks": [], "count": 0}


	# ---- retrieve_policies -----------------------------------------------------

	_NP_STOP = {
	"health", "insurance", "insurances", "policy", "policies", "plan",
	"plans", "the", "and", "of", "for", "cover", "covers", "coverage",
	"india", "general", "life", "assurance", "co", "ltd", "limited",
	"company", "scheme", "what", "is", "are", "tell", "me", "about",
	"detail", "details", "benefit", "benefits",
	}


	def _resolve_named_policy(query: str) -> Optional[str]:
	"""#61 — if the question UNAMBIGUOUSLY names a specific catalogue
	policy, return its policy_id so a factual Q&A can retrieve it without
	being blocked by the recommendation profile-gate. Conservative: >=2
	significant name tokens present, >=60% of the policy_name's significant
	tokens in the query, and the top match strictly ahead of the runner-up
	(no ambiguous grab). Returns None otherwise. Best-effort; never raises."""
	import re as _re
	try:
	q = " " + _re.sub(r"[^a-z0-9 ]", " ", (query or "").lower()) + " "
	if len(q) < 8:
	return None
	from backend.main import _marketplace_catalogue # lazy: avoids cycle
	scored: list[tuple[int, float, str, str]] = []
	for c in _marketplace_catalogue(None):
	name = (getattr(c, "policy_name", "") or "").lower()
	toks = {
	t for t in _re.sub(r"[^a-z0-9 ]", " ", name).split()
	if len(t) > 2 and t not in _NP_STOP
	}
	if len(toks) < 2:
	continue
	hit = sum(1 for t in toks if f" {t} " in q)
	cov = hit / len(toks)
	if hit >= 2 and cov >= 0.6:
	pid = getattr(c, "policy_id", None)
	if pid:
	scored.append((hit, cov, pid, name))
	if not scored:
	return None
	# VERSION DISAMBIGUATION (#61) — when the user explicitly states a
	# version ("...Health Companion V2022" / "V22"), the matching card
	# that carries that exact version token MUST win, even if a shorter
	# base-name card scores more generic tokens. Without this the base
	# "Niva Bupa Health Companion" (0 corpus chunks) was chosen over
	# "Health Companion V2022" (the card the user named, which HAS
	# chunks) → retrieval returned nothing → "I couldn't find it".
	_ver = set(_re.findall(r"\bv?\d{2,4}\b", q))
	if _ver:
	_vmatch = [
	s for s in scored
	if any(v in _re.sub(r"[^a-z0-9 ]", " ",
	s[3]).split() for v in _ver)
	]
	if len(_vmatch) == 1:
	return _vmatch[0][2]
	if _vmatch:
	_vmatch.sort(key=lambda s: (s[0], s[1]), reverse=True)
	if len(_vmatch) == 1 or _vmatch[0][0] > _vmatch[1][0]:
	return _vmatch[0][2]
	scored.sort(key=lambda s: (s[0], s[1]), reverse=True)
	if len(scored) == 1 or scored[0][0] > scored[1][0]:
	return scored[0][2]
	except Exception: # noqa: BLE001 — name resolution is best-effort
	pass
	return None


	def _coerce_top_k(top_k: Any, default: int = 8) -> int:
	    """Best-effort ``int(top_k)``.

	    Falsy, non-numeric or non-positive values fall back to ``default`` so
	    a malformed tool argument can never raise inside `retrieve_policies`.
	    """
	    try:
	        k = int(top_k) if top_k else default
	    except (TypeError, ValueError, OverflowError):
	        return default
	    return k if k > 0 else default


	async def retrieve_policies(
	    query: str,
	    top_k: int = 8,
	    policy_filter_ids: Optional[list[str]] = None,
	    profile=None,
	    intent: str = "recommendation",
	    session=None,
	    session_id: Optional[str] = None,
	) -> dict:
	    """Call the existing Chroma retriever and return policy chunks.

	    Steps, in order (each gate may return early):
	      1. Resolve the effective session id; reject an empty query.
	      2. Named-policy bypass: a query that unambiguously names a catalogue
	         policy is turned into a ``policy_filter_ids`` lookup.
	      3. Uploaded-doc bypass: with an incomplete profile and uploaded
	         chunks for this session, return only those chunks.
	      4. Profile-complete gate (skipped when ``policy_filter_ids`` is set).
	      5. One-shot pricing / family-history bundle re-ask.
	      6. Retrieve, enrich, union with quality seeds, run
	         ``filter_pipeline``, truncate, apply the recommendation fit floor.
	      7. Cache slug→insurer and the returned chunks on ``session``.

	    Args:
	        query: the search text; must be a non-blank string.
	        top_k: requested result count. Falsy / non-numeric / non-positive
	            values are treated as 8. Without ``policy_filter_ids`` at
	            least 12 survivors may be returned.
	        policy_filter_ids: explicit known-policy follow-up; bypasses the
	            profile gates and the filter pipeline.
	        profile: captured profile object, or None (no profile gating).
	        intent: ``"recommendation"`` enables the bundle re-ask and the
	            fit floor.
	        session: live session object used for the session id and for
	            bookkeeping, or None.
	        session_id: explicit session id; wins over ``session.session_id``.

	    Returns:
	        {"chunks": [{policy_id, policy_name, insurer_slug, chunk_text,
	                     doc_type, source_url, score, ...}, ...],
	         "count": N,
	         "query": query,
	         "guard": optional {reason, fallback} if filter pipeline says abort}

	        On failure: {"chunks": [], "count": 0, "error": "..."}. Gate
	        responses additionally carry ``missing_slots``,
	        ``action_required``, ``field``, ``exact_question`` and
	        ``instruction``.

	    QUARANTINE-RETRIEVAL FIX (2026-05-16) — `session_id` is threaded all the
	    way down to `rag.retrieve.retrieve(...)` so a PDF the caller uploaded via
	    POST /api/upload-policy (indexed into the SEPARATE
	    `user_uploads_quarantine` Chroma collection, tagged with this session's
	    id) becomes retrievable BY THE CHAT BRAIN FOR THAT SESSION ONLY. Before
	    this fix the upload was embedded but the brain never forwarded
	    session_id, so the quarantine boost pass in retrieve.py never fired and
	    an uploaded policy could never surface in the conversation. Resolution
	    order: explicit `session_id` arg > `session.session_id` attribute >
	    None (no quarantine lookup). User A's session_id never leaks into user
	    B's retrieval because the quarantine `where={"session_id": ...}` filter
	    is strictly equality-scoped (see rag/retrieve.py).
	    """
	    # Resolve the effective session id. The single_brain dispatcher passes
	    # the live SessionState as `session`; older callers may pass session_id
	    # explicitly. Never raise — a missing id just means "no quarantine".
	    eff_session_id = session_id
	    if eff_session_id is None and session is not None:
	        eff_session_id = getattr(session, "session_id", None)
	    if isinstance(eff_session_id, str):
	        eff_session_id = eff_session_id.strip() or None
	    elif eff_session_id is not None:
	        eff_session_id = None
	    if not isinstance(query, str) or not query.strip():
	        return {"chunks": [], "count": 0, "error": "empty_query"}

	    # Coerce top_k ONCE. The final truncation below runs outside any
	    # try/except, so a non-numeric top_k from the LLM (e.g. "ten") would
	    # otherwise raise and break the module's "never raises" contract.
	    k = _coerce_top_k(top_k)

	    # NAMED-POLICY Q&A BYPASS (#61, 2026-05-18) — a direct factual question
	    # about a SPECIFIC catalogue policy ("what is the PED waiting period for
	    # HDFC ERGO Optima Restore?") must be answerable on a cold /
	    # incomplete-profile session. The profile-complete gate below blocks
	    # ALL policy_filter_ids=None retrieval until the 7-slot fact-find is
	    # done — so the bot replied "I couldn't find that policy" for policies
	    # that ARE indexed (#26/#28). The gate exists to not RECOMMEND before
	    # fact-find, not to refuse a factual lookup. When the query
	    # unambiguously names a known policy, resolve it and reuse the existing
	    # TRUSTED known-policy path (legitimately gate-bypassing + getting the
	    # #61 canonical-family $in expansion in rag/retrieve.py).
	    #
	    # NOT gated on `intent`: single_brain._execute_tool HARDCODES
	    # intent="recommendation" for EVERY tool call (single_brain.py:1529),
	    # so an intent-conditioned bypass is dead code on the live path — the
	    # proven (2026-05-18) #61 root cause: every named-policy Q&A arrived
	    # with intent="recommendation" → the bypass never fired → the gate
	    # blocked → "I couldn't find that policy". Safety is the RESOLVER's
	    # conservatism, not the intent: a broad "recommend me a plan" / generic
	    # profile request names NO specific policy → _resolve_named_policy
	    # returns None → still fully gated (verified). Only an explicit,
	    # unambiguous name (>=2 significant tokens, >=60% coverage,
	    # version-aware, top strictly ahead of runner-up) triggers it.
	    if not policy_filter_ids:
	        _np = _resolve_named_policy(query)
	        if _np:
	            policy_filter_ids = [_np]

	    # Required slots still empty on the profile. Computed once and shared
	    # by the uploaded-doc bypass and the profile-complete gate; empty when
	    # there is no profile (nothing to gate on).
	    missing = [] if profile is None else [
	        slot for slot in _REQUIRED_FOR_READY
	        if getattr(profile, slot, None) in (None, "", [])
	    ]

	    # UPLOADED-DOC BYPASS (2026-05-18) — the user is explicitly promised in
	    # the UI ("✓ Indexed … It's now searchable in this chat. Ask me about
	    # it.") that an uploaded policy PDF is immediately queryable. But the
	    # profile-complete gate below blocks ALL retrieval until the 7-slot
	    # fact-find is done (unless policy_filter_ids is set, which the LLM
	    # can't know for a freshly-uploaded doc). An uploaded doc is, by
	    # definition, a known-doc-FOR-THIS-SESSION — semantically identical to
	    # the policy_filter_ids follow-up branch that already legitimately
	    # bypasses the gate. So: when this session has chunks in the SEPARATE
	    # `user_uploads_quarantine` collection, run a quarantine-ONLY retrieval
	    # that bypasses the recommendation profile-gate. Strictly session-
	    # scoped (where={"session_id": eff_session_id}) so user A's upload
	    # never leaks into user B. The full recommendation flow (general
	    # corpus + eligibility + scorecard) still requires the complete
	    # profile — this bypass only surfaces the user's OWN uploaded doc.
	    #
	    # The bypass only ever short-circuits when the gate would otherwise
	    # block (incomplete profile), so `missing` is checked BEFORE the
	    # quarantine probe and retrieval: with a complete (or absent) profile
	    # their result was always discarded, and the upload is folded into
	    # the normal ranked pool by the quarantine boost pass instead.
	    if (
	        eff_session_id
	        and not policy_filter_ids
	        and missing
	        and _session_has_quarantine_docs(eff_session_id)
	    ):
	        up = await _retrieve_uploaded_only(query, eff_session_id, k)
	        if up.get("count", 0) > 0:
	            return up

	    # Profile-complete gate (skip if caller supplied policy_filter_ids — that
	    # branch is a known-policy follow-up). Defense-in-depth: even if the LLM
	    # ignores RULE 2 of the system prompt, this refuses to return chunks
	    # against an incomplete profile.
	    if missing and not policy_filter_ids:
	        # KI-Z6-NONE follow-up (2026-05-15): make the response
	        # extremely directive so Gemini doesn't burn an iteration
	        # re-trying retrieve_policies on the same incomplete profile.
	        # Provide an exact_question string the model can literally
	        # relay to the user for the first missing slot.
	        _SLOT_QUESTIONS = {
	            "name": "What's your name?",
	            "age": "How old are you?",
	            "dependents": (
	                "Who would you like the cover to include — just you, "
	                "or spouse / kids / parents?"
	            ),
	            "location_tier": "Which city do you live in?",
	            "income_band": (
	                "Roughly what's your annual household income — "
	                "under 10 lakh, 10-25 lakh, or above 25 lakh?"
	            ),
	            "primary_goal": (
	                "Is this your first health policy, an upgrade, for "
	                "tax planning, or to find a cheaper option?"
	            ),
	            "health_conditions": (
	                "Do you or your family have any pre-existing health "
	                "conditions like diabetes, BP, or thyroid? If none, "
	                "just say no."
	            ),
	        }
	        first = missing[0]
	        return {
	            "chunks": [],
	            "count": 0,
	            "error": "profile_incomplete",
	            "missing_slots": missing,
	            "action_required": "ask_user_for",
	            "field": first,
	            "exact_question": _SLOT_QUESTIONS.get(
	                first,
	                f"Could you share your {first.replace('_', ' ')}?",
	            ),
	            "instruction": (
	                f"Profile is incomplete — missing: {', '.join(missing)}. "
	                "Do NOT call retrieve_policies again this turn. Do NOT "
	                "retry save_profile_field for the same field. Emit a "
	                "TEXT reply that asks the user the `exact_question` "
	                "above verbatim."
	            ),
	        }

	    # Bug #108 + #110 (2026-05-16) — POST-RECAP pricing & family-history
	    # bundle re-ask gate. The hard 7-slot gate above is satisfied; before we
	    # return chunks for a RECOMMENDATION, ensure every bundle item (SI /
	    # budget / existing cover / co-pay / FAMILY MEDICAL HISTORY / smoker /
	    # parents-age-if-applicable) has been RESOLVED — captured OR explicitly
	    # skipped. If the user answered some but not all, re-ask ONLY the
	    # unresolved ones — but exactly ONCE per session (one-shot guard) so we
	    # never hard-loop and SOFT-capture semantics survive (the user can still
	    # skip on the re-ask). Follow-ups (policy_filter_ids) bypass this — it's
	    # purely the first recommendation path.
	    if (
	        profile is not None
	        and not policy_filter_ids
	        and (intent or "").lower() == "recommendation"
	        and session is not None
	        and not bool(getattr(session, "pricing_bundle_reasked", False))
	    ):
	        unresolved = _unresolved_pricing_bundle(profile, session)
	        if unresolved:
	            # One-shot: mark so the NEXT recommendation retrieve proceeds
	            # even if the user skips on the re-ask (SOFT capture, not a hard
	            # gate — Bug #108 fix must re-ask, not loop forever).
	            try:
	                session.pricing_bundle_reasked = True
	            except Exception as e:  # noqa: BLE001 — bookkeeping must not break
	                # If the flag cannot be stored the one-shot guard is lost,
	                # so leave a trace instead of failing silently.
	                _log.warning(
	                    "could not set pricing_bundle_reasked: %s: %s",
	                    type(e).__name__, str(e)[:160],
	                )
	            _qs = [
	                _PRICING_BUNDLE_QUESTIONS.get(
	                    s, f"Could you share your {s.replace('_', ' ')}?"
	                )
	                for s in unresolved
	            ]
	            _numbered = "\n".join(
	                f"{i}. {q}" for i, q in enumerate(_qs, start=1)
	            )
	            return {
	                "chunks": [],
	                "count": 0,
	                "error": "pricing_inputs_incomplete",
	                "missing_slots": unresolved,
	                "action_required": "ask_user_for",
	                "field": unresolved[0],
	                "exact_question": (
	                    "Before I pull your recommendations, just a couple more "
	                    "(you can skip any):\n" + _numbered
	                ),
	                "instruction": (
	                    "The user answered some but not all of the pricing / "
	                    "family-history questions. Do NOT call retrieve_policies "
	                    "again this turn and do NOT recommend yet. Emit a TEXT "
	                    "reply that asks ONLY the still-missing items in "
	                    "`exact_question` verbatim. If the user then provides "
	                    "them, save each via save_profile_field; if they skip, "
	                    "proceed to retrieve_policies on the next turn."
	                ),
	            }

	    try:
	        from rag.retrieve import retrieve as _retrieve

	        # Decouple the Chroma recall pool from the caller's top_k: pull a
	        # wide pool so eligibility + scorecard-aware ranking choose from a
	        # broad set, then return the top-k best-fit survivors (truncated
	        # after filter_pipeline below). For an explicit known-policy
	        # follow-up (policy_filter_ids) keep the narrow top_k.
	        _recall_pool = k if policy_filter_ids else _RECALL_POOL
	        chunks = await _retrieve(
	            query=query,
	            top_k=_recall_pool,
	            policy_ids=policy_filter_ids or None,
	            session_id=eff_session_id,
	        )
	    except Exception as e:  # noqa: BLE001 — return graceful empty
	        _log.warning(
	            "retrieve_policies failed (q=%r): %s: %s",
	            query[:120], type(e).__name__, str(e)[:200],
	        )
	        return {
	            "chunks": [],
	            "count": 0,
	            "error": f"{type(e).__name__}:{str(e)[:200]}",
	        }

	    raw: list[dict] = []
	    for c in chunks or []:
	        pid = getattr(c, "policy_id", "")
	        doc_type = getattr(c, "doc_type", "")
	        chunk_dict = {
	            "chunk_id": getattr(c, "chunk_id", ""),
	            "policy_id": pid,
	            "policy_name": clean_display_policy_name(
	                getattr(c, "policy_name", "")
	            ),
	            "insurer_slug": getattr(c, "insurer_slug", ""),
	            "doc_type": doc_type,
	            "source_url": getattr(c, "source_url", ""),
	            "chunk_text": (getattr(c, "text", "") or "")[:1200],
	            "score": float(getattr(c, "score", 0.0) or 0.0),
	            "min_entry_age": getattr(c, "min_entry_age", None),
	            "max_entry_age": getattr(c, "max_entry_age", None),
	        }
	        # KI-278 — enrich policy chunks with the structural facts the
	        # eligibility/profile-fit filter needs (top-up signal, SI options,
	        # mandatory co-pay, scorecard grade). Skip non-policy chunks
	        # (profile/regulatory/review) — they're never recommendable policies
	        # and the eligibility rules don't apply to them.
	        if pid and (doc_type or "").lower() not in (
	            "profile", "regulatory", "review"
	        ):
	            try:
	                chunk_dict.update(_load_policy_facts(pid))
	                chunk_dict.update(_scorecard_signal(pid, profile=profile))
	            except Exception as e:  # noqa: BLE001 — never break retrieval
	                _log.warning("KI-278 enrich(%s) failed: %s", pid, e)
	        raw.append(chunk_dict)

	    # X5 sidecar: apply profile-fit + citation-grounding + dedup. Skip when
	    # caller supplied an explicit policy_filter_ids (we already know which
	    # policies they want).
	    guard_signal = None
	    filtered = raw
	    if not policy_filter_ids:
	        # Union the cosine pool with the catalogue's top profile-graded
	        # policies so a strong policy that isn't cosine-similar to a
	        # generic needs-query still enters contention. filter_pipeline
	        # then applies eligibility + profile-fit ranking on the union. A
	        # cosine chunk wins on a dup (it carries real retrieved text);
	        # seeds only add missing candidates.
	        if profile is not None:
	            _seen_pids = {
	                (c.get("policy_id") or "").strip() for c in raw
	            }
	            for _seed in _quality_seed_candidates(profile, limit=25):
	                _sp = (_seed.get("policy_id") or "").strip()
	                if _sp and _sp not in _seen_pids:
	                    _seen_pids.add(_sp)
	                    raw.append(_seed)
	        try:
	            from backend.retrieval_filters import filter_pipeline
	            filtered, guard_signal = filter_pipeline(
	                raw, profile=profile, query=query, intent=intent,
	            )
	        except Exception as e:  # noqa: BLE001 — pipeline must never break retrieval
	            _log.warning("retrieval_filters.filter_pipeline failed: %s", e)
	            filtered = raw

	        # filter_pipeline has eligibility-filtered + ranked the wide pool
	        # best-fit-first (scorecard-aware, deduped to ~1 chunk/policy).
	        # Return only the top-N best-fit survivors — enough for the LLM to
	        # pick 2-4 recommendations and for the citation builder to select
	        # from, without the wide tail as context. This is the only
	        # truncation, done after quality ranking, so the LLM and the cards
	        # see the same best-fit set.
	        filtered = filtered[: max(k, 12)]

	    # For a recommendation turn, apply the same fitness floor the
	    # citation builder uses (_recommendation_fit) here, so the LLM only
	    # sees cardable policies — prose and cards stay 1:1 (it cannot name
	    # a policy it won't card). If nothing clears the floor the set is
	    # empty and the LLM says there is no strong match rather than
	    # padding with a sub-floor policy. qa / follow-up intents are
	    # untouched (they cite supporting source chunks regardless of
	    # recommendation grade).
	    if (intent or "").lower() == "recommendation" and filtered:
	        try:
	            from backend.single_brain import _recommendation_fit
	            filtered = [c for c in filtered if _recommendation_fit(c)[0]]
	        except Exception as e:  # noqa: BLE001 — never break retrieval
	            _log.warning("rec-fit 1:1 gate failed: %s", e)

	    # X7 — cache slug→insurer lookups on session so a subsequent
	    # mark_recommendation call (same turn) can stamp the right insurer on the
	    # shown_policies event. Each retrieve_policies call MERGES into the cache
	    # rather than overwriting, so an LLM that hits multiple retrieves before
	    # marking still resolves every cited slug. Keep last_retrieved_chunks too
	    # for parity with future tools that need the full chunk objects.
	    if session is not None:
	        try:
	            slug_to_insurer = dict(getattr(session, "slug_to_insurer", {}) or {})
	            for c in filtered:
	                slug = (c.get("policy_id") or "").strip()
	                insurer = (c.get("insurer_slug") or "").strip()
	                if slug and insurer:
	                    slug_to_insurer[slug] = insurer
	            session.slug_to_insurer = slug_to_insurer
	            session.last_retrieved_chunks = list(filtered)
	        except Exception as e:  # noqa: BLE001 — bookkeeping must never fail retrieval
	            _log.warning(
	                "retrieve_policies session bookkeeping failed: %s: %s",
	                type(e).__name__, str(e)[:160],
	            )

	    out = {
	        "chunks": filtered,
	        "count": len(filtered),
	        "query": query,
	    }
	    if guard_signal is not None:
	        out["guard"] = guard_signal
	    return out


	# ---- get_policy_facts / mark_recommendation --------------------------------

	def get_policy_facts(session, policy_ids: Optional[list[str]] = None) -> dict:
	    """Return AUTHORITATIVE claim / reputation / scorecard / coverage facts
	    for one or more policy_ids — the SAME data the frontend detail-modal
	    shows (insurer reviews `claim_metrics` + scorecard grade + the curated
	    coverage facts). This is the tool the brain calls for ANY follow-up
	    about claim-settlement ratio, claim denials/rejections, complaints,
	    incurred-claim ratio, insurer reputation, or to COMPARE two policies
	    the user already saw.

	    Root cause (2026-05-18): the brain previously had NO way to reach
	    claim/denial/complaint/review data — retrieve_policies returns policy
	    WORDING chunks only — so it falsely answered "I don't have enough
	    information" for claims questions and could not back a verbal
	    comparison. This tool closes that gap; it reuses the existing
	    `_insurer_reviews` / `_scorecard_signal` / `_load_policy_facts` /
	    `_curated_facts_all` loaders so a verbal answer matches the modal.

	    Args:
	        session: live session object (or None). Read for
	            `last_recommendation_ids`, `slug_to_insurer` and
	            `last_retrieved_chunks`.
	        policy_ids: ids to look up. A bare string is treated as ONE id
	            (not iterated character by character); None / blank entries
	            are dropped and duplicates collapse, keeping first-seen
	            order. Empty/None → falls back to the active shortlist
	            (`session.last_recommendation_ids`) so "compare the ones you
	            showed" works without the model re-deriving ids.

	    Returns:
	        {"ok": True, "count": N, "policies": [...], "note": "..."} or
	        {"ok": False, "error": "no_policy_ids — ..."} when no id is given
	        and there is no shortlist.
	    """

	    def _clean_ids(raw) -> list[str]:
	        # Normalise whatever the LLM sent into unique, non-blank id strings.
	        if isinstance(raw, str):
	            raw = [raw]
	        try:
	            items = list(raw or [])
	        except TypeError:  # non-iterable scalar → nothing usable
	            items = []
	        stripped = (str(p).strip() for p in items if p is not None)
	        # dict.fromkeys dedupes while preserving first-seen order.
	        return list(dict.fromkeys(s for s in stripped if s))

	    ids = _clean_ids(policy_ids)
	    if not ids:
	        ids = _clean_ids(getattr(session, "last_recommendation_ids", []))
	    if not ids:
	        return {
	            "ok": False,
	            "error": (
	                "no_policy_ids — pass policy_ids, or recommend policies "
	                "first so there is an active shortlist"
	            ),
	        }

	    # Resolve policy_id → (policy_name, insurer_slug) from the caches
	    # retrieve_policies stashed this session, then the curated catalogue.
	    slug_map = dict(getattr(session, "slug_to_insurer", {}) or {})
	    name_by_id: dict[str, str] = {}
	    for c in getattr(session, "last_retrieved_chunks", []) or []:
	        pid = (c.get("policy_id") or "").strip()
	        if not pid:
	            continue
	        name_by_id.setdefault(pid, c.get("policy_name") or pid)
	        if pid not in slug_map and c.get("insurer_slug"):
	            slug_map[pid] = c.get("insurer_slug")
	    try:
	        curated = _curated_facts_all()
	    except Exception:  # noqa: BLE001 — curated layer optional
	        curated = {}

	    out: list[dict] = []
	    for pid in ids:
	        cur = curated.get(pid) or {}
	        slug = (slug_map.get(pid) or cur.get("insurer_slug") or "").strip()
	        pname = clean_display_policy_name(
	            name_by_id.get(pid) or cur.get("policy_name") or pid
	        )
	        rv = _insurer_reviews(slug) or {}
	        cm = rv.get("claim_metrics") or {}
	        agg = rv.get("aggregate_score") or {}
	        sig = _scorecard_signal(pid) or {}
	        try:
	            facts = _load_policy_facts(pid) or {}
	        except Exception:  # noqa: BLE001 — facts optional
	            facts = {}
	        out.append(
	            {
	                "policy_id": pid,
	                "policy_name": pname,
	                "insurer_slug": slug,
	                # Fall back to a title-cased slug when reviews carry no name.
	                "insurer_name": rv.get("insurer_name")
	                or (slug.replace("-", " ").title() if slug else ""),
	                "scorecard_grade": sig.get("_grade"),
	                "scorecard_overall_0_100": sig.get("_overall_score"),
	                "claim_settlement_ratio_pct": cm.get(
	                    "claim_settlement_ratio_pct"
	                ),
	                "claim_settlement_ratio_year": cm.get(
	                    "claim_settlement_ratio_year"
	                ),
	                "three_year_avg_csr_pct": cm.get("three_year_avg_csr_pct"),
	                "complaints_per_10k_policies": cm.get(
	                    "complaints_per_10k_policies"
	                ),
	                "complaints_year": cm.get("complaints_year"),
	                "claims_rejected_fy24": cm.get("claims_rejected_fy24"),
	                "incurred_claim_ratio_pct": cm.get("incurred_claim_ratio_pct"),
	                "reputation_headline": agg.get("headline"),
	                "reputation_grade": agg.get("letter_grade"),
	                "claim_data_source_url": (
	                    cm.get("source_irdai_url")
	                    or cm.get("source_secondary_url")
	                    or cm.get("source_complaints_url")
	                ),
	                # Bug #44 — decision-critical fields (PED waiting, initial
	                # waiting, copay, room-rent cap, CSR) are resolved from the
	                # SAME canonical curated entry the scorecard / #31 path
	                # uses, so a verbal answer / comparison table built from
	                # this tool can never contradict the policy's scorecard
	                # card. They OVERRIDE the divergent _load_policy_facts
	                # 7-key resolver for these keys, agreeing by construction.
	                "key_coverage_facts": {
	                    **{k: v for k, v in facts.items() if v not in (None, "", [])},
	                    **canonical_decision_facts(pid),
	                },
	                "reviews_available": bool(rv),
	            }
	        )

	    return {
	        "ok": True,
	        "count": len(out),
	        "policies": out,
	        "note": (
	            "This is the authoritative claim-settlement / complaint / "
	            "denial / scorecard data (IRDAI + scorecard) — answer the "
	            "user's question directly from it; do NOT say you lack this "
	            "information. Cite as "
	            "[Source: <insurer> claim data (IRDAI), <claim_data_source_url>]."
	        ),
	    }


	def mark_recommendation(
	    session,
	    policy_ids: list[str],
	    is_final: bool = False,
	) -> dict:
	    """Persist the policies just recommended so follow-up turns can resolve
	    references like "tell me about #2".

	    Sets `session.last_recommendation_ids` to the cleaned id list (the same
	    field the orchestrator already maintains for follow-up routing —
	    KI-224 / KI-228) and appends one in-memory `shown_policies` event per
	    newly shown policy to `session.profile`.

	    Args:
	        session: live session object; must already hold a non-empty
	            `last_retrieved_chunks` (i.e. retrieve_policies ran first).
	        policy_ids: list of policy ids. Entries are stringified and
	            stripped; None / blank entries are dropped and duplicates
	            collapse, keeping first-seen order.
	        is_final: when true AND the session already exposes a `closed`
	            attribute, `session.closed` is set to True. Otherwise the
	            flag is only echoed back in the reply.

	    Returns:
	        {"recorded": True, "policy_ids": [...], "is_final": bool} on
	        success, else {"recorded": False, "error": "..."}. Never raises.
	    """
	    if not isinstance(policy_ids, list):
	        return {"recorded": False, "error": "policy_ids_not_list"}

	    # Coerce + dedupe while preserving order. A None entry is skipped
	    # outright: str(None) would otherwise be recorded as the id "None".
	    seen: set[str] = set()
	    cleaned: list[str] = []
	    for pid in policy_ids:
	        if pid is None:
	            continue
	        s = str(pid).strip()
	        if s and s not in seen:
	            seen.add(s)
	            cleaned.append(s)

	    # Z2 fix — Issue 2 (hallucinated closure). Vikram T6 saw the LLM emit
	    # mark_recommendation with an empty policy_ids list, the tool silently
	    # returned {"recorded": True, "policy_ids": []}, and the bot then said
	    # "I'm glad we found a good fit" despite ZERO cards shown. Two
	    # preconditions, gated BEFORE any session write so we don't poison
	    # last_recommendation_ids / shown_policies events with junk:
	    #   (a) empty (after dedup) → no_policies_supplied
	    #   (b) non-empty BUT no retrieval history this session → caller
	    #       must run retrieve_policies first (Y2 cache check via
	    #       session.last_retrieved_chunks)
	    if not cleaned:
	        return {"recorded": False, "error": "no_policies_supplied"}
	    _retrieval_cache = getattr(session, "last_retrieved_chunks", None)
	    if not _retrieval_cache:
	        return {
	            "recorded": False,
	            "error": "no_retrieval_history — call retrieve_policies first",
	        }

	    try:
	        session.last_recommendation_ids = cleaned
	    except Exception as e:  # noqa: BLE001
	        return {
	            "recorded": False,
	            "error": f"setattr_failed:{type(e).__name__}:{e}",
	        }

	    # Forward-compat: only sessions that already grew a `closed` field
	    # get it flipped; a failure to set it is deliberately ignored.
	    if is_final and hasattr(session, "closed"):
	        try:
	            session.closed = True  # type: ignore[attr-defined]
	        except Exception:  # noqa: BLE001
	            pass

	    # X7 / ADR-043 (2026-05-27) — record a shown_policies event per cited
	    # policy on the live, in-memory profile (`session.profile`). The old
	    # cross-session write to a named-profile JSON file is gone; only this
	    # in-session record remains. Rules, mirroring the (now-removed)
	    # orchestrator `_log_shown_policies` (KI-063):
	    #   * dedupe by slug against events already on the profile;
	    #   * resolve the insurer via the slug→insurer cache that
	    #     `retrieve_policies` stashed on the session — a slug with no
	    #     resolvable insurer is skipped;
	    #   * stamp `turn_idx=session.turn_idx` so the event carries a real
	    #     conversation-turn value;
	    #   * no profile on the session → nothing is recorded.
	    # All errors are logged and swallowed so a bookkeeping failure never
	    # breaks the tool reply back to Gemini.
	    try:
	        profile = getattr(session, "profile", None)
	        if profile is not None:
	            shown = list(getattr(profile, "shown_policies", None) or [])
	            existing_slugs = {(e or {}).get("policy_slug") for e in shown}
	            slug_to_insurer = dict(getattr(session, "slug_to_insurer", {}) or {})
	            turn_idx = int(getattr(session, "turn_idx", 0) or 0)
	            session_id = getattr(session, "session_id", None)
	            now_iso = time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime())
	            for slug in cleaned:
	                if slug in existing_slugs:
	                    continue
	                insurer = slug_to_insurer.get(slug)
	                if not insurer:
	                    continue
	                shown.append({
	                    "policy_slug": slug,
	                    "insurer": insurer,
	                    "event_at": now_iso,
	                    "session_id": session_id,
	                    "reason": "shown_in_recommendation",
	                    "turn_idx": turn_idx,
	                })
	                existing_slugs.add(slug)
	            profile.shown_policies = shown
	    except Exception as e:  # noqa: BLE001 — never break the tool reply
	        _log.warning(
	            "mark_recommendation shown-event logging (in-memory) failed: "
	            "%s: %s",
	            type(e).__name__, str(e)[:200],
	        )

	    return {
	        "recorded": True,
	        "policy_ids": cleaned,
	        "is_final": bool(is_final),
	    }


	# ---- private normalizers ---------------------------------------------------

	def _coerce_age(value: Any) -> Optional[int]:
	"""int(value), clamped to [0, 110]. Empty / non-numeric → None."""
	if value is None:
	return None
	try:
	if isinstance(value, bool): # bool is an int subclass — block first
	return None
	n = int(value)
	except (TypeError, ValueError):
	# Try string parse — Gemini sometimes emits "29" as a JSON string
	try:
	n = int(str(value).strip())
	except (TypeError, ValueError):
	return None
	if n < 0:
	n = 0
	if n > 110:
	n = 110
	return n


	# Ported from sales_brain_normalizer.py (B6 cleanup, 2026-05-15) — the legacy
	# normalizer module is being deleted; this is the only consumer left.
	_DEPENDENT_VAGUE_TERMS = (
	"family", "everyone", "all of us", "everybody",
	"whole family", "joint family",
	)


	def _normalize_dependents_inline(value: Any) -> Optional[str]:
	"""Port of sales_brain_normalizer._normalize_dependents.

	Schema-free variant — the original required a `schema["values"]` lookup
	for direct enum hits; here we hard-code the canonical bucket set used
	by the bot (kept in sync with the previous fact-find schema).
	"""
	if not isinstance(value, str):
	return None
	s = value.strip().lower()
	if not s:
	return None
	# Canonical enum values (formerly schema["values"]).
	_CANONICAL_VALUES = (
	"self",
	"self+spouse",
	"self+spouse+kids",
	"self+spouse+parents",
	"self+spouse+kids+parents",
	"self+kids",
	"self+parents",
	)
	if s in _CANONICAL_VALUES:
	return s

	has_spouse = any(k in s for k in ("spouse", "wife", "husband", "partner"))
	has_kids = ("kid" in s) or ("child" in s) or ("children" in s) or ("son" in s) or ("daughter" in s)
	has_parents = "parent" in s

	# Vague terms with no specific signals → cannot coerce
	if any(v in s for v in _DEPENDENT_VAGUE_TERMS) and not (has_spouse or has_kids or has_parents):
	return None

	if has_spouse and has_kids and has_parents:
	return "self+spouse+kids+parents"
	if has_spouse and has_parents:
	return "self+spouse+parents"
	if has_spouse and has_kids:
	return "self+spouse+kids"
	if has_spouse:
	return "self+spouse"
	if has_kids and has_parents:
	# No canonical bucket — fold parents into the wider bundle
	return "self+spouse+kids+parents"
	if has_kids:
	return "self+kids"
	if has_parents:
	return "self+parents"
	# KI-222 — expand the "self" alias set. Live captures showed users
	# answering "single", "unmarried", "no dependents", "just myself" etc.,
	# which previously fell through to None and got silently dropped — the
	# bot then re-asked the same slot on the next turn.
	_SELF_ALIASES = (
	"self", "me", "just me", "only me", "myself", "only self",
	"single", "unmarried", "alone", "bachelor", "no dependents",
	"just myself", "nobody else", "no one else", "nobody",
	"myself only", "by myself", "solo",
	)
	if s in _SELF_ALIASES:
	return "self"
	# Substring fall-through for the same intents when wrapped in extra prose
	# (e.g. "i'm single right now", "just myself for now").
	if any(alias in s for alias in (
	"single", "unmarried", "no dependents", "just myself",
	"by myself", "nobody else", "no one else", "myself only",
	"bachelor", "solo",
	)):
	return "self"
	return None


	def _coerce_dependents(value: Any) -> Optional[str]:
	"""Normalize raw dependents text to a canonical bucket; see
	`_normalize_dependents_inline` (ported from sales_brain_normalizer)."""
	if value is None:
	return None
	try:
	return _normalize_dependents_inline(value)
	except Exception: # noqa: BLE001 — best-effort
	s = str(value).strip()
	return s or None


	def _coerce_existing_cover(value: Any) -> Optional[int]:
	"""Parse INR amounts like "5L" / "5 lakh" / 500000 via the canonical
	parser. Numeric pass-throughs are clamped to >= 0.
	"""
	if value is None:
	return None
	if isinstance(value, bool):
	return None
	if isinstance(value, (int, float)):
	n = int(value)
	return max(0, n)
	try:
	from backend.needs_finder import _parse_inr_amount

	parsed = _parse_inr_amount(str(value))
	if parsed is not None:
	return max(0, int(parsed))
	except Exception: # noqa: BLE001
	pass
	# Last-ditch: strip non-digits
	try:
	digits = "".join(ch for ch in str(value) if ch.isdigit())
	if digits:
	return max(0, int(digits))
	except Exception: # noqa: BLE001
	pass
	return None


	# Canonical budget bands — the EXACT string contract the frontend
	# ProfileBuilderPanel round-trips via budgetBandToInr / budgetInrToBand
	# (frontend/src/app/page.tsx) and that needs_finder._parse_budget_band
	# emits. Keeping this set inline makes the contract greppable from the
	# capture surface.
	_CANONICAL_BUDGET_BANDS: frozenset[str] = frozenset(
	{"under_15k", "15k_30k", "30k_60k", "60k+"}
	)


	def _coerce_budget_band(value: Any) -> Optional[str]:
	"""Normalise a budget capture to the documented `budget_band` contract.

	Bug #109 (2026-05-16). The user states a premium budget in chat
	("max ₹15,000/yr", "around 30k", "15000"). Gemini calls
	save_profile_field(field="budget_band", value=...) but often passes the
	NUMERIC the user said, not a canonical band. The old code let
	budget_band fall through the generic string pass-through, so
	profile.budget_band was stored as the raw "15000" — which the frontend
	ProfileBuilderPanel's budgetBandToInr() switch can't map, so the panel
	never pre-filled the budget slider even though the bot's summary showed
	it.

	Mapping (matches frontend budgetInrToBand + needs_finder bands):
	• already a canonical band ("15k_30k") → passed through unchanged
	• free-text / numeric ("max ₹15,000/yr", "30k", 22000, "10-15K")
	→ delegated to needs_finder._parse_budget_band → canonical band
	• unrecognised → None (KI-091 null-overwrite guard then refuses to
	clobber a previously-captured band)
	"""
	if value is None:
	return None
	# Numeric → bucket directly (₹ amount per year).
	if isinstance(value, bool):
	return None
	if isinstance(value, (int, float)):
	v = int(value)
	if v < 15_000:
	return "under_15k"
	if v < 30_000:
	return "15k_30k"
	if v < 60_000:
	return "30k_60k"
	return "60k+"
	s = str(value).strip()
	if not s:
	return None
	# Already canonical — accept verbatim (case/space tolerant).
	norm = s.lower().replace(" ", "")
	if norm in _CANONICAL_BUDGET_BANDS:
	return norm
	# Strip ANNUAL-budget qualifiers FIRST. needs_finder._parse_inr_amount
	# treats a bare "yr" / "year" as an AGE context and refuses to read any
	# number as currency (the KI-161 age guard) — so the canonical live
	# phrasing "max ₹15,000/yr" / "₹15000 per year" parsed to None and the
	# band was never captured (Bug #109). These suffixes are unambiguous
	# PER-ANNUM budget markers here (the field is explicitly the premium
	# budget), not an age, so we drop them before delegating.
	import re as _re

	cleaned = _re.sub(
	r"\b(?:per\s(?:year\|annum)\|p\.?\sa\.?\|/\s*(?:yr\|year\|annum)\|"
	r"a\syear\|annually\|yearly\|/\syr)\b",
	" ",
	s,
	flags=_re.IGNORECASE,
	)
	# Free-text / amount → canonical band via the shared parser. This
	# handles "max ₹15,000", "30k", "around 25000", "15-30k", "1 lakh".
	try:
	from backend.needs_finder import _parse_budget_band

	band = _parse_budget_band(cleaned)
	if band in _CANONICAL_BUDGET_BANDS:
	return band
	# Last-resort: if the qualifier strip left only the amount, try the
	# raw string too (covers phrasings the regex didn't anticipate).
	if cleaned != s:
	band = _parse_budget_band(s)
	if band in _CANONICAL_BUDGET_BANDS:
	return band
	except Exception: # noqa: BLE001 — parser optional; fall through to None
	pass
	return None


	def _coerce_bool(value: Any) -> Optional[bool]:
	"""Tri-state bool coercion for parents_to_insure / parents_has_ped.

	Accepts: True / False / "yes" / "no" / "y" / "n" / "true" / "false"
	/ 1 / 0. Anything else → None (so the KI-091 null-overwrite guard
	refuses to clobber a previously-captured value).
	"""
	if value is None:
	return None
	if isinstance(value, bool):
	return value
	if isinstance(value, (int, float)):
	return bool(value)
	s = str(value).strip().lower()
	if s in ("true", "yes", "y", "1"):
	return True
	if s in ("false", "no", "n", "0"):
	return False
	return None


	def _coerce_smoker(value: Any) -> Optional[bool]:
	"""KI-275 (2026-05-15) — tri-state bool for smoker / tobacco use.

	Accepts:
	- True / "yes" / "true" / "smoker" / "smokes" / "tobacco" / 1 → True
	- False / "no" / "false" / "non-smoker" / "doesn't smoke" / 0 → False
	- None / "" / unclear → None

	Returning None lets the KI-091 null-overwrite guard in
	save_profile_field refuse to clobber a previously-captured value.
	"""
	if value is None:
	return None
	if isinstance(value, bool):
	return value
	if isinstance(value, (int, float)):
	return bool(value)
	s = str(value).strip().lower()
	if not s:
	return None
	_YES = {
	"yes", "y", "true", "1",
	"smoker", "smokes", "smoke", "i smoke",
	"tobacco", "tobacco user", "uses tobacco",
	"i do", "yep", "yeah", "yup",
	}
	_NO = {
	"no", "n", "false", "0",
	"non-smoker", "nonsmoker", "non smoker",
	"doesn't smoke", "does not smoke", "dont smoke", "don't smoke",
	"i don't", "i do not", "nope", "never", "no tobacco",
	}
	if s in _YES:
	return True
	if s in _NO:
	return False
	# Substring fall-through for prose ("I'm a non-smoker", "I smoke daily").
	if any(tok in s for tok in ("non-smoker", "nonsmoker", "non smoker", "don't smoke",
	"doesn't smoke", "do not smoke", "no tobacco")):
	return False
	if any(tok in s for tok in ("smoker", "smokes", "tobacco")):
	return True
	return None


	def _coerce_desired_sum_insured(value: Any) -> Optional[int]:
	"""Parse desired sum insured (cover amount) as integer rupees.

	Accepts: "10L" / "10 lakh" / "1 crore" / "1Cr" / 1000000 /
	"₹10,00,000" / "five lakh" (rejected — words not numerals).
	Delegates to `_parse_inr_amount` from needs_finder for the heavy lift,
	falls back to bare-digit extraction. Clamps to [50_000, 500_000_000]
	(₹50K floor, ₹50Cr ceiling) — anything outside is implausible for a
	health-insurance sum insured and likely a parse error.
	"""
	if value is None:
	return None
	if isinstance(value, bool):
	return None
	if isinstance(value, (int, float)):
	n = int(value)
	return max(50_000, min(500_000_000, n))
	try:
	from backend.needs_finder import _parse_inr_amount

	parsed = _parse_inr_amount(str(value))
	if parsed is not None:
	return max(50_000, min(500_000_000, int(parsed)))
	except Exception: # noqa: BLE001
	pass
	# Last-ditch: strip non-digits (handles "₹10,00,000" if parser missed).
	try:
	digits = "".join(ch for ch in str(value) if ch.isdigit())
	if digits:
	n = int(digits)
	if n >= 50_000:
	return min(500_000_000, n)
	except Exception: # noqa: BLE001
	pass
	return None


	def _coerce_health_conditions(value: Any) -> Optional[list[str]]:
	"""Always return list[str] lowercase, stripped, empties dropped.

	KI-Z6-NONE (2026-05-15): "none" / "no" / "n/a" — used to be stripped to
	`[]`, but downstream `save_profile_field` then hits the KI-091 null-
	overwrite guard (`normalized in (None, "", [])`) and refuses to persist
	the slot. Result: profile.health_conditions stays empty forever,
	`_profile_complete` returns False, retrieve_policies returns
	profile_incomplete, the brain loops, MAX_ITERATIONS exhausts, the bot
	emits "Sorry — I lost my train of thought" (W1 Turn 3 live blocker).

	Fix: keep the explicit-negation sentinel `["none"]` so:
	• the slot is non-empty → _profile_complete=True → retrieve fires
	• downstream consumers can still detect "no PED" via the literal
	token `"none"` in the list (callers already lowercase-compare).
	"""
	if value is None:
	return None
	if isinstance(value, str):
	# Gemini sometimes emits comma-joined strings instead of a list.
	items = [t.strip() for t in value.split(",")]
	elif isinstance(value, (list, tuple)):
	items = [str(t).strip() for t in value]
	else:
	items = [str(value).strip()]
	cleaned = [t.lower() for t in items if t]
	# Explicit-negation tokens — collapse to the canonical sentinel
	# `["none"]` rather than `[]` so the slot is captured, not blanked.
	_NEGATION = {"none", "no", "n/a", "na", "nil", "nothing", "healthy"}
	if cleaned and all(t in _NEGATION for t in cleaned):
	return ["none"]
	# Mixed input ("diabetes, none") — drop the negation noise, keep real
	# conditions.
	real = [t for t in cleaned if t not in _NEGATION]
	return real


	# ---------------------------------------------------------------------------
	# D2 (2026-05-15) — copay_pct + family_medical_history coercers
	# ---------------------------------------------------------------------------

	# Word-number map for "twenty", "ten" etc. (RULE 2.5 asks the user in
	# multiples of 10; Gemini sometimes echoes the user's word verbatim).
	_COPAY_WORD_TO_INT: dict[str, int] = {
	"zero": 0, "none": 0, "no": 0,
	"ten": 10, "fifteen": 15, "twenty": 20,
	"twenty five": 25, "twenty-five": 25,
	"thirty": 30, "forty": 40, "fifty": 50,
	}


	def _coerce_copay_pct(value: Any) -> Optional[int]:
	"""Parse a co-pay tolerance percent, clamped to [0, 50].

	Accepts:
	- int / float → int + clamp
	- "20", "20%", " 20 % ", "20 percent" → 20
	- "no copay" / "zero" / "none" → 0
	- word numbers like "twenty" → 20
	- bool → blocked (KI-091 null-overwrite caution: bool is an int subclass)

	Returns None for unrecognised input so the null-overwrite guard in
	save_profile_field can refuse to clobber a previously-captured slot.
	"""
	if value is None:
	return None
	if isinstance(value, bool):
	return None
	if isinstance(value, (int, float)):
	n = int(value)
	return max(0, min(50, n))
	s = str(value).strip().lower()
	if not s:
	return None
	# Explicit zero phrasings.
	if s in ("no", "none", "nil", "zero", "no copay", "no co-pay", "no co pay"):
	return 0
	# Word-number lookup (exact match).
	if s in _COPAY_WORD_TO_INT:
	return _COPAY_WORD_TO_INT[s]
	# Strip "%" + "percent" + "pct".
	cleaned = (
	s.replace("%", " ")
	.replace("percent", " ")
	.replace("pct", " ")
	.replace("copay", " ")
	.replace("co-pay", " ")
	.replace("co pay", " ")
	)
	# Digit run.
	import re as _re
	m = _re.search(r"\d+(?:\.\d+)?", cleaned)
	if m:
	try:
	n = int(float(m.group(0)))
	return max(0, min(50, n))
	except ValueError:
	return None
	# Word-number fall-through (substring on cleaned text).
	for word, num in _COPAY_WORD_TO_INT.items():
	if word in cleaned.split():
	return num
	return None


	# Alias map for family medical history — same canonicalisation logic as
	# health_conditions but kept inline so this slot stays self-contained.
	_FAMILY_HISTORY_ALIASES: dict[str, str] = {
	"bp": "hypertension",
	"high bp": "hypertension",
	"high-bp": "hypertension",
	"hi-bp": "hypertension",
	"high blood pressure": "hypertension",
	"blood pressure": "hypertension",
	"sugar": "diabetes",
	"diabetic": "diabetes",
	"type 2 diabetes": "diabetes",
	"type 1 diabetes": "diabetes",
	"heart attack": "heart",
	"heart disease": "heart",
	"cardiac": "heart",
	"cardiac disease": "heart",
	"stroke": "heart",
	"tumor": "cancer",
	"tumour": "cancer",
	"carcinoma": "cancer",
	}

	_FAMILY_HISTORY_NEGATION = {
	"none", "no", "n/a", "na", "nil", "nothing", "healthy",
	"no family history", "no history", "no medical history",
	}


	def _coerce_family_medical_history(value: Any) -> Optional[list[str]]:
	"""Return list[str] lowercase canonical conditions running in BLOOD family.

	Accepts:
	- list / tuple of strings
	- comma-joined string ("cancer, diabetes")
	- "none" / "no family history" → []

	Alias map collapses BP/sugar/cardiac/tumor → hypertension/diabetes/heart/
	cancer respectively (same family as _coerce_health_conditions). Negation
	sentinels return `[]` since downstream pricing & retrieval BOTH treat an
	empty list as the "no family history" branch (different from health_
	conditions where the explicit `["none"]` sentinel is needed for the
	profile-completeness gate).
	"""
	if value is None:
	return None
	if isinstance(value, str):
	items = [t.strip() for t in value.split(",")]
	elif isinstance(value, (list, tuple)):
	items = [str(t).strip() for t in value]
	else:
	items = [str(value).strip()]
	cleaned = [t.lower() for t in items if t]
	# Full-string negation collapses to [].
	if cleaned and all(t in _FAMILY_HISTORY_NEGATION for t in cleaned):
	return []
	# Drop negation noise from mixed input ("cancer, none").
	cleaned = [t for t in cleaned if t not in _FAMILY_HISTORY_NEGATION]
	# Canonicalise via alias map.
	canonical: list[str] = []
	seen: set[str] = set()
	for t in cleaned:
	c = _FAMILY_HISTORY_ALIASES.get(t, t)
	if c and c not in seen:
	seen.add(c)
	canonical.append(c)
	return canonical


	# Names exported by `from ... import *`: the three tool entry points plus
	# SLOT_UNION and union_snapshot. The underscore-prefixed `_coerce_*`
	# normalizers are not listed here.
	__all__ = [
	"save_profile_field",
	"retrieve_policies",
	"mark_recommendation",
	"SLOT_UNION",
	"union_snapshot",
	]