Spaces:

rohitsar567
/

InsuranceBot

Sleeping

App Files Files Community

InsuranceBot / tools /audit /flows.py

rohitsar567

feat(audit): 100-persona multi-scenario simulation framework

3dab53c about 2 months ago

Raw

History Blame Contribute Delete

13.4 kB

	"""Generate 30-turn conversational flows for each persona.

	Flow shape per persona (30 turns total):
	Phase 1 — Opening ( 1 turn)
	Phase 2 — Fact-find answers ( 9 turns)
	Phase 3 — Free-form policy Qs (10 turns)
	Phase 4 — Edge-case probes ( 5 turns)
	Phase 5 — Adversarial + close ( 5 turns)

	Each turn is a single `user_text` string the audit runner will POST to
	/api/chat. The persona's `style` and `lang` control surface variation
	(terse vs verbose, English vs Hinglish, hedge-heavy vs clean).

	Output: tools/audit/flows.json (dict[persona_id, list[str]]).
	"""
	from __future__ import annotations

	import json
	import random
	from pathlib import Path
	from typing import Any

	# Anchor questions per concern — driving what each free-form turn asks.
	CONCERN_QS = {
	"coverage_breadth": ["What does Care Supreme cover for hospital expenses?",
	"Does Star Comprehensive include AYUSH treatment?"],
	"premium_value": ["What's the cheapest ₹10L sum insured option?",
	"Compare premiums on Optima Secure vs Niva Bupa ReAssure"],
	"claim_settlement": ["What's the claim settlement ratio for HDFC ERGO?",
	"Which insurer has the lowest claim rejection rate?"],
	"sum_insured_size": ["Should I buy ₹10L or ₹25L sum insured?",
	"Does restoration benefit fully reset the sum insured?"],
	"ped_waiting": ["What's the PED waiting period under Care Supreme?",
	"Does any policy have a shorter PED waiting than 36 months?"],
	"restoration_benefit": ["Which policies offer unlimited restoration?",
	"When does the restoration benefit kick in?"],
	"parents_age_max": ["Up to what age can I add my parents?",
	"What's the renewal age cap on senior-citizen plans?"],
	"specific_disease_waiting": ["What's the waiting period for cataract surgery?",
	"Does any plan have a shorter cancer waiting period?"],
	"sub_limits": ["Does Care Supreme cap room rent?",
	"What's the ICU sub-limit on Optima Secure?"],
	"network_hospitals": ["How many cashless hospitals does Niva Bupa have in Bangalore?",
	"Does Bajaj Allianz have empanelled hospitals in Delhi?"],
	"no_claim_bonus": ["What's the NCB rate on Optima Restore?",
	"Does NCB compound year-over-year?"],
	"exclusions": ["What's permanently excluded under Care Supreme?",
	"Are pregnancy complications covered?"],
	"free_look": ["How many days is the free-look period?",
	"Can I cancel within the free-look and get a full refund?"],
	"irdai_mandate": ["What does IRDAI's 2024 master circular say about cataract caps?",
	"Is there an IRDAI rule on premium revision frequency?"],
	"tax_treatment": ["How much premium can I claim under Section 80D?",
	"Is the premium for parents above 60 separately deductible?"],
	"ombudsman": ["How do I file an ombudsman complaint?",
	"What's the turnaround for an ombudsman decision?"],
	"reviews": ["What do customers say about ICICI Lombard claim settlement?",
	"How does Star Health rate on Reddit?"],
	"regulatory_overlay": ["Does IRDAI override a policy's claim-time disclosure rule?",
	"What's the standard pre-existing-condition definition per IRDAI?"],
	"section_80d": ["Maximum 80D deduction if I'm 45 and parents are 70?",
	"Does preventive health check-up qualify for 80D?"],
	"premium_band": ["What's a typical premium for ₹15L at age 35?",
	"How much more does ₹25L cost vs ₹10L for a 40-year-old?"],
	"language_switch": ["What is the room rent cap?",
	"रूम रेंट कैप क्या है?"],
	}

	# Edge-case templates — applied to every persona regardless of archetype.
	EDGE_CASES = [
	"Open the marketplace.", # view-context shift
	"Try again", # retry intent (Bug C)
	"I forgot to mention — I was just diagnosed with diabetes", # mid-flow profile update
	"What's the room rent cap on this?", # view-aware reference
	"Just say it again please", # another retry phrasing
	]

	# Adversarial probes — tests refusal, regulatory grounding, OOC behavior.
	ADVERSARIAL = [
	"Does this policy cover space tourism injuries?", # OOC — refuse cleanly
	"Should I buy this policy?", # close-resistance
	"What does IRDAI say about my situation?", # regulatory grounding
	"Compare Star Comprehensive, Care Supreme, and Optima Secure on PED waiting", # multi-policy
	"give me a quick summary of what we discussed", # close
	]


	def _opener(p: dict[str, Any]) -> str:
	arch = p["archetype"]
	style = p["style"]
	base = {
	"first_buyer": "I'm looking to buy my first health insurance policy.",
	"upgrader": "I have a ₹5L cover and want to upgrade.",
	"senior_care": "I need to insure my parents — they're around 75.",
	"comparer": "Help me compare HDFC Optima Secure, Care Supreme, and ICICI Elevate.",
	"anxious": "I'm worried insurers will deny claims later. Where do I start?",
	"savvy": "I want a plan with strong restoration and ≥4Cr lifetime renewability.",
	"tax_planner": "I want to maximise my 80D deduction while getting good cover.",
	"low_trust": "Honest question — which insurer actually pays claims fast?",
	"code_switcher": "Hi, mujhe health insurance chahiye, can you help?",
	"specific_condition": f"I have {p['health_conditions'][0] if p['health_conditions'] else 'a condition'}; what should I look at?",
	}[arch]
	return _stylize(base, style, p["style_hedges"])


	def _factfind_answers(p: dict[str, Any]) -> list[str]:
	"""9 ordered answers matching the fact-find graph: age, dependents,
	income, existing_cover, primary_goal, location, parents, conditions, budget."""
	age = p["age"]
	deps = p["dependents"]
	inc = {"under_5L": "under 5 lakh", "5L-10L": "around 8 lakh", "10L-25L": "around 18 lakh", "25L+": "more than 25 lakh"}[p["income_band"]]
	cover = "no existing cover" if p["existing_cover_inr"] == 0 else "₹5 lakh from work"
	goal = {"first_buy": "this is my first policy", "upgrade": "upgrading existing cover", "compare_specific": "comparing specific plans", "tax_planning": "mainly for tax planning"}[p["primary_goal"]]
	loc = {"metro": "Bangalore", "tier1": "Pune", "tier2": "Indore", "tier3": "Bhilai"}[p["location_tier"]]
	parents = "yes, both parents" if p["parents_to_insure"] else "no, just me / family"
	cond = ", ".join(p["health_conditions"]) if p["health_conditions"] else "none"
	budget = {"under_15k": "under 15 thousand a year", "15k_30k": "15-30k", "30k_60k": "30-60k", "60k+": "more than 60k"}[p["budget_band"]]

	raws = [
	f"{age}",
	_deps_to_natural(deps),
	inc,
	cover,
	goal,
	loc,
	parents,
	cond,
	budget,
	]
	return [_stylize(r, p["style"], p["style_hedges"]) for r in raws]


	def _deps_to_natural(deps: str) -> str:
	return {
	"self": "just me",
	"self+spouse": "me and my wife",
	"self+spouse+kids": "me, wife, and two kids",
	"self+parents": "me and my parents",
	"self+spouse+kids+parents": "me, wife, kids, and parents",
	}.get(deps, deps)


	def _freeform_qs(p: dict[str, Any]) -> list[str]:
	"""10 policy Qs anchored on the persona's concerns."""
	out: list[str] = []
	concerns = p["anchor_concerns"]
	# Two Qs per anchor concern + filler from neighbouring concerns
	for c in concerns:
	for q in CONCERN_QS.get(c, []):
	out.append(_stylize(q, p["style"], p["style_hedges"]))
	if len(out) >= 6:
	break
	if len(out) >= 6:
	break
	# Fill to 10 with neutral concerns
	filler_pool = ["coverage_breadth", "premium_value", "ped_waiting", "free_look", "exclusions"]
	rng = random.Random(p["persona_id"]) # deterministic per persona
	while len(out) < 10:
	pool_c = rng.choice(filler_pool)
	candidates = CONCERN_QS.get(pool_c, [])
	if candidates:
	out.append(_stylize(rng.choice(candidates), p["style"], p["style_hedges"]))
	return out[:10]


	def _edge_cases(p: dict[str, Any]) -> list[str]:
	return [_stylize(e, p["style"], p["style_hedges"]) for e in EDGE_CASES]


	def _adversarial(p: dict[str, Any]) -> list[str]:
	return [_stylize(a, p["style"], p["style_hedges"]) for a in ADVERSARIAL]


	# ----------------------------------------------------------------------------
	# Style transforms
	# ----------------------------------------------------------------------------

	_HINGLISH_MAP = {
	"policy": "policy", "insurance": "insurance", # English loan-words stay
	"cover": "cover", "premium": "premium",
	"I": "main", "have": "hai", "want": "chahiye", "need": "chahiye",
	"what": "kya", "is": "hai", "the": "wo", "should": "karu",
	"first": "pehla", "buy": "buy", "tell": "batao", "me": "mujhe",
	"show": "dikhao", "compare": "compare kar do",
	}


	def _to_hinglish(text: str) -> str:
	words = text.split()
	out = []
	for w in words:
	bare = w.strip(".,?!:").lower()
	if bare in _HINGLISH_MAP:
	out.append(_HINGLISH_MAP[bare] + w[len(bare):])
	else:
	out.append(w)
	return " ".join(out)


	def _to_hindi_devanagari(text: str) -> str:
	"""Light transliteration sample — keeps policy/insurance words in English
	but flavours basic phrases. Real Hindi-primary users speak this way."""
	mappings = [
	("I want", "मुझे चाहिए"),
	("I have", "मेरे पास है"),
	("Please tell me", "मुझे बताइए"),
	("What is", "क्या है"),
	("policy", "policy"),
	("compare", "तुलना करें"),
	("waiting period", "waiting period"),
	]
	out = text
	for src, dst in mappings:
	out = out.replace(src, dst)
	return out


	def _stylize(text: str, style: str, hedges: list[str]) -> str:
	if style == "terse":
	words = text.split()
	return " ".join(words[:7]) + ("." if not words[0].endswith("?") else "")
	if style == "verbose":
	prefix = (hedges[0] if hedges else "") + "so basically, "
	suffix = ", let me know what you think"
	return prefix + text.lower() + suffix
	if style == "hinglish":
	return _to_hinglish(text)
	if style == "hindi_primary":
	return _to_hindi_devanagari(text)
	if style == "formal_en":
	return text # already formal English
	if style == "casual_en":
	return (hedges[0] if hedges else "") + text.lower()
	if style == "anxious_q":
	return (hedges[0] if hedges else "") + text + " — is that right?"
	if style == "numbers_heavy":
	return text # natural form often has numbers
	if style == "stream":
	return (hedges[0] if hedges else "") + text + " " + (hedges[-1] if hedges else "") + "also what else should i ask?"
	if style == "tester":
	return text + " (and don't make up the answer)"
	return text


	# ----------------------------------------------------------------------------
	# Composer
	# ----------------------------------------------------------------------------

	def build_flow(p: dict[str, Any]) -> list[str]:
	flow: list[str] = []
	flow.append(_opener(p)) # 1 opening
	flow.extend(_factfind_answers(p)) # 9 fact-find
	flow.extend(_freeform_qs(p)) # 10 free-form
	flow.extend(_edge_cases(p)) # 5 edge cases
	flow.extend(_adversarial(p)) # 5 adversarial + close
	assert len(flow) == 30, f"flow length {len(flow)} != 30 for {p['persona_id']}"
	return flow


	def main() -> None:
	root = Path(__file__).resolve().parent
	personas = json.loads((root / "personas.json").read_text())
	out: dict[str, list[str]] = {}
	for p in personas:
	out[p["persona_id"]] = build_flow(p)
	out_path = root / "flows.json"
	out_path.write_text(json.dumps(out, indent=2, ensure_ascii=False))
	total_turns = sum(len(v) for v in out.values())
	print(f"wrote {out_path} ({len(out)} personas, {total_turns} total turns)")
	# Show one sample flow
	sample_id = "P001"
	print(f"\n=== Sample flow for {sample_id} ({personas[0]['archetype_label']}, style={personas[0]['style']}) ===")
	for i, turn in enumerate(out[sample_id][:5], 1):
	print(f" {i}. {turn}")
	print(" ...")


	if __name__ == "__main__":
	main()