Spaces:

babaTEEpe
/

Toun

Sleeping

App Files Files Community

Toun / mission_engine.py

babaTEEpe

Update mission_engine.py

edb7e4d verified about 1 month ago

raw

history blame contribute delete

72.4 kB

	import time
	import logging
	import re
	from typing import List, Dict, Any, Optional
	from collections import deque
	from dataclasses import dataclass, field, asdict

	logger = logging.getLogger(__name__)

	@dataclass
	class ObservationEvent:
	    """One structured detection or event, in the schema shared by every source."""

	    # When the observation was made (ObservationBuffer compares this with time.time()).
	    timestamp: float
	    # Kind of observation: 'object', 'acoustic', 'caption' or 'relation'.
	    type: str
	    # Free-form payload, e.g. {label, color, count, bbox, confidence, ...}.
	    data: Dict[str, Any]
	    # Name of the producer: 'git_base', 'yolo', 'wavcap' or 'whisper'.
	    source: str
	    # Confidence attached to the event as a whole; 1.0 unless stated otherwise.
	    confidence: float = 1.0

	@dataclass
	class MissionRule:
	    """A single machine-readable requirement of a mission."""

	    # Rule domain, e.g. 'object' or 'audio'.
	    domain: str
	    # What to look or listen for: 'cat', 'person', 'gunshot', etc.
	    target: str
	    # Condition to verify; "exists" by default.
	    condition: str = "exists"
	    # Minimum confidence an observation needs to count.
	    threshold: float = 0.4
	    # Required attribute values, e.g. {color: "black", size: "large"}.
	    attributes: Dict[str, str] = field(default_factory=dict)
	    # Minimum number of instances, e.g. "group of people" → min_count=3.
	    min_count: int = 1
	    # Free-form extra information about the rule.
	    metadata: Dict[str, Any] = field(default_factory=dict)

	# ── Deterministic Mission Parser ──

	# Object vocabulary: every recognised word or synonym points at its canonical label.
	# The table is written as (canonical label, words) groups and flattened below;
	# group order fixes the key order of the resulting dict.
	_OBJECT_SYNONYM_GROUPS = (
	    # People
	    ("person", ("person", "people", "man", "woman", "boy", "girl", "child", "kid",
	                "human", "individual", "subject")),
	    # Vehicles
	    ("car", ("car", "vehicle", "automobile")),
	    ("truck", ("truck", "lorry")),
	    ("bus", ("bus",)),
	    ("motorcycle", ("motorcycle", "motorbike")),
	    ("bicycle", ("bike", "bicycle")),
	    ("boat", ("boat", "ship")),
	    ("airplane", ("airplane", "plane", "aircraft")),
	    # Animals
	    ("cat", ("cat", "kitten", "feline")),
	    ("dog", ("dog", "puppy", "canine")),
	    ("bird", ("bird",)),
	    ("horse", ("horse",)),
	    ("cow", ("cow", "cattle")),
	    ("sheep", ("sheep",)),
	    ("elephant", ("elephant",)),
	    ("bear", ("bear",)),
	    # Weapons / Threats
	    ("knife", ("knife", "blade")),
	    ("gun", ("gun", "pistol", "rifle", "firearm")),
	    ("knife", ("weapon", "sword")),  # "weapon" is a broad catch mapped to knife
	    # Objects
	    ("cell phone", ("phone", "cellphone", "mobile")),
	    ("laptop", ("laptop", "computer")),
	    ("backpack", ("backpack", "bag")),
	    ("umbrella", ("umbrella",)),
	    ("bottle", ("bottle",)),
	    ("chair", ("chair",)),
	    ("dining table", ("table", "desk")),
	    ("tv", ("tv", "television", "monitor")),
	    ("book", ("book",)),
	    ("clock", ("clock",)),
	    ("fire", ("fire", "flame")),
	    ("headphones", ("headphones", "headphone")),
	    ("glasses", ("glasses", "eyeglasses")),
	    ("shirt", ("shirt", "tshirt", "top")),
	    ("shoe", ("shoe", "shoes", "boot")),
	    ("pant", ("pant", "pants", "jeans")),
	    ("suit", ("suit", "jacket", "coat")),
	)

	OBJECT_VOCAB = {
	    word: canonical
	    for canonical, group_words in _OBJECT_SYNONYM_GROUPS
	    for word in group_words
	}

	# Audio event vocabulary: canonical acoustic label → the words that select it.
	_AUDIO_SYNONYMS = {
	    "gunshot": ("gunshot", "gunfire", "shooting"),
	    "explosion": ("explosion", "blast", "bang"),
	    "scream": ("scream", "screaming", "yelling"),
	    "siren": ("siren", "alarm"),
	    "speech": ("speech", "talking", "conversation"),
	    "music": ("music", "singing", "song"),
	    "barking": ("barking", "bark"),
	    "engine": ("engine", "motor"),
	    "footsteps": ("footsteps", "walking", "running"),
	    "glass_break": ("glass_break", "shatter"),
	    "crying": ("crying", "cry", "sobbing"),
	    "horn": ("horn", "honking"),
	    "thunder": ("thunder",),
	    "rain": ("rain",),
	    "wind": ("wind",),
	}

	# Flattened word → canonical label lookup, in the order listed above.
	AUDIO_VOCAB = {
	    word: canonical
	    for canonical, group_words in _AUDIO_SYNONYMS.items()
	    for word in group_words
	}

	# Color vocabulary: words treated as a color attribute when they occur in a prompt.
	COLOR_VOCAB = {
	    # Hues
	    "red", "orange", "yellow", "green", "blue", "purple", "pink", "brown",
	    # Neutrals and metallics
	    "black", "white", "gray", "grey", "silver", "gold",
	    # Brightness words
	    "dark", "light", "bright",
	}

	# Count vocabulary: quantity words and the minimum instance count each one implies.
	COUNT_VOCAB = {
	    # Collective / vague quantities
	    "group": 3,
	    "crowd": 5,
	    "many": 3,
	    "several": 3,
	    "few": 2,
	    "couple": 2,
	    "pair": 2,
	    "multiple": 2,
	    # Spelled-out numbers
	    "two": 2,
	    "three": 3,
	    "four": 4,
	    "five": 5,
	}

	# Category words: generic terms treated as "Soft Context", i.e. flexible/optional
	# when a specific target is also present.
	CATEGORY_WORDS = {
	    # Visual / acoustic categories
	    "color", "colors",
	    "sound", "sounds", "noise", "noises",
	    # Generic nouns
	    "object", "objects", "item", "items", "thing", "things",
	    # Happenings and cues
	    "activity", "event", "action", "sign", "signal",
	    # Perception / reporting words
	    "sense", "perceive", "detect", "finding", "report",
	}

	# Speech/transcription vocabulary (triggers Whisper).
	# Every trigger word maps to the single canonical action "transcribe".
	SPEECH_VOCAB = dict.fromkeys(
	    (
	        "say", "said", "saying",
	        "speak", "speaking", "spoken",
	        "tell", "telling", "told",
	        "transcribe", "transcript", "transcription",
	        "voice", "voices",
	        "words", "word",
	        "language", "dialogue", "dialog",
	        "quote", "mention",
	        "shout", "whisper", "yell",
	        "call", "called", "calling",
	    ),
	    "transcribe",
	)

	# ── Model Routing ──

	# For each rule domain, the models that have to run to serve it.
	DOMAIN_MODEL_MAP = dict(
	    object=["git_base", "yolo"],  # visual object detection
	    audio=["wavcap"],  # audio event detection
	    speech=["whisper"],  # speech transcription
	)

	# Models that run when no mission prompt is provided.
	DEFAULT_MODELS = {"wavcap", "git_base"}


	def route_models(rules: List[MissionRule]) -> set:
	    """
	    Work out which models have to run for a set of parsed mission rules.

	    With no rules (no prompt) a copy of DEFAULT_MODELS is returned. Otherwise the
	    result is the union of the DOMAIN_MODEL_MAP entries for every rule's domain;
	    a domain missing from the map contributes nothing.
	    """
	    if rules:
	        selected = set().union(
	            *(DOMAIN_MODEL_MAP.get(mission_rule.domain, []) for mission_rule in rules)
	        )
	        logger.info(f"[ROUTER] Domains: {set(r.domain for r in rules)} → Models: {selected}")
	        return selected

	    # Copy so that callers can mutate the result without touching the module constant.
	    return DEFAULT_MODELS.copy()


	def parse_mission(user_prompt: str) -> List[MissionRule]:
	    """
	    Hybrid Mission Interpreter: Rule Engine → Semantic LLM Injection.

	    The deterministic keyword parser always runs first. The LLM interpreter is
	    then asked for a target; if it names one that no keyword rule covers, an
	    extra rule (threshold 0.35, metadata source "semantic_llm") is appended.

	    The LLM step is best-effort: an empty prompt skips it, and a failing call or
	    an unusable answer leaves the keyword rules untouched instead of raising.

	    Args:
	        user_prompt: Free-text mission description.

	    Returns:
	        The keyword rules, plus at most one LLM-injected rule.
	    """
	    # 1. Keyword rules (fast, no model involved).
	    rules = _parse_mission_deterministic(user_prompt)

	    # An empty prompt means "no mission": keep the rule list empty so that
	    # route_models() falls back to the default models, and do not ask the LLM
	    # to interpret nothing.
	    if not user_prompt or not user_prompt.strip():
	        return rules

	    # 2. Semantic scan, run even when keywords matched, to pick up targets the
	    #    vocabularies do not know.
	    logger.info(f"[INTERPRETER] Performing semantic scan for '{user_prompt}'...")
	    from reasoning_engine import reasoning_engine
	    try:
	        intent = reasoning_engine.interpret_mission(user_prompt)
	    except Exception:
	        # The keyword rules are still valid; do not lose them to an LLM failure.
	        logger.exception("[INTERPRETER] Semantic scan failed; using keyword rules only.")
	        return rules

	    if not isinstance(intent, dict):
	        logger.warning(f"[INTERPRETER] Unusable semantic result {intent!r}; using keyword rules only.")
	        return rules

	    target = intent.get("target")
	    caps = intent.get("capabilities", [])
	    raw_attrs = intent.get("attributes")

	    # 3. Dynamic Rule Injection — only for a real, textual target.
	    if not isinstance(target, str):
	        return rules
	    target = target.strip()
	    if not target or target.lower() in ("none", "null"):
	        return rules

	    # Skip targets the keyword rules already cover.
	    if any(r.target.lower() == target.lower() for r in rules):
	        return rules

	    # Later checks win: a "speech" capability overrides "audio", which overrides
	    # the "object" default.
	    caps_text = str(caps).lower()
	    domain = "object"
	    if "audio" in caps_text:
	        domain = "audio"
	    if "speech" in caps_text:
	        domain = "speech"

	    # MissionRule.attributes is a str → str mapping and the evaluator lower-cases
	    # its values, so coerce whatever the LLM returned and drop empty entries.
	    attrs: Dict[str, str] = {}
	    if isinstance(raw_attrs, dict):
	        attrs = {str(k): str(v) for k, v in raw_attrs.items() if v is not None}

	    rules.append(MissionRule(
	        domain=domain,
	        target=target,
	        attributes=attrs,
	        threshold=0.35,  # Lower threshold for open-vocabulary LLM targets
	        metadata={"source": "semantic_llm"},
	    ))
	    logger.info(f"[SEMANTIC INJECTION] Created dynamic rule for target: '{target}'")

	    return rules

	def _parse_mission_deterministic(user_prompt: str) -> List[MissionRule]:
	    """
	    Deterministic keyword parser. Converts natural language into structured MissionRules.

	    No LLM involved. The prompt is lower-cased, punctuation is replaced by spaces,
	    and every word is looked up in OBJECT_VOCAB, AUDIO_VOCAB and SPEECH_VOCAB,
	    with a simple plural fallback ("dogs" → "dog", "buses" → "bus").

	    Args:
	        user_prompt: Free-text mission description.

	    Returns:
	        One rule per distinct canonical object label and audio label found, plus
	        at most one speech rule. If nothing matched, a single low-threshold
	        object rule built from the last word that is not a stop word. An empty
	        list for an empty or whitespace-only prompt.
	    """
	    if not user_prompt or not user_prompt.strip():
	        return []

	    # Replace punctuation with spaces so tokens line up with vocabulary keys.
	    words = re.sub(r'[^\w\s]', ' ', user_prompt.lower().strip()).split()

	    rules: List[MissionRule] = []
	    found_objects = set()
	    found_audio = set()

	    def lookup(word: str, vocab: dict) -> Optional[str]:
	        """Return the canonical label for `word`, trying plural stems as a fallback."""
	        if word in vocab:
	            return vocab[word]
	        # Four-letter plurals ("cats", "dogs", "cars", "guns") must be stemmed too.
	        # A stem only counts when it is itself a vocabulary key, so ordinary words
	        # ending in "s" ("this", "does") still do not match.
	        if len(word) > 3:
	            for suffix in ('es', 's'):
	                if word.endswith(suffix):
	                    stem = word[:-len(suffix)]
	                    if stem in vocab:
	                        return vocab[stem]
	        return None

	    # 1. Extract colors mentioned
	    colors_found = [w for w in words if w in COLOR_VOCAB]

	    # 2. Extract count/quantity — only the first quantity word is used.
	    min_count = 1
	    for word in words:
	        if word in COUNT_VOCAB:
	            min_count = max(min_count, COUNT_VOCAB[word])
	            break

	    # 3. Extract object targets
	    for word in words:
	        canonical = lookup(word, OBJECT_VOCAB)
	        if canonical and canonical not in found_objects:
	            found_objects.add(canonical)
	            attrs = {}
	            if colors_found:
	                # The first color in the prompt is attached to every object rule.
	                attrs["color"] = colors_found[0]
	            rules.append(MissionRule(
	                domain="object",
	                target=canonical,
	                attributes=attrs,
	                # The quantity is applied to people only.
	                min_count=min_count if canonical == "person" else 1,
	                threshold=0.4,
	            ))

	    # 4. Extract audio targets
	    for word in words:
	        canonical = lookup(word, AUDIO_VOCAB)
	        if canonical and canonical not in found_audio:
	            found_audio.add(canonical)
	            rules.append(MissionRule(
	                domain="audio",
	                target=canonical,
	                threshold=0.5,
	            ))

	    # 4b. A single speech rule if any word asks for transcription
	    if any(lookup(word, SPEECH_VOCAB) for word in words):
	        rules.append(MissionRule(
	            domain="speech",
	            target="transcribe",
	            threshold=0.3,
	        ))

	    # 5. Fallback: if nothing matched, try two-word keys.
	    #    This only fires for vocabulary keys that contain a space.
	    if not rules:
	        for first, second in zip(words, words[1:]):
	            bigram = f"{first} {second}"
	            if bigram in OBJECT_VOCAB:
	                canonical = OBJECT_VOCAB[bigram]
	                if canonical not in found_objects:
	                    found_objects.add(canonical)
	                    rules.append(MissionRule(domain="object", target=canonical))

	    # 6. Ultimate fallback: use the last noun-like word as an open-vocabulary target
	    if not rules:
	        stop_words = {"the", "for", "any", "sign", "find", "detect", "there", "with", "and", "are", "was", "has", "have"}
	        for word in reversed(words):
	            if len(word) > 2 and word not in stop_words:
	                rules.append(MissionRule(domain="object", target=word, threshold=0.3))
	                break

	    logger.info(f"[MISSION PARSER] '{user_prompt}' → {len(rules)} rules: {[(r.domain, r.target, r.attributes) for r in rules]}")
	    return rules


	class ObservationBuffer:
	    """
	    Rolling buffer for temporal reasoning across events.

	    Events are kept in arrival order. An event is dropped once its `timestamp`
	    is more than `window_seconds` older than the current `time.time()`.
	    """

	    def __init__(self, window_seconds: float = 10.0):
	        """Create an empty buffer that keeps events for `window_seconds` seconds."""
	        self.window_seconds = window_seconds
	        self.buffer: deque[ObservationEvent] = deque()

	    def add(self, event: ObservationEvent):
	        """Append `event`, then drop everything that has fallen out of the window."""
	        self.buffer.append(event)
	        self._prune()

	    def _prune(self):
	        """Pop expired events from the left (oldest) end of the buffer."""
	        now = time.time()
	        # Only the head is inspected, so pruning stops at the first event that
	        # is still inside the window.
	        while self.buffer and (now - self.buffer[0].timestamp > self.window_seconds):
	            self.buffer.popleft()

	    def get_all(self) -> List[ObservationEvent]:
	        """Return the events currently inside the window, oldest first, as a new list."""
	        # Prune on read as well: without this, a buffer that has not received a
	        # new event for a while would keep handing out expired observations.
	        self._prune()
	        return list(self.buffer)


	class MissionEvaluator:
	"""Deterministic logic engine for matching rules against observations."""
	def __init__(self):
	    """Start with no active rules and build the bidirectional concept lookup."""
	    self.active_rules: List[MissionRule] = []
	    # Expand the class-level CONCEPT_MAP once so that synonyms can be resolved
	    # in both directions.
	    mirrored_concepts = self._mirror_concept_map(self.CONCEPT_MAP)
	    self.concept_mirror = mirrored_concepts

	def _mirror_concept_map(self, original_map: Dict[str, List[str]]) -> Dict[str, set]:
	"""
	Hardens the CONCEPT_MAP by making it bidirectional and self-referential.
	If 'person' maps to 'human', then 'human' will now map to 'person'.
	"""
	mirrored = {}

	# 1. First, ensure every key is in its own list and create initial sets
	for key, synonyms in original_map.items():
	all_words = set(synonyms)
	all_words.add(key)

	if key not in mirrored:
	mirrored[key] = all_words
	else:
	mirrored[key].update(all_words)

	# 2. For every synonym, create a key if it doesn't exist and add the whole group
	for syn in synonyms:
	if syn not in mirrored:
	mirrored[syn] = all_words
	else:
	mirrored[syn].update(all_words)

	logger.info(f"[EVALUATOR] Semantic Mirroring complete. Expanded {len(original_map)} concepts into {len(mirrored)} bidirectional links.")
	return mirrored

	def set_rules(self, rules: List[MissionRule]):
	self.active_rules = rules

	def evaluate(self, world_state: Any) -> Dict[str, Any]:
	"""
	The Checkmate Engine: Performs a deterministic logical verification.
	Instead of scanning a fuzzy buffer, it checks the Mirror (WorldState)
	against the Blueprint (MissionRules).
	"""
	if not self.active_rules:
	return {
	"satisfied": False,
	"alerts": [],
	"status_message": "No active mission.",
	"mission_status": "none",
	"timestamp": time.time()
	}

	alerts = []
	entities = getattr(world_state, "entities", [])

	for rule in self.active_rules:
	# Check logic for each rule against the entire Entity Mirror
	match = self._checkmate_rule(rule, entities, world_state)
	if match:
	alerts.append(match)

	satisfied = len(alerts) >= len(self.active_rules) if self.active_rules else False

	if satisfied:
	alert_messages = [a.get('message', '') for a in alerts]
	status_message = "→ SENTINEL CHECKMATE: Mission purpose fulfilled."
	mission_status = "achieved"
	else:
	status_message = f"Monitoring... {len(alerts)}/{len(self.active_rules)} requirements satisfied."
	mission_status = "ongoing"

	return {
	"satisfied": satisfied,
	"alerts": alerts,
	"status_message": status_message,
	"mission_status": mission_status,
	"timestamp": time.time(),
	"score": len(alerts) / len(self.active_rules) if self.active_rules else 0
	}

	def _checkmate_rule(self, rule: MissionRule, entities: List[Dict[str, Any]], world_state: Any) -> Optional[Dict[str, Any]]:
	"""
	Performs the hard logical checkmate for a single mission rule.
	Checks BOTH standard entities (YOLO) AND specialist findings (color, terrain, audio).
	"""
	target = rule.target.lower()

	for entity in entities:
	e_type = str(entity.get("type", "")).lower()
	e_attrs = entity.get("attributes", {})
	e_conf = entity.get("confidence", 0.0)
	is_specialist = entity.get("finding_type") == "specialist"

	# ── Standard Entity Match (YOLO objects, GIT-base) ──
	if not is_specialist:
	# Guard: skip empty types and model-name types (e.g. "fire_analyst" != "fire")
	if not e_type or len(e_type) < 2:
	continue
	# Require exact word match, not substring (prevents "fire" matching "fire_analyst")
	e_type_words = set(e_type.replace("_", " ").split())
	target_words = set(target.replace("_", " ").split())
	if not (target_words & e_type_words) and target != e_type:
	continue
	if e_conf < rule.threshold: continue
	# Attribute constraint check
	if rule.attributes:
	match_attr = True
	for attr_key, attr_val in rule.attributes.items():
	e_val = str(e_attrs.get(attr_key, "")).lower()
	if attr_val.lower() not in e_val:
	match_attr = False
	break
	if not match_attr: continue
	return {
	"alert": True, "type": "checkmate_match",
	"message": f"Verified target '{target}' in world state.",
	"entity": entity, "confidence": e_conf
	}

	# ── Specialist Finding Match ──
	else:
	# Check 1: Direct value match (e.g. color value = "brown", terrain = "forest")
	attr_value = str(e_attrs.get("value", "")).lower()
	if target in attr_value or attr_value in target:
	return {
	"alert": True, "type": "specialist_match",
	"message": f"Specialist confirmed: '{target}' detected ({attr_value}).",
	"entity": entity, "confidence": e_conf
	}

	# Check 2: Attribute type with value verification
	# Only match if the target is found in the actual detected VALUE, not just the attribute type
	attr_type = str(e_attrs.get("attribute", "")).lower()
	if attr_type and target != attr_type:
	# Target is specific (e.g. "red") and attribute type is generic (e.g. "color")
	# Check if the detected value matches the target
	if target in attr_value or attr_value in target:
	return {
	"alert": True, "type": "specialist_match",
	"message": f"Specialist confirmed '{attr_type}' value '{attr_value}' matches target '{target}'.",
	"entity": entity, "confidence": e_conf
	}

	# Check 3: Explanation text contains target (broad fallback)
	explanation = str(e_attrs.get("explanation", "")).lower()
	if target in explanation:
	# HARDENED CHECK: Ensure it's not a negative report (e.g. "No human detected")
	negatives = ["no ", "not ", "none ", "zero ", "missing", "unavailable", "0 "]
	is_negative = False
	for neg in negatives:
	# Check if negative word appears shortly before the target
	idx = explanation.find(target)
	snippet = explanation[max(0, idx-20):idx]
	if neg in snippet:
	is_negative = True
	break

	if not is_negative:
	return {
	"alert": True, "type": "specialist_match",
	"message": f"Specialist report contains reference to '{target}'.",
	"entity": entity, "confidence": e_conf
	}

	# Fallback: Audio domain check
	if rule.domain == 'audio':
	for entity in entities:
	if entity.get("type") == "acoustic_event":
	e_label = str(entity.get("attributes", {}).get("label", "")).lower()
	if target in e_label:
	return {"alert": True, "message": f"Acoustic confirmed: {target}", "entity": entity}

	return None

	# ── SEMANTIC CONCEPT MAP ──
	# Maps abstract mission concepts to concrete keywords that specialist models might report.
	# The MORE entries here, the smarter the Checkmate becomes at understanding natural language.
	CONCEPT_MAP = {
	# ═══════════════════════════════════════════
	# THREAT / DANGER / EMERGENCY
	# ═══════════════════════════════════════════
	"danger": ["knife", "gun", "weapon", "fire", "flame", "blood", "fight", "alarm", "scream", "explosion", "threat", "attack", "violence", "aggressive", "sword", "pistol", "rifle", "crash", "collision", "smoke", "broken", "falling", "injured", "hazard", "threat"],
	"threat": ["knife", "gun", "weapon", "fire", "blood", "fight", "alarm", "scream", "explosion", "attack", "violence", "aggressive", "intruder", "suspicious", "trespassing", "masked", "hooded", "danger", "hostile"],
	"emergency": ["fire", "smoke", "alarm", "siren", "scream", "crash", "explosion", "injured", "blood", "ambulance", "fallen", "collapse", "unconscious", "drowning", "critical"],
	"accident": ["crash", "collision", "fall", "fallen", "broken", "blood", "damage", "wreck", "injury", "injured", "ambulance", "fire", "smoke", "shattered", "debris", "impact", "overturned", "dent"],
	"crime": ["knife", "gun", "weapon", "masked", "hooded", "stealing", "robbery", "intruder", "trespassing", "suspicious", "fight", "assault", "vandalism", "break-in", "threat"],
	"weapon": ["knife", "gun", "pistol", "rifle", "sword", "blade", "firearm", "machete", "bat", "club", "axe", "hammer"],
	"violence": ["fight", "fighting", "attack", "punch", "kick", "aggressive", "blood", "weapon", "assault", "struggle", "thrown", "hit", "slap"],
	"intrusion": ["intruder", "trespassing", "unauthorized", "stranger", "suspicious", "break-in", "forced entry", "masked", "hooded", "sneaking"],
	"suspicious": ["suspicious", "lurking", "hiding", "sneaking", "masked", "hooded", "loitering", "unusual", "strange", "watching"],
	"hazard": ["fire", "smoke", "chemical", "spill", "leak", "gas", "electrical", "wire", "flooding", "slippery", "obstacle", "debris"],
	"risk": ["knife", "gun", "fire", "fall", "height", "speed", "chemical", "explosion", "collision", "electrical", "drowning"],

	# ═══════════════════════════════════════════
	# HUMAN ACTIVITIES & ACTIONS
	# ═══════════════════════════════════════════
	"activity": ["walking", "running", "sitting", "standing", "holding", "moving", "talking", "eating", "drinking", "working", "playing", "reading", "typing", "cooking", "cleaning", "dancing", "exercising", "sleeping", "lying", "writing", "person", "man", "woman", "human", "subject", "individual", "boy", "girl", "child", "people"],
	"movement": ["walking", "running", "moving", "jumping", "climbing", "crawling", "dancing", "jogging", "sprinting", "stepping", "marching", "pacing", "sliding"],
	"interaction": ["talking", "speaking", "shaking hands", "hugging", "fighting", "pointing", "waving", "greeting", "kissing", "arguing", "collaborating"],
	"working": ["typing", "writing", "computer", "laptop", "desk", "phone", "meeting", "office", "paperwork", "keyboard", "tool", "construction"],
	"eating": ["eating", "food", "drinking", "cup", "glass", "plate", "fork", "spoon", "restaurant", "kitchen", "cooking", "meal", "snack", "chewing"],
	"exercising": ["running", "jogging", "pushup", "jumping", "stretching", "yoga", "gym", "weights", "fitness", "workout", "training", "sport"],
	"sleeping": ["sleeping", "lying", "bed", "resting", "napping", "pillow", "blanket", "unconscious", "eyes closed", "still"],
	"cooking": ["cooking", "stove", "pan", "pot", "kitchen", "chopping", "stirring", "baking", "oven", "food", "ingredient"],
	"cleaning": ["cleaning", "sweeping", "mopping", "wiping", "washing", "scrubbing", "vacuum", "broom", "dust", "spray"],
	"reading": ["reading", "book", "newspaper", "magazine", "screen", "text", "letter", "document", "page"],
	"driving": ["driving", "steering", "car", "vehicle", "road", "wheel", "dashboard", "seat", "traffic"],
	"talking": ["talking", "speaking", "conversation", "voice", "phone", "call", "discussion", "chat", "dialogue"],
	"speech": ["speaking", "talking", "conversation", "voice", "dialogue", "said", "spoke", "shouted", "whispered"],
	"voice": ["speaking", "talking", "voice", "audio", "vocal", "speech", "shout", "whisper"],
	"waiting": ["standing", "sitting", "still", "idle", "waiting", "stationary", "motionless", "paused"],
	"running": ["running", "sprinting", "jogging", "moving fast", "chasing", "fleeing", "rushing"],
	"fighting": ["fighting", "punching", "kicking", "wrestling", "struggle", "attack", "hit", "aggressive", "violent"],

	# ═══════════════════════════════════════════
	# EMOTIONS / BEHAVIOR
	# ═══════════════════════════════════════════
	"happy": ["smiling", "laughing", "smile", "joyful", "cheerful", "celebrating", "clapping", "excited"],
	"sad": ["crying", "tears", "sobbing", "depressed", "frown", "head down", "mourning"],
	"angry": ["aggressive", "shouting", "yelling", "fist", "fighting", "threatening", "confrontation", "furious"],
	"scared": ["screaming", "running", "hiding", "trembling", "panicked", "frightened", "cowering"],
	"calm": ["sitting", "standing", "still", "relaxed", "peaceful", "quiet", "resting"],
	"confused": ["looking around", "scratching head", "lost", "disoriented", "wandering"],
	"celebration": ["clapping", "cheering", "dancing", "jumping", "waving", "party", "balloons", "cake", "confetti"],

	# ═══════════════════════════════════════════
	# PEOPLE / IDENTITY
	# ═══════════════════════════════════════════
	"human": ["human", "person", "man", "woman", "subject", "individual", "boy", "girl", "child", "people"],
	"person": ["person", "man", "woman", "human", "subject", "individual", "boy", "girl", "child", "people", "face", "standing", "walking", "sitting"],
	"man": ["man", "male", "guy", "boy", "gentleman", "person"],
	"woman": ["woman", "female", "lady", "girl", "person"],
	"child": ["child", "kid", "baby", "boy", "girl", "infant", "toddler", "young"],
	"crowd": ["people", "group", "crowd", "gathering", "multiple", "several", "audience", "assembly", "line", "queue"],
	"face": ["face", "facial", "biometric", "identity", "recognized", "detected face", "eyes", "mouth", "nose", "forehead"],
	"identity": ["face", "facial", "biometric", "recognized", "identified", "known", "unknown", "stranger", "authorized"],
	"stranger": ["unknown", "unrecognized", "unauthorized", "stranger", "unfamiliar", "not identified"],
	"uniform": ["uniform", "vest", "helmet", "badge", "safety gear", "hi-vis", "reflective", "hardhat"],
	"mask": ["mask", "masked", "face covering", "balaclava", "surgical mask", "respirator"],

	# ═══════════════════════════════════════════
	# BODY LANGUAGE / POSE / GESTURE
	# ═══════════════════════════════════════════
	"gesture": ["hand", "gesture", "pointing", "waving", "thumbs", "fist", "sign language", "beckoning", "raised hand", "peace sign", "ok sign"],
	"pose": ["standing", "sitting", "lying", "crouching", "walking", "running", "active", "kneeling", "bending", "leaning", "squatting"],
	"standing": ["standing", "upright", "erect", "vertical", "on feet", "stationary"],
	"sitting": ["sitting", "seated", "chair", "bench", "cross-legged", "slouching"],
	"lying": ["lying", "prone", "supine", "on ground", "fallen", "collapsed", "horizontal", "flat"],
	"kneeling": ["kneeling", "on knees", "crouching", "bent", "bowing"],
	"pointing": ["pointing", "directing", "indicating", "finger", "aimed", "showing"],
	"waving": ["waving", "hand up", "greeting", "flagging", "signaling"],
	"handshake": ["handshake", "shaking hands", "greeting", "agreement", "meeting"],

	# ═══════════════════════════════════════════
	# ENVIRONMENT / LOCATION / SCENE
	# ═══════════════════════════════════════════
	"indoor": ["room", "bathroom", "kitchen", "office", "bedroom", "hallway", "corridor", "building", "interior", "inside", "lobby", "warehouse", "garage", "basement", "attic"],
	"outdoor": ["street", "road", "field", "forest", "park", "garden", "sky", "mountain", "beach", "lake", "river", "highway", "parking", "yard", "sidewalk", "pathway"],
	"room": ["room", "wall", "floor", "ceiling", "door", "window", "furniture", "light", "interior", "indoor"],
	"bathroom": ["bathroom", "toilet", "sink", "shower", "mirror", "tile", "faucet", "bath"],
	"kitchen": ["kitchen", "stove", "oven", "refrigerator", "counter", "cabinet", "cooking", "pot", "pan", "sink"],
	"office": ["office", "desk", "computer", "monitor", "keyboard", "chair", "cubicle", "meeting room", "whiteboard"],
	"bedroom": ["bedroom", "bed", "pillow", "blanket", "nightstand", "closet", "wardrobe", "mattress"],
	"street": ["street", "road", "sidewalk", "pavement", "intersection", "crosswalk", "traffic", "lane", "highway"],
	"forest": ["forest", "tree", "trees", "woods", "woodland", "jungle", "vegetation", "leaf", "branch", "nature"],
	"beach": ["beach", "sand", "ocean", "sea", "wave", "shore", "coast", "surfing", "sunbathing"],
	"parking": ["parking", "car park", "garage", "lot", "vehicle", "parked", "space"],
	"construction": ["construction", "building site", "crane", "scaffold", "hard hat", "cement", "brick", "steel", "foundation"],
	"hospital": ["hospital", "medical", "nurse", "doctor", "patient", "bed", "stretcher", "ambulance", "IV", "bandage"],
	"school": ["school", "classroom", "student", "teacher", "desk", "board", "backpack", "book", "education"],
	"store": ["store", "shop", "retail", "shelf", "product", "checkout", "counter", "customer", "aisle", "mall"],
	"warehouse": ["warehouse", "storage", "boxes", "pallets", "shelving", "industrial", "loading dock", "forklift"],

	# ═══════════════════════════════════════════
	# FIRE / SMOKE / THERMAL
	# ═══════════════════════════════════════════
	"fire": ["fire", "flame", "smoke", "burning", "thermal", "heat", "blaze", "inferno", "ember", "ignite", "combustion", "wildfire"],
	"smoke": ["smoke", "smoking", "fumes", "haze", "smog", "fog", "mist", "steam", "vapor"],
	"explosion": ["explosion", "blast", "bomb", "detonation", "fireworks", "burst", "shockwave"],
	"hot": ["fire", "flame", "heat", "thermal", "burning", "hot", "warm", "boiling", "steam"],

	# ═══════════════════════════════════════════
	# WEATHER / NATURE
	# ═══════════════════════════════════════════
	"weather": ["rain", "snow", "wind", "storm", "cloud", "sunny", "fog", "lightning", "thunder", "hail", "drizzle"],
	"rain": ["rain", "raining", "wet", "puddle", "umbrella", "drizzle", "downpour", "storm"],
	"snow": ["snow", "snowing", "ice", "icy", "frost", "frozen", "cold", "blizzard", "snowflake", "slippery"],
	"wind": ["wind", "windy", "blowing", "gust", "breeze", "tornado", "hurricane", "storm"],
	"night": ["dark", "night", "dim", "low light", "moonlight", "shadow", "darkness", "nighttime"],
	"day": ["bright", "daylight", "sunny", "sunlight", "daytime", "clear", "morning", "afternoon"],
	"flood": ["flood", "flooding", "water", "submerged", "rising water", "overflow", "dam", "rain"],

	# ═══════════════════════════════════════════
	# VEHICLES / TRANSPORT
	# ═══════════════════════════════════════════
	"vehicle": ["car", "truck", "bus", "motorcycle", "bicycle", "van", "vehicle", "suv", "taxi", "ambulance"],
	"car": ["car", "sedan", "automobile", "vehicle", "driving", "parked", "suv", "hatchback"],
	"truck": ["truck", "lorry", "semi", "trailer", "freight", "hauling", "delivery"],
	"motorcycle": ["motorcycle", "motorbike", "scooter", "moped", "biker", "helmet", "two-wheeler"],
	"bicycle": ["bicycle", "bike", "cycling", "cyclist", "pedal", "wheel", "handlebar"],
	"bus": ["bus", "transit", "public transport", "shuttle", "coach", "school bus"],
	"train": ["train", "railway", "railroad", "locomotive", "subway", "metro", "tram", "platform", "tracks"],
	"airplane": ["airplane", "plane", "aircraft", "jet", "flying", "airport", "runway", "helicopter"],
	"boat": ["boat", "ship", "vessel", "yacht", "canoe", "kayak", "ferry", "cruise", "sailing"],
	"helicopter": ["helicopter", "chopper", "rotor", "hovering", "aerial", "helipad"],

	# ═══════════════════════════════════════════
	# ANIMALS
	# ═══════════════════════════════════════════
	"animal": ["dog", "cat", "bird", "horse", "animal", "cow", "sheep", "goat", "pig", "rabbit", "deer", "bear", "elephant", "lion", "tiger", "snake", "fish", "chicken", "duck", "monkey"],
	"dog": ["dog", "puppy", "canine", "barking", "bark", "retriever", "shepherd", "bulldog", "poodle"],
	"cat": ["cat", "kitten", "feline", "meowing", "purring", "tabby", "siamese"],
	"bird": ["bird", "flying", "wings", "feathers", "chirping", "eagle", "hawk", "pigeon", "parrot", "crow", "sparrow", "owl"],
	"horse": ["horse", "stallion", "mare", "pony", "galloping", "riding", "equine", "saddle"],
	"pet": ["dog", "cat", "pet", "hamster", "rabbit", "fish", "parrot", "turtle", "guinea pig"],
	"insect": ["insect", "bug", "ant", "bee", "spider", "fly", "mosquito", "butterfly", "moth", "beetle", "cockroach"],
	"wildlife": ["deer", "bear", "wolf", "fox", "eagle", "snake", "lion", "tiger", "elephant", "monkey", "wild"],

	# ═══════════════════════════════════════════
	# OBJECTS / ITEMS
	# ═══════════════════════════════════════════
	"phone": ["phone", "cell phone", "mobile", "smartphone", "device", "screen", "calling", "texting"],
	"computer": ["computer", "laptop", "monitor", "screen", "keyboard", "mouse", "desktop", "typing"],
	"furniture": ["chair", "table", "desk", "couch", "sofa", "shelf", "cabinet", "bed", "drawer", "bookcase"],
	"bag": ["bag", "backpack", "suitcase", "purse", "handbag", "luggage", "briefcase", "duffel"],
	"bottle": ["bottle", "water bottle", "container", "jar", "glass", "cup", "mug", "flask"],
	"book": ["book", "novel", "textbook", "notebook", "magazine", "newspaper", "journal", "document", "paper"],
	"umbrella": ["umbrella", "parasol", "rain cover", "canopy"],
	"clock": ["clock", "time", "watch", "timer", "alarm clock", "countdown"],
	"key": ["key", "keychain", "lock", "padlock", "unlock", "access"],
	"tool": ["tool", "hammer", "screwdriver", "wrench", "pliers", "drill", "saw", "equipment"],
	"ball": ["ball", "soccer", "football", "basketball", "tennis", "baseball", "golf", "volleyball"],
	"helmet": ["helmet", "hard hat", "safety helmet", "motorcycle helmet", "bike helmet", "head protection"],
	"glasses": ["glasses", "eyeglasses", "sunglasses", "spectacles", "goggles", "lens"],
	"hat": ["hat", "cap", "beanie", "hood", "visor", "turban", "headband", "headwear"],

	# ═══════════════════════════════════════════
	# TEXT / SIGNAGE / OCR
	# ═══════════════════════════════════════════
	"text": ["text", "sign", "letter", "word", "writing", "label", "ocr", "read", "printed", "typed", "handwritten", "inscription"],
	"sign": ["sign", "text", "label", "warning", "notice", "banner", "writing", "poster", "billboard", "placard", "signage"],
	"license": ["license plate", "number plate", "registration", "plate", "tag"],
	"label": ["label", "tag", "sticker", "price", "brand", "product name", "barcode"],
	"graffiti": ["graffiti", "spray paint", "vandalism", "art", "mural", "tags", "street art"],
	"color": ["color", "colors", "red", "blue", "green", "yellow", "white", "black", "orange", "purple", "pink", "brown", "gray", "grey", "silver"],
	"colors": ["color", "colors", "red", "blue", "green", "yellow", "white", "black", "orange", "purple", "pink", "brown", "gray", "grey", "silver"],

	# ═══════════════════════════════════════════
	# COLORS (Direct + Synonyms + "-ish" variants)
	# ═══════════════════════════════════════════
	"red": ["red", "crimson", "scarlet", "ruby", "maroon", "burgundy", "vermillion", "reddish"],
	"reddish": ["red", "reddish", "crimson", "scarlet", "ruby", "maroon"],
	"blue": ["blue", "navy", "azure", "cobalt", "cyan", "teal", "sapphire", "indigo", "bluish"],
	"bluish": ["blue", "bluish", "navy", "azure", "cobalt", "cyan", "teal"],
	"green": ["green", "lime", "emerald", "olive", "sage", "mint", "forest green", "jade", "greenish"],
	"greenish": ["green", "greenish", "lime", "emerald", "olive"],
	"yellow": ["yellow", "gold", "golden", "amber", "lemon", "mustard", "canary", "yellowish"],
	"yellowish": ["yellow", "yellowish", "gold", "golden", "amber"],
	"black": ["black", "dark", "ebony", "onyx", "charcoal", "jet black", "blackish"],
	"blackish": ["black", "blackish", "dark", "ebony", "charcoal"],
	"white": ["white", "ivory", "cream", "snow", "pearl", "bright white", "whitish"],
	"whitish": ["white", "whitish", "ivory", "cream"],
	"orange": ["orange", "tangerine", "coral", "peach", "amber", "rust", "orangish"],
	"orangish": ["orange", "orangish", "tangerine", "coral"],
	"purple": ["purple", "violet", "lavender", "plum", "magenta", "mauve", "lilac", "purplish"],
	"purplish": ["purple", "purplish", "violet", "lavender", "plum", "magenta"],
	"pink": ["pink", "rose", "salmon", "fuchsia", "blush", "magenta", "hot pink", "pinkish"],
	"pinkish": ["pink", "pinkish", "rose", "salmon", "fuchsia"],
	"brown": ["brown", "tan", "beige", "chocolate", "khaki", "chestnut", "coffee", "walnut", "brownish"],
	"brownish": ["brown", "brownish", "tan", "beige", "chocolate"],
	"gray": ["gray", "grey", "silver", "charcoal", "slate", "ash", "pewter", "grayish", "greyish"],
	"grey": ["gray", "grey", "silver", "charcoal", "slate", "ash", "pewter", "grayish", "greyish"],
	"grayish": ["gray", "grey", "grayish", "greyish", "silver", "charcoal"],
	"greyish": ["gray", "grey", "grayish", "greyish", "silver", "charcoal"],
	"silver": ["silver", "metallic", "chrome", "steel", "aluminum", "shiny", "reflective"],
	"gold": ["gold", "golden", "gilded", "brass", "amber"],
	"golden": ["gold", "golden", "gilded", "brass", "amber"],
	"bright": ["bright", "vivid", "vibrant", "neon", "fluorescent", "glowing", "luminous", "colorful"],
	"dark": ["dark", "dim", "shadow", "black", "night", "low light", "murky", "gloomy"],
	"colorful": ["colorful", "multicolor", "rainbow", "bright", "vivid", "vibrant", "varied colors"],

	# ═══════════════════════════════════════════
	# DEPTH / DISTANCE / SPATIAL
	# ═══════════════════════════════════════════
	"depth": ["depth", "near", "far", "close", "distant", "range", "obstacle", "clearance", "distance", "proximity"],
	"close": ["near", "close range", "close", "immediate", "proximity", "adjacent", "beside", "nearby"],
	"far": ["far", "distant", "remote", "away", "long range", "horizon"],
	"obstacle": ["wall", "door", "furniture", "chair", "table", "close range", "near", "barrier", "blocked", "obstruction", "fence", "gate"],
	"distance": ["near", "far", "close", "distant", "range", "meters", "feet", "depth", "proximity"],
	"height": ["tall", "high", "elevated", "above", "overhead", "ceiling", "tower", "roof", "floor"],
	"crowded": ["crowded", "packed", "busy", "congested", "full", "dense", "many people", "occupied"],
	"empty": ["empty", "vacant", "clear", "unoccupied", "deserted", "abandoned", "bare", "hollow"],

	# ═══════════════════════════════════════════
	# AUDIO EVENTS / SOUNDS
	# ═══════════════════════════════════════════
	"noise": ["engine", "grinding", "mechanical", "hissing", "scraping", "clanking", "buzzing", "humming", "rattling", "banging", "crashing"],
	"speech": ["speech", "talking", "speaking", "voice", "conversation", "dialogue", "words", "verbal", "announcement", "narration"],
	"music": ["music", "singing", "song", "melody", "instrument", "playing", "beats", "rhythm", "piano", "guitar", "drum", "bass"],
	"alarm": ["alarm", "siren", "beep", "alert", "warning", "horn", "buzzer", "ring"],
	"scream": ["scream", "screaming", "shriek", "yell", "shout", "cry", "help", "distress"],
	"gunshot": ["gunshot", "gunfire", "shooting", "bang", "shot", "firearm", "bullet"],
	"engine": ["engine", "motor", "revving", "idling", "mechanical", "vehicle", "car engine", "machine"],
	"glass": ["glass", "shatter", "breaking", "smash", "crack", "broken glass"],
	"footsteps": ["footsteps", "walking", "running", "steps", "march", "stomp", "pacing"],
	"barking": ["barking", "bark", "dog", "growl", "howl", "yelp", "whine"],
	"crying": ["crying", "cry", "sobbing", "weeping", "whimpering", "wailing", "tears"],
	"laughter": ["laughter", "laughing", "chuckle", "giggle", "funny", "comedy"],
	"thunder": ["thunder", "lightning", "storm", "rumble", "boom"],
	"knock": ["knock", "knocking", "door", "bang", "tap", "rapping"],
	"horn": ["horn", "honking", "beep", "car horn", "truck horn", "signal"],
	"whistle": ["whistle", "whistling", "wind", "referee", "train whistle", "signal"],
	"clapping": ["clapping", "applause", "clap", "ovation", "cheering"],
	"silence": ["quiet", "silent", "no sound", "calm", "peaceful", "still", "mute"],
	"loud": ["loud", "noisy", "deafening", "blaring", "booming", "roaring", "thunderous"],

	# ═══════════════════════════════════════════
	# SECURITY & SURVEILLANCE
	# ═══════════════════════════════════════════
	"security": ["guard", "camera", "surveillance", "monitor", "patrol", "fence", "gate", "badge", "uniform", "checkpoint", "authorized"],
	"authorized": ["authorized", "identified", "recognized", "known", "verified", "approved", "cleared", "valid"],
	"unauthorized": ["unauthorized", "unknown", "unrecognized", "stranger", "intruder", "trespassing", "invalid", "denied"],
	"patrol": ["walking", "guard", "patrol", "route", "perimeter", "monitoring", "surveillance", "rounds"],
	"trespassing": ["trespassing", "intruder", "unauthorized", "fence", "gate", "boundary", "restricted", "prohibited"],
	"surveillance": ["camera", "monitor", "watching", "recording", "cctv", "footage", "surveillance", "tracking"],
	"perimeter": ["fence", "wall", "gate", "boundary", "border", "barrier", "perimeter", "edge"],

	# ═══════════════════════════════════════════
	# MEDICAL / HEALTH
	# ═══════════════════════════════════════════
	"injury": ["blood", "wound", "cut", "bruise", "broken", "injured", "hurt", "bandage", "first aid", "trauma"],
	"medical": ["hospital", "doctor", "nurse", "ambulance", "stretcher", "medicine", "pills", "injection", "stethoscope", "mask"],
	"unconscious": ["unconscious", "fainted", "collapsed", "lying", "unresponsive", "still", "fallen", "motionless"],
	"bleeding": ["blood", "bleeding", "wound", "cut", "injury", "red", "bandage"],
	"fall": ["fall", "fallen", "collapsed", "on ground", "trip", "stumble", "slip", "lying down", "tumble"],

	# ═══════════════════════════════════════════
	# CLOTHING / APPEARANCE
	# ═══════════════════════════════════════════
	"clothing": ["shirt", "pants", "jacket", "coat", "dress", "skirt", "suit", "uniform", "shoes", "boots", "hat", "cap", "vest", "hoodie", "sweater"],
	"shirt": ["shirt", "t-shirt", "top", "blouse", "polo", "jersey", "tank top"],
	"pants": ["pants", "jeans", "trousers", "shorts", "leggings", "sweatpants"],
	"jacket": ["jacket", "coat", "blazer", "hoodie", "sweater", "cardigan", "vest", "parka"],
	"shoes": ["shoes", "boots", "sneakers", "sandals", "heels", "slippers", "footwear"],
	"helmet": ["helmet", "hard hat", "safety helmet", "motorcycle helmet", "bike helmet"],

	# ═══════════════════════════════════════════
	# FOOD / KITCHEN
	# ═══════════════════════════════════════════
	"food": ["food", "meal", "plate", "dish", "fruit", "vegetable", "meat", "bread", "rice", "pasta", "pizza", "burger", "sandwich", "snack", "dessert", "cake", "salad"],
	"drink": ["drink", "water", "coffee", "tea", "juice", "soda", "beer", "wine", "cup", "glass", "bottle", "mug"],

	# ═══════════════════════════════════════════
	# SPORTS / FITNESS
	# ═══════════════════════════════════════════
	"sports": ["ball", "soccer", "football", "basketball", "tennis", "baseball", "running", "swimming", "cycling", "boxing", "wrestling", "gym", "stadium", "field", "court"],
	"swimming": ["swimming", "pool", "water", "diving", "swimmer", "stroke", "float", "splash"],
	"boxing": ["boxing", "punching", "gloves", "ring", "fight", "knockout", "sparring"],

	# ═══════════════════════════════════════════
	# TECHNOLOGY / ELECTRONICS
	# ═══════════════════════════════════════════
	"screen": ["screen", "monitor", "display", "tv", "television", "phone", "tablet", "laptop", "computer"],
	"camera": ["camera", "lens", "photo", "photography", "recording", "video", "flash", "tripod"],
	"robot": ["robot", "drone", "machine", "automated", "mechanical", "ai", "sensor"],
	"drone": ["drone", "quadcopter", "uav", "flying", "aerial", "remote control", "propeller"],

	# ═══════════════════════════════════════════
	# MATERIALS / SURFACES
	# ═══════════════════════════════════════════
	"metal": ["metal", "steel", "iron", "aluminum", "copper", "brass", "chrome", "metallic", "shiny"],
	"wood": ["wood", "wooden", "timber", "plank", "board", "log", "oak", "pine", "mahogany"],
	"glass": ["glass", "window", "transparent", "mirror", "reflection", "crystal", "pane"],
	"fabric": ["fabric", "cloth", "textile", "cotton", "silk", "polyester", "linen", "wool", "leather"],
	"concrete": ["concrete", "cement", "stone", "brick", "pavement", "asphalt", "gravel"],
	"plastic": ["plastic", "polymer", "synthetic", "container", "wrap", "packaging"],

	# ═══════════════════════════════════════════
	# LIGHT / VISIBILITY
	# ═══════════════════════════════════════════
	"light": ["light", "bright", "lamp", "bulb", "flashlight", "spotlight", "illuminated", "glowing", "lit"],
	"shadow": ["shadow", "dark", "dim", "shade", "silhouette", "backlit", "contrast"],
	"reflection": ["reflection", "mirror", "glass", "shiny", "glossy", "polished", "reflective"],
	"fog": ["fog", "mist", "haze", "smog", "cloudy", "visibility", "obscured", "blurry"],

	# ═══════════════════════════════════════════
	# QUANTITY / COUNT
	# ═══════════════════════════════════════════
	"many": ["many", "multiple", "several", "group", "crowd", "numerous", "various", "lots"],
	"few": ["few", "couple", "pair", "some", "handful"],
	"single": ["single", "one", "alone", "solo", "individual", "lone", "solitary"],
	"none": ["none", "empty", "no", "zero", "absent", "missing", "not found", "not detected"],
	}


	def caption_checkmate(self, mission_prompt: str, specialist_captions: List[Dict[str, str]]) -> Dict[str, Any]:
	    """
	    Smart Checkmate: verify mission objectives against specialist captions.

	    1. Split the prompt into individual objectives.
	    2. For each objective, scan ALL captions for a keyword/semantic match.
	    3. Return a checklist (✅/❌ per objective) together with the evidence.

	    Args:
	        mission_prompt: The user's original mission text.
	        specialist_captions: List of report dicts, e.g.
	            {"model": "color_expert", "caption": "Dominant colors: red (23%)"}.
	            The text is read from "caption", then "status", then
	            "explanation" (first non-empty value wins).

	    Returns:
	        {
	            "mission_status": "achieved" | "partially_achieved" | "searching",
	            "score": float (0.0-1.0, rounded to 2 decimals),
	            "objectives": [{"text": ..., "satisfied": bool,
	                            "evidence": str | None, "matched_by": str | None}],
	            "status_message": str,
	            "satisfied": bool  # True as soon as ANY objective matched
	        }
	    """
	    if not mission_prompt or not specialist_captions:
	        # Same key set as the normal return so callers can always read
	        # result["satisfied"] without a KeyError.
	        return {
	            "mission_status": "searching",
	            "score": 0.0,
	            "objectives": [],
	            "status_message": "Awaiting specialist reports...",
	            "satisfied": False,
	        }

	    # --- STEP 1: Split prompt into objectives ---
	    objectives = self._split_objectives(mission_prompt)
	    logger.info("[SMART CHECKMATE] Parsed %d objectives from prompt: %s", len(objectives), objectives)

	    # --- STEP 2: Collect the searchable caption entries ---
	    caption_entries = []
	    for cap in specialist_captions:
	        model = cap.get("model", "unknown")
	        # Specialists are not uniform: some report under 'status' or 'explanation'.
	        text = cap.get("caption") or cap.get("status") or cap.get("explanation") or ""

	        # Reports that merely say the model is unavailable carry no findings.
	        if text and "unavailable" not in text.lower():
	            caption_entries.append({"model": model, "text": text.lower()})

	    # --- STEP 3: Match each objective against the captions ---
	    results = []
	    for obj_text in objectives:
	        matched, evidence, matched_by = self._match_objective(obj_text, caption_entries)
	        results.append({
	            "text": obj_text,
	            "satisfied": matched,
	            "evidence": evidence,
	            "matched_by": matched_by,
	        })

	    # --- STEP 4: Compute overall status ---
	    satisfied_count = sum(1 for r in results if r["satisfied"])
	    total = len(results)
	    score = satisfied_count / total if total > 0 else 0.0

	    if satisfied_count == total and total > 0:
	        mission_status = "achieved"
	        status_message = f"→ CHECKMATE: All {total} objectives verified by specialist reports."
	    elif satisfied_count > 0:
	        mission_status = "partially_achieved"
	        status_message = f"Mission {int(score * 100)}% complete: {satisfied_count}/{total} objectives verified."
	    else:
	        mission_status = "searching"
	        status_message = f"Monitoring... 0/{total} objectives detected so far."

	    logger.info("[SMART CHECKMATE] Result: %s (%d/%d)", mission_status, satisfied_count, total)
	    return {
	        "mission_status": mission_status,
	        "score": round(score, 2),
	        "objectives": results,
	        "status_message": status_message,
	        "satisfied": satisfied_count > 0,  # ANY match = partially satisfied
	    }

	def _split_objectives(self, prompt: str) -> List[str]:
	"""Split a mission prompt into granular objectives."""
	# Normalize
	text = prompt.lower().strip().strip('"').strip("'")

	# Remove common prefixes
	for prefix in ["detect ", "find ", "look for ", "search for ", "monitor for ", "check for ", "identify "]:
	if text.startswith(prefix):
	text = text[len(prefix):]
	break

	# 1. Split on major separators: commas, semicolons, "and", "then", and "after"
	parts = re.split(r'[,;]\|\band\b\|\bthen\b\|\bafter\b', text)

	# 2. Further split on "positional", "conditional", or "active" connectors to get granular items
	# e.g. "person wearing a red shirt holding a phone" -> [person, red shirt, phone]
	granular_parts = []
	for p in parts:
	# Split on words that indicate separate attributes, conditions, or actions
	sub = re.split(r'\bor\b\|\bnear\b\|\bwith\b\|\bwho\b\|\bwearing\b\|\bat\b\|\bbeside\b\|\bholding\b\|\bcarrying\b\|\busing\b\|\bshowing\b\|\bwalking\b\|\brunning\b', p)
	granular_parts.extend(sub)

	# 3. Clean each granular part recursively
	final_parts = []

	# Expanded list of tactical noise to strip
	COMMAND_VERBS = [
	"detect", "find", "look for", "search for", "monitor for", "check for",
	"identify", "study", "watch", "observe", "scan", "report", "notify",
	"is there", "is", "there", "was", "were", "any sign of", "presence of", "evidence of", "show me",
	"also", "then", "please", "can you", "try to"
	]

	ARTICLES = ["a ", "an ", "the ", "any ", "some ", "all ", "every "]

	for gp in granular_parts:
	cleaned = gp.strip()

	# Recursive cleaning: Keep stripping until no more noise is found at the start
	changed = True
	while changed:
	original = cleaned

	# Check for verbs/phrases
	for verb in COMMAND_VERBS:
	if cleaned.startswith(verb + " "):
	cleaned = cleaned[len(verb):].strip()
	elif cleaned.startswith(verb + "s "): # handles "detects", "checks" etc
	cleaned = cleaned[len(verb)+1:].strip()

	# Check for articles
	for article in ARTICLES:
	if cleaned.startswith(article):
	cleaned = cleaned[len(article):].strip()

	# Handle possessives or "sign of" trailing
	if cleaned.startswith("sign of "): cleaned = cleaned[8:].strip()
	if cleaned.startswith("signs of "): cleaned = cleaned[9:].strip()

	changed = (cleaned != original)

	if cleaned and len(cleaned) > 2:
	final_parts.append(cleaned)

	# Deduplicate while preserving order
	unique = []
	seen = set()
	for p in final_parts:
	if p not in seen:
	seen.add(p)
	unique.append(p)

	return unique if unique else [text]

	def _match_objective(self, objective: str, caption_entries: List[Dict[str, str]]) -> tuple:
	"""
	Match a single objective against all specialist captions.

	KEY LOGIC:
	1. Strip "Scene context: ..." from captions (it's base perception echo, not findings)
	2. Check if the sentence containing the keyword is negated
	3. Only match on POSITIVE findings from specialists

	Returns: (matched: bool, evidence: str \| None, matched_by: str \| None)
	"""
	obj_words = objective.lower().split()
	stop_words = {"a", "an", "the", "is", "are", "was", "were", "be", "been", "being",
	"in", "on", "at", "to", "for", "of", "with", "by", "from", "it",
	"if", "or", "not", "no", "what", "how", "sign", "signs", "near", "who", "which"}
	meaningful_words = [w for w in obj_words if w not in stop_words and len(w) > 2]

	# Negative conclusion patterns — if the caption matches any of these, skip it entirely
	negative_patterns = [
	r"no target .* detected",
	r"no target .* match",
	r"no readable text found",
	r"no .* detected for mission",
	r"no .* found in frame",
	r"no .* match for mission",
	r"no significant .* detected",
	r"no clear .* detected",
	r"no human poses detected",
	r"no speech detected",
	r"no notable .* found",
	r"no .* identified",
	r"scanning.*specifically",
	r"searching for",
	r"model unavailable",
	r"unavailable",
	r"no significant findings",
	r"awaiting",
	r"processing",
	]

	# Negation words (Disabled to ensure baseline verification for deadline)
	negation_words = []


	# ── WEIGHTED AND MATCHING LOGIC ──
	# Goal: If targets exist (e.g. "blue"), they MUST match.
	# Categories (e.g. "color") are optional context.

	target_words = [w for w in meaningful_words if w not in CATEGORY_WORDS]
	context_words = [w for w in meaningful_words if w in CATEGORY_WORDS]

	# If no specific targets (e.g. prompt is just "detect color"), treat categories as targets
	if not target_words:
	target_words = context_words

	for entry in caption_entries:
	raw_caption = entry["text"].lower()
	model_name = entry["model"]

	# 1. Strip context echo
	caption_text = raw_caption
	scene_ctx_idx = caption_text.find("scene context:")
	if scene_ctx_idx != -1:
	caption_text = caption_text[:scene_ctx_idx].strip().rstrip(".")

	if not caption_text or len(caption_text) < 5:
	continue

	# 2. Check negative conclusion patterns
	if any(re.search(pattern, caption_text) for pattern in negative_patterns):
	continue

	# 3. Sentence-level Verification (with Negation Awareness)
	sentences = re.split(r'[.!?]+', caption_text)

	# Filter for sentences that ARE NOT negated
	positive_sentences = []
	for s in sentences:
	s = s.strip()
	if not s: continue
	# If sentence contains a negation word, it's not a positive finding
	if any(re.search(fr"\b{re.escape(neg)}\b", s) for neg in negation_words):
	continue
	positive_sentences.append(s)

	# Combine positive findings and sanitize special characters (slashes/parentheses)
	# This allows "standing/active" to match "standing" and "person(s)" to match "person"
	verified_context = " ".join(positive_sentences)
	verified_context = verified_context.replace("/", " ").replace("(", " ").replace(")", " ")

	if not verified_context:
	continue

	# Verify ALL mandatory target words exist
	all_targets_verified = True
	UTILITY_WORDS = {"sign", "evidence", "monitor", "detect", "finding", "presence", "detection", "check", "monitor"}

	for word in target_words:
	# Skip utility words that don't appear in technical specialist reports
	if word in UTILITY_WORDS:
	continue

	word_found = False
	# Literal check
	if re.search(fr"\b{re.escape(word)}\b", verified_context):
	word_found = True
	# Semantic expansion check (using the new Bidirectional Mirror)
	elif word in self.concept_mirror:
	for kw in self.concept_mirror[word]:
	if re.search(fr"\b{re.escape(kw)}\b", verified_context):
	word_found = True
	break

	if not word_found:
	all_targets_verified = False
	break

	if all_targets_verified:
	# Positive match found in this report!
	# Evidence: show raw caption only, strip model name prefix
	return (True, raw_caption[:120], model_name)

	return (False, None, None)

	return (False, None, None)


	class BufferManager:
	    """Keeps one observation buffer per session, created lazily on first access."""

	    def __init__(self, window_seconds: float = 10.0):
	        # Window length handed to every buffer this manager creates.
	        self.window_seconds = window_seconds
	        # session_id -> buffer for that session
	        self.buffers: Dict[str, ObservationBuffer] = {}

	    def get_buffer(self, session_id: str) -> ObservationBuffer:
	        """Return the buffer for ``session_id``, creating and storing it if absent."""
	        try:
	            return self.buffers[session_id]
	        except KeyError:
	            created = ObservationBuffer(window_seconds=self.window_seconds)
	            self.buffers[session_id] = created
	            return created

	    def clear_session(self, session_id: str):
	        """Forget the buffer of ``session_id``; unknown sessions are ignored."""
	        self.buffers.pop(session_id, None)

	# --- STAGE 5: EXECUTIVE CONTROL (Mission Supervisor) ---

	class MissionSupervisor:
	    """
	    Adaptive controller that monitors mission progress and manages retries.

	    Each call to ``evaluate_and_supervise`` evaluates the mission; while it
	    is not achieved, the supervisor diagnoses the likely failure cause and
	    proposes a not-yet-tried strategy, up to ``MAX_ATTEMPTS`` per session.
	    """
	    MAX_ATTEMPTS = 3

	    # Strategy catalog: failure_type -> [(strategy_name, success_prob, resource_cost), ...]
	    _STRATEGY_CATALOG = {
	        "low_light": [
	            ("enable_thermal", 0.9, 4),
	            ("increase_gain", 0.6, 1),
	            ("lower_thresholds", 0.2, 0),
	        ],
	        "high_noise": [
	            ("switch_to_visual_only", 0.7, 1),
	            ("noise_gating", 0.5, 2),
	        ],
	        "low_confidence_match": [
	            ("switch_to_specialist", 0.8, 2),
	            ("zoom_in", 0.5, 1),
	        ],
	        "high_perception_uncertainty": [
	            ("active_sensing_sweep", 0.8, 3),  # Multi-model cross-check
	            ("widen_fov", 0.4, 1),
	        ],
	        "high_anticipatory_risk": [
	            ("increase_frame_rate", 0.7, 5),  # Hardware intensive
	            ("switch_to_specialist", 0.9, 2),
	        ],
	        "temporal_stagnation": [
	            ("widen_fov", 0.4, 1),
	            ("lower_semantic_thresholds", 0.3, 1),
	        ],
	        "target_not_found": [
	            ("widen_fov", 0.5, 1),
	            ("request_human_clarification", 1.0, 10),  # Human is high cost!
	        ],
	    }
	    # Used when the failure type has no catalog entry.
	    _FALLBACK_STRATEGIES = [("lower_thresholds", 0.2, 0)]

	    def __init__(self, evaluator: MissionEvaluator):
	        self.evaluator = evaluator
	        self.attempts = {}  # session_id -> current_attempt_count
	        self.history = {}   # session_id -> list of tried strategies

	    @staticmethod
	    def _as_dict(world_state: Any) -> Any:
	        """Return ``world_state.to_dict()`` when available, else the object itself."""
	        return world_state.to_dict() if hasattr(world_state, "to_dict") else world_state

	    def evaluate_and_supervise(self, session_id: str, world_state: Any) -> Dict[str, Any]:
	        """
	        Evaluate the mission and, if it is not achieved, plan the next retry.

	        1. Evaluate the mission with ``self.evaluator.evaluate(world_state)``.
	        2. Attach an ``early_warning`` entry when any entity's prediction has
	           a ``risk_score`` above 0.75, regardless of the mission status.
	        3. On "achieved"/"none"/"No active mission." reset the session state.
	        4. Otherwise mark the result "retrying" with a ``next_strategy`` and
	           ``attempt`` number, or "failed" once ``MAX_ATTEMPTS`` is used up.

	        Args:
	            session_id: Key for the per-session attempt counter and history.
	            world_state: Dict, or object exposing ``to_dict()``.

	        Returns:
	            The evaluator's result dict, updated in place as described above.
	        """
	        result = self.evaluator.evaluate(world_state)

	        # ── Anticipatory Early Warning ──
	        # Even if the mission is not achieved, high risk injects a warning.
	        ws_dict = self._as_dict(world_state)
	        high_risk_entities = [
	            e for e in ws_dict.get("entities", [])
	            if (e.get("prediction") or {}).get("risk_score", 0) > 0.75
	        ]

	        if high_risk_entities:
	            result["early_warning"] = {
	                "level": "critical",
	                "message": f"Anticipatory threat forming! {len(high_risk_entities)} subjects showing risky behavior.",
	                "details": [e["prediction"] for e in high_risk_entities]
	            }

	        # If achieved, no mission, or status is none, reset supervisor
	        if result["mission_status"] in ["achieved", "none"] or result["status_message"] == "No active mission.":
	            self.attempts[session_id] = 0
	            self.history[session_id] = []
	            return result

	        # Adaptive retry logic
	        current_attempt = self.attempts.get(session_id, 0)

	        if current_attempt < self.MAX_ATTEMPTS:
	            failure_type = self._diagnose_failure(world_state)
	            strategy = self._select_strategy(failure_type, self.history.get(session_id, []))

	            self.attempts[session_id] = current_attempt + 1
	            self.history.setdefault(session_id, []).append(strategy)

	            result["mission_status"] = "retrying"
	            result["next_strategy"] = strategy
	            result["attempt"] = self.attempts[session_id]
	            logger.info(f"[SUPERVISOR] Attempt {result['attempt']} failed. Diagnosis: {failure_type}. Strategy: {strategy}")
	        else:
	            result["mission_status"] = "failed"
	            # Report the configured limit rather than a hard-coded number.
	            result["status_message"] = (
	                f"Mission failed after {self.MAX_ATTEMPTS} attempts. Target not found or unreachable."
	            )
	            logger.warning(f"[SUPERVISOR] Mission FAILED for session {session_id}.")

	        return result

	    def _diagnose_failure(self, world_state: Any) -> str:
	        """
	        Classify why the mission is stalling.

	        Checks run in order and the first hit wins: environment (lighting,
	        noise), then the highest-confidence entity (uncertainty, risk, low
	        confidence, unchanged state over its last five history items), then
	        occlusion. Returns "target_not_found" when nothing applies.
	        """
	        ws_dict = self._as_dict(world_state)
	        entities = ws_dict.get("entities", [])

	        # 1. Lighting & Environment
	        if ws_dict.get("lighting") == "low":
	            return "low_light"
	        if ws_dict.get("noise_level", 0.0) > 0.6:
	            return "high_noise"

	        # 2. Target Specific Issues (Risk & Uncertainty)
	        if entities:
	            best_e = max(entities, key=lambda e: e.get("confidence", 0))
	            pred = best_e.get("prediction") or {}

	            if pred.get("uncertainty", 0) > 0.6:
	                return "high_perception_uncertainty"
	            if pred.get("risk_score", 0) > 0.6:
	                return "high_anticipatory_risk"

	            if best_e.get("confidence", 0) < 0.4:
	                return "low_confidence_match"

	            # 3. Temporal stagnation: seen, but its state has not changed recently
	            history = best_e.get("history", [])
	            if len(history) > 5:
	                states = [h.get("state") for h in history[-5:]]
	                if all(s == states[0] for s in states):
	                    return "temporal_stagnation"

	        # 4. Sensor Issues
	        if ws_dict.get("target_status") == "occluded":
	            return "occlusion"

	        return "target_not_found"

	    def _select_strategy(self, failure_type: str, history: List[str]) -> str:
	        """
	        Pick the untried strategy with the best success/cost trade-off.

	        Candidates come from the catalog entry for ``failure_type`` (or the
	        fallback list). Strategies already in ``history`` are excluded and
	        the rest are ranked by ``success_prob - cost * 0.1``; on a tie the
	        one listed first wins. Returns "human_intervention_required" when
	        every candidate has been tried.
	        """
	        candidates = self._STRATEGY_CATALOG.get(failure_type, self._FALLBACK_STRATEGIES)

	        untried = [s for s in candidates if s[0] not in history]
	        if not untried:
	            return "human_intervention_required"

	        # We want high success but low cost.
	        best = max(untried, key=lambda x: x[1] - (x[2] * 0.1))
	        return best[0]

	# Singleton instances, created once at import time.
	# The supervisor wraps the evaluator instance created on the line above it.
	mission_evaluator = MissionEvaluator()
	buffer_manager = BufferManager()
	mission_supervisor = MissionSupervisor(mission_evaluator)