dpv007 commited on
Commit
9a09ec4
·
verified ·
1 Parent(s): 2d03b8b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +472 -777
app.py CHANGED
@@ -1,19 +1,6 @@
1
- # app.py
2
  """
3
- Elderly HealthWatch AI Backend (FastAPI)
4
- Pipeline:
5
- - receive images
6
- - run VLM (remote gradio / chat_fn) -> JSON feature vector + raw text
7
- - run LLM (remote gradio /chat) -> structured risk JSON (per requested schema)
8
- - continue rest of processing and store results
9
-
10
- Notes:
11
- - Add gradio_client==1.13.2 (or another compatible 1.x) to requirements.txt
12
- - If VLM/LLM Spaces are private, set HF_TOKEN in the environment for authentication.
13
- - This version includes a robust regex-based extractor that finds the outermost {...} block
14
- in the LLM output, extracts numeric values for the required keys, and always returns
15
- numeric defaults (no NaN) so frontends will not receive null/None for numeric fields.
16
- - This variant logs raw LLM output and the parsed JSON using Python logging.
17
  """
18
 
19
  import io
@@ -31,272 +18,293 @@ from fastapi import FastAPI, UploadFile, File, BackgroundTasks, HTTPException
31
  from fastapi.middleware.cors import CORSMiddleware
32
  from PIL import Image
33
  import numpy as np
34
- import cv2 # opencv-python-headless expected installed
35
 
36
- # Optional gradio client (for VLM + LLM calls)
37
  try:
38
- from gradio_client import Client, handle_file # type: ignore
39
  GRADIO_AVAILABLE = True
40
  except Exception:
41
  GRADIO_AVAILABLE = False
42
 
43
- # Configure logging
 
 
44
  logging.basicConfig(level=logging.INFO)
45
  logger = logging.getLogger("elderly_healthwatch")
46
 
47
- # Configuration for remote VLM and LLM spaces (change to your target Space names)
48
  GRADIO_VLM_SPACE = os.getenv("GRADIO_SPACE", "developer0hye/Qwen3-VL-8B-Instruct")
49
  LLM_GRADIO_SPACE = os.getenv("LLM_GRADIO_SPACE", "Tonic/med-gpt-oss-20b-demo")
50
  HF_TOKEN = os.getenv("HF_TOKEN", None)
51
 
52
- # Default VLM prompt
53
  DEFAULT_VLM_PROMPT = (
54
  "From the provided face/eye images, compute the required screening features "
55
  "(pallor, sclera yellowness, redness, mobility metrics, quality checks) "
56
  "and output a clean JSON feature vector only."
57
  )
58
 
59
- # Default LLM prompts / metadata (stricter: force JSON-only output)
60
- LLM_MODEL_IDENTITY = os.getenv(
61
- "LLM_MODEL_IDENTITY",
62
- "You are GPT-Tonic, a large language model trained by TonicAI for clinical reasoning."
63
  )
64
- LLM_SYSTEM_PROMPT = os.getenv(
65
- "LLM_SYSTEM_PROMPT",
66
- "System: This assistant MUST ONLY OUTPUT a single valid JSON object as its response — no prose, no explanations, no code fences, no annotations. The JSON must follow the schema requested by the user."
67
- )
68
- LLM_DEVELOPER_PROMPT = os.getenv(
69
- "LLM_DEVELOPER_PROMPT",
70
- "Developer: Output ONLY a single valid JSON object with keys: risk_score, jaundice_probability, anemia_probability, hydration_issue_probability, neurological_issue_probability, summary, recommendation, confidence. Do NOT include any extra fields or natural language outside the JSON object."
71
  )
72
 
73
- # Try MTCNN libs; fallback to OpenCV haar cascades
74
- _MTCNN_IMPL = None
75
- try:
76
- from facenet_pytorch import MTCNN as FacenetMTCNN # type: ignore
77
- _MTCNN_IMPL = "facenet_pytorch"
78
- except Exception:
79
- FacenetMTCNN = None
80
- _MTCNN_IMPL = None
81
 
82
- if _MTCNN_IMPL is None:
 
 
 
 
 
 
 
 
83
  try:
84
- from mtcnn import MTCNN as ClassicMTCNN # type: ignore
85
- _MTCNN_IMPL = "mtcnn"
86
  except Exception:
87
- ClassicMTCNN = None
88
-
89
- def create_mtcnn_or_fallback():
90
- if _MTCNN_IMPL == "facenet_pytorch" and FacenetMTCNN is not None:
91
- try:
92
- return FacenetMTCNN(keep_all=False, device="cpu")
93
- except Exception:
94
- pass
95
- if _MTCNN_IMPL == "mtcnn" and ClassicMTCNN is not None:
96
- try:
97
- return ClassicMTCNN()
98
- except Exception:
99
- pass
100
- # OpenCV Haar fallback
101
  try:
102
- face_cascade_path = os.path.join(cv2.data.haarcascades, "haarcascade_frontalface_default.xml")
103
- eye_cascade_path = os.path.join(cv2.data.haarcascades, "haarcascade_eye.xml")
104
- if os.path.exists(face_cascade_path) and os.path.exists(eye_cascade_path):
 
 
 
 
 
 
 
105
  return {
106
  "impl": "opencv",
107
- "face_cascade": cv2.CascadeClassifier(face_cascade_path),
108
- "eye_cascade": cv2.CascadeClassifier(eye_cascade_path)
109
- }
110
  except Exception:
111
  pass
112
- return None
113
-
114
- mtcnn = create_mtcnn_or_fallback()
115
-
116
- app = FastAPI(title="Elderly HealthWatch AI Backend")
117
- app.add_middleware(
118
- CORSMiddleware,
119
- allow_origins=["*"],
120
- allow_credentials=True,
121
- allow_methods=["*"],
122
- allow_headers=["*"],
123
- )
124
 
125
- # In-memory DB for demo
126
- screenings_db: Dict[str, Dict[str, Any]] = {}
127
 
128
- # -----------------------
129
- # Utility helpers
130
- # -----------------------
131
  def load_image_from_bytes(bytes_data: bytes) -> Image.Image:
132
  return Image.open(io.BytesIO(bytes_data)).convert("RGB")
133
 
134
- def estimate_eye_openness_from_detection(confidence: float) -> float:
135
- try:
136
- conf = float(confidence)
137
- openness = min(max((conf * 1.15), 0.0), 1.0)
138
- return openness
139
- except Exception:
140
  return 0.0
141
-
142
- # -----------------------
143
- # Regex-based robust extractor
144
- # -----------------------
145
- def extract_json_via_regex(raw_text: str) -> Dict[str, Any]:
146
- """
147
- 1) Finds the outermost { ... } block in raw_text.
148
- 2) Extracts numeric values after the listed keys using regex, tolerating:
149
- - quotes, spaces, percent signs, percent numbers like "55%", strings like "0.12", integers, or numbers in quotes.
150
- 3) Returns a dict with numeric fields GUARANTEED to be floats (no None/NaN), and string fields for summary/recommendation.
151
- """
152
- # Find the first {...} block (outermost approximation)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
153
  match = re.search(r"\{[\s\S]*\}", raw_text)
154
  if not match:
155
  raise ValueError("No JSON-like block found in LLM output")
156
-
157
  block = match.group(0)
158
-
159
- def find_number_for_key(key: str) -> Optional[float]:
160
- """
161
- Returns a float in range 0..1 for probabilities, and raw numeric for other keys depending on usage.
162
- This helper returns None if not found; caller will replace with defaults (0.0).
163
- """
164
- # Try multiple patterns to be robust
165
- # Pattern captures numbers possibly with % and optional quotes, e.g. "45%", '0.12', 0.5, " 87 "
166
  patterns = [
167
- rf'"{key}"\s*:\s*["\']?\s*([-+]?\d+(\.\d+)?)\s*%?\s*["\']?', # "key": "45%" or "key": 0.45
168
  rf"'{key}'\s*:\s*['\"]?\s*([-+]?\d+(\.\d+)?)\s*%?\s*['\"]?",
169
- rf'\b{key}\b\s*:\s*["\']?\s*([-+]?\d+(\.\d+)?)\s*%?\s*["\']?', # key: 45%
170
- rf'"{key}"\s*:\s*["\']([^"\']+)["\']', # capture quoted text (for non-numeric attempts)
171
- rf"'{key}'\s*:\s*['\"]([^'\"]+)['\"]"
172
  ]
173
  for pat in patterns:
174
  m = re.search(pat, block, flags=re.IGNORECASE)
175
- if not m:
176
- continue
177
- g = m.group(1)
178
- if g is None:
179
- continue
180
- s = str(g).strip()
181
- # Remove percent sign if present
182
- s = s.replace("%", "").strip()
183
- # Try to coerce to float
184
- try:
185
- val = float(s)
186
- return val
187
- except Exception:
188
- # not numeric
189
- return None
190
  return None
191
-
192
- def find_text_for_key(key: str) -> str:
193
- # capture "key": "some text" allowing single/double quotes and also unquoted until comma/}
194
  m = re.search(rf'"{key}"\s*:\s*"([^"]*)"', block, flags=re.IGNORECASE)
195
  if m:
196
  return m.group(1).strip()
197
  m = re.search(rf"'{key}'\s*:\s*'([^']*)'", block, flags=re.IGNORECASE)
198
  if m:
199
  return m.group(1).strip()
200
- # fallback: key: some text (unquoted) up to comma or }
201
  m = re.search(rf'\b{key}\b\s*:\s*([^\n,}}]+)', block, flags=re.IGNORECASE)
202
  if m:
203
  return m.group(1).strip().strip('",')
204
  return ""
205
-
206
- # Extract raw numeric candidates
207
- raw_risk = find_number_for_key("risk_score")
208
- raw_jaundice = find_number_for_key("jaundice_probability")
209
- raw_anemia = find_number_for_key("anemia_probability")
210
- raw_hydration = find_number_for_key("hydration_issue_probability")
211
- raw_neuro = find_number_for_key("neurological_issue_probability")
212
- raw_conf = find_number_for_key("confidence")
213
-
214
- # Normalize:
215
- # - For probabilities: if value > 1 and <=100 => treat as percent -> divide by 100. If <=1 treat as fraction.
216
- def normalize_prob(v: Optional[float]) -> float:
217
- if v is None:
218
- return 0.0
219
- if v > 1.0 and v <= 100.0:
220
- return max(0.0, min(1.0, v / 100.0))
221
- # if v is large >100, clamp to 1.0
222
- if v > 100.0:
223
- return 1.0
224
- # otherwise assume already 0..1
225
- return max(0.0, min(1.0, v))
226
-
227
- jaundice_probability = normalize_prob(raw_jaundice)
228
- anemia_probability = normalize_prob(raw_anemia)
229
- hydration_issue_probability = normalize_prob(raw_hydration)
230
- neurological_issue_probability = normalize_prob(raw_neuro)
231
- confidence = normalize_prob(raw_conf)
232
-
233
- # risk_score: return in 0..100
234
- def normalize_risk(v: Optional[float]) -> float:
235
- if v is None:
236
- return 0.0
237
- if v <= 1.0:
238
- # fraction given -> scale to 0..100
239
- return round(max(0.0, min(100.0, v * 100.0)), 2)
240
- # if between 1 and 100, assume it's already 0..100
241
- if v > 1.0 and v <= 100.0:
242
- return round(max(0.0, min(100.0, v)), 2)
243
- # clamp anything insane
244
- return round(max(0.0, min(100.0, v if v < float('inf') else 100.0)), 2)
245
-
246
- risk_score = normalize_risk(raw_risk)
247
-
248
- summary = find_text_for_key("summary")
249
- recommendation = find_text_for_key("recommendation")
250
-
251
- out = {
252
- "risk_score": risk_score,
253
- "jaundice_probability": round(jaundice_probability, 4),
254
- "anemia_probability": round(anemia_probability, 4),
255
- "hydration_issue_probability": round(hydration_issue_probability, 4),
256
- "neurological_issue_probability": round(neurological_issue_probability, 4),
257
- "confidence": round(confidence, 4),
258
- "summary": summary,
259
- "recommendation": recommendation
260
  }
261
- return out
262
 
263
- # -----------------------
264
- # Gradio / VLM helper (returns parsed dict OR None, plus raw text)
265
- # -----------------------
266
- def get_gradio_client_for_space(space: str) -> Client:
 
267
  if not GRADIO_AVAILABLE:
268
- raise RuntimeError("gradio_client not installed in this environment. Add gradio_client to requirements.txt.")
269
- if HF_TOKEN:
270
- return Client(space, hf_token=HF_TOKEN)
271
- return Client(space)
272
-
273
- def run_vlm_and_get_features(face_path: str, eye_path: str, prompt: Optional[str] = None) -> Tuple[Optional[Dict[str, Any]], str]:
274
- """
275
- Synchronous call to remote VLM (gradio /chat_fn). Returns tuple:
276
- (parsed_features_dict_or_None, raw_text_response_str)
277
-
278
- We attempt to parse JSON as before, but always return the original raw text so it can be
279
- forwarded verbatim to the LLM if desired.
280
- """
281
  prompt = prompt or DEFAULT_VLM_PROMPT
 
282
  if not os.path.exists(face_path) or not os.path.exists(eye_path):
283
- raise FileNotFoundError("Face or eye image path missing for VLM call.")
284
- if not GRADIO_AVAILABLE:
285
- raise RuntimeError("gradio_client not available in this environment.")
286
-
287
- client = get_gradio_client_for_space(GRADIO_VLM_SPACE)
288
  message = {"text": prompt, "files": [handle_file(face_path), handle_file(eye_path)]}
289
-
290
  try:
291
- logger.info("Calling VLM Space %s", GRADIO_VLM_SPACE)
292
  result = client.predict(message=message, history=[], api_name="/chat_fn")
293
  except Exception as e:
294
  logger.exception("VLM call failed")
295
  raise RuntimeError(f"VLM call failed: {e}")
296
-
297
- if not result:
298
- raise RuntimeError("Empty response from VLM")
299
-
300
  # Normalize result
301
  if isinstance(result, (list, tuple)):
302
  out = result[0]
@@ -304,224 +312,184 @@ def run_vlm_and_get_features(face_path: str, eye_path: str, prompt: Optional[str
304
  out = result
305
  else:
306
  out = {"text": str(result)}
307
-
308
- if not isinstance(out, dict):
309
- raise RuntimeError("Unexpected VLM output format (expected dict with 'text' key)")
310
-
311
- text_out = out.get("text") or out.get("output") or None
312
- if not text_out:
313
- text_out = json.dumps(out)
314
-
315
- # Try to parse JSON but remember raw text always
316
- parsed_features = None
317
  try:
318
- parsed_features = json.loads(text_out)
319
- if not isinstance(parsed_features, dict):
320
- parsed_features = None
321
  except Exception:
 
322
  try:
323
- s = text_out
324
- first = s.find("{")
325
- last = s.rfind("}")
326
  if first != -1 and last != -1 and last > first:
327
- maybe = s[first:last+1]
328
- parsed_features = json.loads(maybe)
329
- if not isinstance(parsed_features, dict):
330
- parsed_features = None
331
- else:
332
- parsed_features = None
333
  except Exception:
334
- parsed_features = None
335
-
336
- return parsed_features, text_out
337
-
338
- # -----------------------
339
- # Gradio / LLM helper (defensive, with retry + clamps)
340
- # -----------------------
341
- def run_llm_on_vlm(vlm_features_or_raw: Any,
342
- max_new_tokens: int = 1024,
343
- temperature: float = 0.0,
344
- reasoning_effort: str = "medium",
345
- model_identity: Optional[str] = None,
346
- system_prompt: Optional[str] = None,
347
- developer_prompt: Optional[str] = None) -> Dict[str, Any]:
348
- """
349
- Call the remote LLM Space's /chat endpoint with defensive input handling and a single retry.
350
- - Coerces types (int for tokens), clamps ranges where remote spaces often expect them.
351
- - Retries once with safe defaults if the Space rejects the inputs (e.g. temperature too low).
352
- - Logs and returns regex-extracted JSON as before.
353
- """
354
- if not GRADIO_AVAILABLE:
355
- raise RuntimeError("gradio_client not installed. Add gradio_client to requirements.txt")
356
-
357
- # Try to import AppError for specific handling; fallback to Exception if unavailable
358
- try:
359
- from gradio_client import AppError # type: ignore
360
- except Exception:
361
- AppError = Exception # fallback
362
 
363
- client = get_gradio_client_for_space(LLM_GRADIO_SPACE)
364
- model_identity = model_identity or LLM_MODEL_IDENTITY
365
- system_prompt = system_prompt or LLM_SYSTEM_PROMPT
366
- developer_prompt = developer_prompt or LLM_DEVELOPER_PROMPT
367
-
368
- # Prepare the combined prompt: use raw string as-is, otherwise json.dumps the dict
369
- if isinstance(vlm_features_or_raw, str):
370
- vlm_json_str = vlm_features_or_raw
371
- else:
372
- vlm_json_str = json.dumps(vlm_features_or_raw, default=str)
373
-
374
- # Strong, explicit instruction to output only JSON
375
  instruction = (
376
- "\n\nSTRICT INSTRUCTIONS (READ CAREFULLY):\n"
377
- "1) OUTPUT ONLY a single valid JSON object and nothing else — no prose, no explanation, no code fences.\n"
378
- "2) The JSON MUST include these keys: risk_score, jaundice_probability, anemia_probability, "
379
  "hydration_issue_probability, neurological_issue_probability, summary, recommendation, confidence.\n"
380
- "3) Use numeric values for probabilities (0..1) and for risk_score (0..100). Use strings for summary and recommendation.\n"
381
- "4) Do NOT mention disease names in summary or recommendation; use neutral wording only.\n"
382
- "If you cannot estimate a value, set it to null.\n\n"
383
- "Now, based on the VLM output below, produce ONLY the JSON object described above.\n\n"
384
- "===BEGIN VLM OUTPUT===\n"
385
- f"{vlm_json_str}\n"
386
- "===END VLM OUTPUT===\n\n"
387
- )
388
- input_payload_str = instruction
389
-
390
- # Defensive coercion / clamps
391
- try_max_new_tokens = int(max_new_tokens) if max_new_tokens is not None else 1024
392
- if try_max_new_tokens <= 0:
393
- try_max_new_tokens = 1024
394
-
395
- try_temperature = float(temperature) if temperature is not None else 0.0
396
- # Many demos require temperature >= 0.1; clamp to 0.1 minimum to avoid validation failures
397
- if try_temperature < 0.1:
398
- try_temperature = 0.1
399
-
400
- # prepare kwargs for predict
401
- predict_kwargs = dict(
402
- input_data=input_payload_str,
403
- max_new_tokens=float(try_max_new_tokens),
404
- model_identity=model_identity,
405
- system_prompt=system_prompt,
406
- developer_prompt=developer_prompt,
407
- reasoning_effort=reasoning_effort,
408
- temperature=float(try_temperature),
409
- top_p=0.9,
410
- top_k=50,
411
- repetition_penalty=1.0,
412
- api_name="/chat"
413
  )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
414
 
415
- # attempt + one retry with safer defaults if AppError occurs
416
- last_exc = None
417
- for attempt in (1, 2):
418
- try:
419
- logger.info("Calling LLM Space %s (attempt %d) with temperature=%s, max_new_tokens=%s",
420
- LLM_GRADIO_SPACE, attempt, predict_kwargs.get("temperature"), predict_kwargs.get("max_new_tokens"))
421
- result = client.predict(**predict_kwargs)
422
- # normalize to string
423
- if isinstance(result, (dict, list)):
424
- text_out = json.dumps(result)
425
- else:
426
- text_out = str(result)
427
- if not text_out or len(text_out.strip()) == 0:
428
- raise RuntimeError("LLM returned empty response")
429
- logger.info("LLM raw output:\n%s", text_out)
430
-
431
- # parse with regex extractor (may raise)
432
- parsed = extract_json_via_regex(text_out)
433
- if not isinstance(parsed, dict):
434
- raise ValueError("Parsed LLM output is not a JSON object/dict")
435
-
436
- # pretty log parsed JSON
437
- try:
438
- logger.info("LLM parsed JSON:\n%s", json.dumps(parsed, indent=2, ensure_ascii=False))
439
- except Exception:
440
- logger.info("LLM parsed JSON (raw dict): %s", str(parsed))
441
-
442
- # defensive clamps (same as before)
443
- def safe_prob(val):
444
- try:
445
- v = float(val)
446
- return max(0.0, min(1.0, v))
447
- except Exception:
448
- return 0.0
449
-
450
- for k in [
451
- "jaundice_probability",
452
- "anemia_probability",
453
- "hydration_issue_probability",
454
- "neurological_issue_probability"
455
- ]:
456
- parsed[k] = safe_prob(parsed.get(k, 0.0))
457
-
458
- try:
459
- rs = float(parsed.get("risk_score", 0.0))
460
- parsed["risk_score"] = round(max(0.0, min(100.0, rs)), 2)
461
- except Exception:
462
- parsed["risk_score"] = 0.0
463
-
464
- parsed["confidence"] = safe_prob(parsed.get("confidence", 0.0))
465
- parsed["summary"] = str(parsed.get("summary", "") or "").strip()
466
- parsed["recommendation"] = str(parsed.get("recommendation", "") or "").strip()
467
-
468
- for k in [
469
- "jaundice_probability",
470
- "anemia_probability",
471
- "hydration_issue_probability",
472
- "neurological_issue_probability",
473
- "confidence",
474
- "risk_score"
475
- ]:
476
- parsed[f"{k}_was_missing"] = False
477
-
478
- return parsed
479
-
480
- except AppError as app_e:
481
- # Specific remote validation error: log and attempt a single retry with ultra-safe defaults
482
- logger.exception("LLM AppError (remote validation failed) on attempt %d: %s", attempt, str(app_e))
483
- last_exc = app_e
484
- if attempt == 1:
485
- # tighten inputs and retry: force temperature=0.2, max_new_tokens=512
486
- predict_kwargs["temperature"] = 0.2
487
- predict_kwargs["max_new_tokens"] = float(512)
488
- logger.info("Retrying LLM call with temperature=0.2 and max_new_tokens=512")
489
- continue
490
- else:
491
- # no more retries
492
- raise RuntimeError(f"LLM call failed (AppError): {app_e}")
493
- except Exception as e:
494
- logger.exception("LLM call failed on attempt %d: %s", attempt, str(e))
495
- last_exc = e
496
- # try one retry only for non-AppError exceptions
497
- if attempt == 1:
498
- predict_kwargs["temperature"] = 0.2
499
- predict_kwargs["max_new_tokens"] = float(512)
500
- continue
501
- raise RuntimeError(f"LLM call failed: {e}")
502
-
503
- # if we reach here, raise last caught exception
504
- raise RuntimeError(f"LLM call ultimately failed: {last_exc}")
505
-
506
- # -----------------------
507
- # API endpoints
508
- # -----------------------
509
  @app.get("/")
510
  async def read_root():
511
  return {"message": "Elderly HealthWatch AI Backend"}
512
 
513
  @app.get("/health")
514
  async def health_check():
515
- impl = None
516
- if mtcnn is None:
517
- impl = "none"
518
- elif isinstance(mtcnn, dict) and mtcnn.get("impl") == "opencv":
519
- impl = "opencv_haar_fallback"
520
- else:
521
- impl = _MTCNN_IMPL
522
  return {
523
  "status": "healthy",
524
- "detector": impl,
525
  "vlm_available": GRADIO_AVAILABLE,
526
  "vlm_space": GRADIO_VLM_SPACE,
527
  "llm_space": LLM_GRADIO_SPACE
@@ -529,107 +497,46 @@ async def health_check():
529
 
530
  @app.post("/api/v1/validate-eye-photo")
531
  async def validate_eye_photo(image: UploadFile = File(...)):
532
- """
533
- Lightweight validation endpoint. Uses available detector (facenet/mtcnn/opencv) to check face/eye detection.
534
- For full pipeline, use /api/v1/upload which invokes VLM+LLM in background.
535
- """
536
- if mtcnn is None:
537
- raise HTTPException(status_code=500, detail="No face detector available in this deployment.")
538
-
539
  try:
540
  content = await image.read()
541
  if not content:
542
- raise HTTPException(status_code=400, detail="Empty file uploaded.")
 
543
  pil_img = load_image_from_bytes(content)
544
- img_arr = np.asarray(pil_img) # RGB
545
-
546
- # facenet-pytorch branch
547
- if not isinstance(mtcnn, dict) and _MTCNN_IMPL == "facenet_pytorch":
548
- try:
549
- boxes, probs, landmarks = mtcnn.detect(pil_img, landmarks=True)
550
- if boxes is None or len(boxes) == 0:
551
- return {"valid": False, "face_detected": False, "eye_openness_score": 0.0,
552
- "message_english": "No face detected. Please ensure your face is clearly visible in the frame.",
553
- "message_hindi": "कोई चेहरा नहीं मिला। कृपया सुनिश्चित करें कि आपका चेहरा फ्रेम में स्पष्ट रूप से दिखाई दे रहा है।"}
554
- prob = float(probs[0]) if probs is not None else 0.0
555
- lm = landmarks[0] if landmarks is not None else None
556
- if lm is not None and len(lm) >= 2:
557
- left_eye = {"x": float(lm[0][0]), "y": float(lm[0][1])}
558
- right_eye = {"x": float(lm[1][0]), "y": float(lm[1][1])}
559
- else:
560
- left_eye = right_eye = None
561
- eye_openness_score = estimate_eye_openness_from_detection(prob)
562
- is_valid = eye_openness_score >= 0.3
563
- return {"valid": bool(is_valid), "face_detected": True, "eye_openness_score": round(eye_openness_score, 2),
564
- "message_english": "Photo looks good! Eyes are properly open." if is_valid else "Eyes appear to be closed or partially closed. Please open your eyes wide and try again.",
565
- "message_hindi": "फोटो अच्छी है! आंखें ठीक से खुली हैं।" if is_valid else "आंखें बंद या आंशिक रूप से बंद दिखाई दे रही हैं। कृपया अपनी आंखें चौड��ी खोलें और पुनः प्रयास करें।",
566
- "eye_landmarks": {"left_eye": left_eye, "right_eye": right_eye}}
567
- except Exception:
568
- traceback.print_exc()
569
- raise HTTPException(status_code=500, detail="Face detector failed during inference.")
570
-
571
- # classic mtcnn branch
572
- if not isinstance(mtcnn, dict) and _MTCNN_IMPL == "mtcnn":
573
- try:
574
- detections = mtcnn.detect_faces(img_arr)
575
- except Exception:
576
- detections = mtcnn.detect_faces(pil_img)
577
- if not detections:
578
- return {"valid": False, "face_detected": False, "eye_openness_score": 0.0,
579
- "message_english": "No face detected. Please ensure your face is clearly visible in the frame.",
580
- "message_hindi": "कोई चेहरा नहीं मिला। कृपया सुनिश्चित करें कि आपका चेहरा फ्रेम में स्पष्ट रूप से दिखाई दे रहा है।"}
581
- face = detections[0]
582
- keypoints = face.get("keypoints", {})
583
- left_eye = keypoints.get("left_eye")
584
- right_eye = keypoints.get("right_eye")
585
- confidence = float(face.get("confidence", 0.0))
586
- eye_openness_score = estimate_eye_openness_from_detection(confidence)
587
- is_valid = eye_openness_score >= 0.3
588
- return {"valid": bool(is_valid), "face_detected": True, "eye_openness_score": round(eye_openness_score, 2),
589
- "message_english": "Photo looks good! Eyes are properly open." if is_valid else "Eyes appear to be closed or partially closed. Please open your eyes wide and try again.",
590
- "message_hindi": "फोटो अच्छी है! आंखें ठीक से खुली हैं।" if is_valid else "आंखें बंद या आंशिक रूप से बंद दिखाई दे रही हैं। कृपया अपनी आंखें चौड़ी खोलें और पुनः प्रयास करें।",
591
- "eye_landmarks": {"left_eye": left_eye, "right_eye": right_eye}}
592
-
593
- # OpenCV Haar cascade fallback
594
- if isinstance(mtcnn, dict) and mtcnn.get("impl") == "opencv":
595
- try:
596
- gray = cv2.cvtColor(img_arr, cv2.COLOR_RGB2GRAY)
597
- face_cascade = mtcnn["face_cascade"]
598
- eye_cascade = mtcnn["eye_cascade"]
599
- faces = face_cascade.detectMultiScale(gray, scaleFactor=1.1, minNeighbors=4, minSize=(60, 60))
600
- if len(faces) == 0:
601
- return {"valid": False, "face_detected": False, "eye_openness_score": 0.0,
602
- "message_english": "No face detected. Please ensure your face is clearly visible in the frame.",
603
- "message_hindi": "कोई चेहरा नहीं मिला। कृपया सुनिश्चित करें कि आपका चेहरा फ्रेम में स्पष्ट रूप से दिखाई दे रहा है।"}
604
- (x, y, w, h) = faces[0]
605
- roi_gray = gray[y:y+h, x:x+w]
606
- eyes = eye_cascade.detectMultiScale(roi_gray, scaleFactor=1.1, minNeighbors=5, minSize=(20, 10))
607
- eye_openness_score = 1.0 if len(eyes) >= 1 else 0.0
608
- is_valid = eye_openness_score >= 0.3
609
- left_eye = None
610
- right_eye = None
611
- if len(eyes) >= 1:
612
- ex, ey, ew, eh = eyes[0]
613
- cx = float(x + ex + ew/2)
614
- cy = float(y + ey + eh/2)
615
- left_eye = {"x": cx, "y": cy}
616
- return {"valid": bool(is_valid), "face_detected": True, "eye_openness_score": round(eye_openness_score, 2),
617
- "message_english": "Photo looks good! Eyes are detected." if is_valid else "Eyes not detected. Please open your eyes wide and try again.",
618
- "message_hindi": "फोटो अच्छी है! आंखें मिलीं।" if is_valid else "आंखें नहीं मिलीं। कृपया अपनी आंखें चौड़ी खोलें और पुनः प्रयास करें।",
619
- "eye_landmarks": {"left_eye": left_eye, "right_eye": right_eye}}
620
- except Exception:
621
- traceback.print_exc()
622
- raise HTTPException(status_code=500, detail="OpenCV fallback detector failed.")
623
-
624
- raise HTTPException(status_code=500, detail="Invalid detector configuration.")
625
- except HTTPException:
626
- raise
627
  except Exception as e:
628
- traceback.print_exc()
629
- return {"valid": False, "face_detected": False, "eye_openness_score": 0.0,
630
- "message_english": "Error processing image. Please try again.",
631
- "message_hindi": "छवि प्रोसेस करने में त्रुटि। कृपया पुनः प्रयास करें।",
632
- "error": str(e)}
633
 
634
  @app.post("/api/v1/upload")
635
  async def upload_images(
@@ -637,25 +544,21 @@ async def upload_images(
637
  face_image: UploadFile = File(...),
638
  eye_image: UploadFile = File(...)
639
  ):
640
- """
641
- Save images and enqueue background processing. VLM -> LLM runs inside process_screening.
642
- """
643
  try:
644
  screening_id = str(uuid.uuid4())
645
- now = datetime.utcnow().isoformat() + "Z"
646
- tmp_dir = "/tmp/elderly_healthwatch"
647
- os.makedirs(tmp_dir, exist_ok=True)
648
- face_path = os.path.join(tmp_dir, f"{screening_id}_face.jpg")
649
- eye_path = os.path.join(tmp_dir, f"{screening_id}_eye.jpg")
650
- face_bytes = await face_image.read()
651
- eye_bytes = await eye_image.read()
652
  with open(face_path, "wb") as f:
653
- f.write(face_bytes)
654
  with open(eye_path, "wb") as f:
655
- f.write(eye_bytes)
 
656
  screenings_db[screening_id] = {
657
  "id": screening_id,
658
- "timestamp": now,
659
  "face_image_path": face_path,
660
  "eye_image_path": eye_path,
661
  "status": "queued",
@@ -664,331 +567,123 @@ async def upload_images(
664
  "disease_predictions": [],
665
  "recommendations": {}
666
  }
 
667
  background_tasks.add_task(process_screening, screening_id)
 
668
  return {"screening_id": screening_id}
 
669
  except Exception as e:
670
- traceback.print_exc()
671
- raise HTTPException(status_code=500, detail=f"Failed to upload images: {e}")
672
 
673
  @app.post("/api/v1/analyze/{screening_id}")
674
  async def analyze_screening(screening_id: str, background_tasks: BackgroundTasks):
 
675
  if screening_id not in screenings_db:
676
  raise HTTPException(status_code=404, detail="Screening not found")
677
- if screenings_db[screening_id].get("status") == "processing":
 
678
  return {"message": "Already processing"}
 
679
  screenings_db[screening_id]["status"] = "queued"
680
  background_tasks.add_task(process_screening, screening_id)
 
681
  return {"message": "Analysis enqueued"}
682
 
683
  @app.get("/api/v1/status/{screening_id}")
684
  async def get_status(screening_id: str):
 
685
  if screening_id not in screenings_db:
686
  raise HTTPException(status_code=404, detail="Screening not found")
687
- status = screenings_db[screening_id].get("status", "unknown")
 
688
  progress = 50 if status == "processing" else (100 if status == "completed" else 0)
 
689
  return {"screening_id": screening_id, "status": status, "progress": progress}
690
 
691
  @app.get("/api/v1/results/{screening_id}")
692
  async def get_results(screening_id: str):
 
693
  if screening_id not in screenings_db:
694
  raise HTTPException(status_code=404, detail="Screening not found")
 
695
  return screenings_db[screening_id]
696
 
697
  @app.get("/api/v1/history/{user_id}")
698
  async def get_history(user_id: str):
 
699
  history = [s for s in screenings_db.values() if s.get("user_id") == user_id]
700
  return {"screenings": history}
701
 
702
- # -----------------------
703
- # Immediate VLM -> LLM routes (return vitals in one call)
704
- # -----------------------
705
  @app.post("/api/v1/get-vitals")
706
  async def get_vitals_from_upload(
707
  face_image: UploadFile = File(...),
708
  eye_image: UploadFile = File(...)
709
  ):
710
- """
711
- Run VLM -> LLM pipeline synchronously (but off the event loop) and return:
712
- { vlm_features, vlm_raw, structured_risk }
713
- """
714
  if not GRADIO_AVAILABLE:
715
- raise HTTPException(status_code=500, detail="VLM/LLM client not available in this deployment.")
716
-
717
- # save files to a temp directory
718
  try:
719
- tmp_dir = "/tmp/elderly_healthwatch"
720
- os.makedirs(tmp_dir, exist_ok=True)
721
  uid = str(uuid.uuid4())
722
- face_path = os.path.join(tmp_dir, f"{uid}_face.jpg")
723
- eye_path = os.path.join(tmp_dir, f"{uid}_eye.jpg")
724
- face_bytes = await face_image.read()
725
- eye_bytes = await eye_image.read()
726
  with open(face_path, "wb") as f:
727
- f.write(face_bytes)
728
  with open(eye_path, "wb") as f:
729
- f.write(eye_bytes)
730
- except Exception as e:
731
- logger.exception("Failed saving uploaded images")
732
- raise HTTPException(status_code=500, detail=f"Failed saving images: {e}")
733
-
734
- try:
735
- # Run VLM (off the event loop)
736
- vlm_features, vlm_raw = await asyncio.to_thread(run_vlm_and_get_features, face_path, eye_path)
737
-
738
- # Prefer sending raw vlm text to LLM (same behavior as process_screening)
739
  llm_input = vlm_raw if vlm_raw else (vlm_features if vlm_features else "{}")
740
-
741
- # Run LLM (off the event loop)
742
- structured_risk = await asyncio.to_thread(run_llm_on_vlm, llm_input)
743
-
744
- # Return merged result
745
  return {
746
  "vlm_features": vlm_features,
747
  "vlm_raw": vlm_raw,
748
  "structured_risk": structured_risk
749
  }
 
750
  except Exception as e:
751
- logger.exception("get_vitals_from_upload pipeline failed")
752
- raise HTTPException(status_code=500, detail=f"Pipeline failed: {e}")
753
 
754
  @app.post("/api/v1/get-vitals/{screening_id}")
755
  async def get_vitals_for_screening(screening_id: str):
756
- """
757
- Re-run VLM->LLM on images already stored for `screening_id` in screenings_db.
758
- Useful for re-processing or debugging.
759
- """
760
  if screening_id not in screenings_db:
761
  raise HTTPException(status_code=404, detail="Screening not found")
762
-
763
  entry = screenings_db[screening_id]
764
  face_path = entry.get("face_image_path")
765
  eye_path = entry.get("eye_image_path")
 
766
  if not (face_path and os.path.exists(face_path) and eye_path and os.path.exists(eye_path)):
767
- raise HTTPException(status_code=400, detail="Stored images missing for this screening")
768
-
769
  try:
770
- # Run VLM off the event loop
771
- vlm_features, vlm_raw = await asyncio.to_thread(run_vlm_and_get_features, face_path, eye_path)
772
-
773
  llm_input = vlm_raw if vlm_raw else (vlm_features if vlm_features else "{}")
774
- structured_risk = await asyncio.to_thread(run_llm_on_vlm, llm_input)
775
-
776
- # Optionally store this run's outputs back into the DB for inspection
777
- entry.setdefault("ai_results", {})
778
- entry["ai_results"].update({
779
  "vlm_features": vlm_features,
780
  "vlm_raw": vlm_raw,
781
  "structured_risk": structured_risk,
782
  "last_vitals_run": datetime.utcnow().isoformat() + "Z"
783
  })
784
-
785
  return {
786
  "screening_id": screening_id,
787
  "vlm_features": vlm_features,
788
  "vlm_raw": vlm_raw,
789
  "structured_risk": structured_risk
790
  }
 
791
  except Exception as e:
792
- logger.exception("get_vitals_for_screening pipeline failed")
793
- raise HTTPException(status_code=500, detail=f"Pipeline failed: {e}")
794
-
795
- # -----------------------
796
- # Main processing pipeline
797
- # -----------------------
798
- async def process_screening(screening_id: str):
799
- """
800
- Main pipeline:
801
- - load images
802
- - quick detector-based quality metrics
803
- - run VLM -> vlm_features (dict or None) + vlm_raw (string)
804
- - run LLM on vlm_raw (preferred) or vlm_features -> structured risk JSON
805
- - merge results into ai_results and finish
806
- """
807
- try:
808
- if screening_id not in screenings_db:
809
- logger.error("[process_screening] screening %s not found", screening_id)
810
- return
811
- screenings_db[screening_id]["status"] = "processing"
812
- logger.info("[process_screening] Starting %s", screening_id)
813
-
814
- entry = screenings_db[screening_id]
815
- face_path = entry.get("face_image_path")
816
- eye_path = entry.get("eye_image_path")
817
-
818
- if not (face_path and os.path.exists(face_path)):
819
- raise RuntimeError("Face image missing")
820
- if not (eye_path and os.path.exists(eye_path)):
821
- raise RuntimeError("Eye image missing")
822
-
823
- face_img = Image.open(face_path).convert("RGB")
824
- eye_img = Image.open(eye_path).convert("RGB")
825
-
826
- # Basic detection + quality metrics (facenet/mtcnn/opencv)
827
- face_detected = False
828
- face_confidence = 0.0
829
- left_eye_coord = right_eye_coord = None
830
-
831
- if mtcnn is not None and not isinstance(mtcnn, dict) and (_MTCNN_IMPL == "facenet_pytorch" or _MTCNN_IMPL == "mtcnn"):
832
- try:
833
- if _MTCNN_IMPL == "facenet_pytorch":
834
- boxes, probs, landmarks = mtcnn.detect(face_img, landmarks=True)
835
- if boxes is not None and len(boxes) > 0:
836
- face_detected = True
837
- face_confidence = float(probs[0]) if probs is not None else 0.0
838
- if landmarks is not None:
839
- lm = landmarks[0]
840
- if len(lm) >= 2:
841
- left_eye_coord = {"x": float(lm[0][0]), "y": float(lm[0][1])}
842
- right_eye_coord = {"x": float(lm[1][0]), "y": float(lm[1][1])}
843
- else:
844
- arr = np.asarray(face_img)
845
- detections = mtcnn.detect_faces(arr)
846
- if detections:
847
- face_detected = True
848
- face_confidence = float(detections[0].get("confidence", 0.0))
849
- k = detections[0].get("keypoints", {})
850
- left_eye_coord = k.get("left_eye")
851
- right_eye_coord = k.get("right_eye")
852
- except Exception:
853
- traceback.print_exc()
854
-
855
- if isinstance(mtcnn, dict) and mtcnn.get("impl") == "opencv":
856
- try:
857
- arr = np.asarray(face_img)
858
- gray = cv2.cvtColor(arr, cv2.COLOR_RGB2GRAY)
859
- face_cascade = mtcnn["face_cascade"]
860
- eye_cascade = mtcnn["eye_cascade"]
861
- faces = face_cascade.detectMultiScale(gray, scaleFactor=1.1, minNeighbors=4, minSize=(60, 60))
862
- if len(faces) > 0:
863
- face_detected = True
864
- (x, y, w, h) = faces[0]
865
- face_confidence = min(1.0, (w*h) / (arr.shape[0]*arr.shape[1]) * 4.0)
866
- roi_gray = gray[y:y+h, x:x+w]
867
- eyes = eye_cascade.detectMultiScale(roi_gray, scaleFactor=1.1, minNeighbors=5, minSize=(20, 10))
868
- if len(eyes) >= 1:
869
- ex, ey, ew, eh = eyes[0]
870
- left_eye_coord = {"x": float(x + ex + ew/2), "y": float(y + ey + eh/2)}
871
- except Exception:
872
- traceback.print_exc()
873
-
874
- face_quality_score = 0.85 if face_detected and face_confidence > 0.6 else 0.45
875
- quality_metrics = {
876
- "face_detected": face_detected,
877
- "face_confidence": round(face_confidence, 3),
878
- "face_quality_score": round(face_quality_score, 2),
879
- "eye_coords": {"left_eye": left_eye_coord, "right_eye": right_eye_coord},
880
- "face_brightness": int(np.mean(np.asarray(face_img.convert("L")))),
881
- "face_blur_estimate": int(np.var(np.asarray(face_img.convert("L"))))
882
- }
883
- screenings_db[screening_id]["quality_metrics"] = quality_metrics
884
-
885
- # --------------------------
886
- # RUN VLM -> get vlm_features + vlm_raw
887
- # --------------------------
888
- vlm_features = None
889
- vlm_raw = None
890
- try:
891
- vlm_features, vlm_raw = run_vlm_and_get_features(face_path, eye_path)
892
- screenings_db[screening_id].setdefault("ai_results", {})
893
- screenings_db[screening_id]["ai_results"].update({
894
- "vlm_features": vlm_features,
895
- "vlm_raw": vlm_raw
896
- })
897
- except Exception as e:
898
- logger.exception("VLM feature extraction failed")
899
- screenings_db[screening_id].setdefault("ai_results", {})
900
- screenings_db[screening_id]["ai_results"].update({"vlm_error": str(e)})
901
- vlm_features = None
902
- vlm_raw = None
903
-
904
- # --------------------------
905
- # RUN LLM on vlm_raw (preferred) or vlm_features -> structured risk JSON
906
- # --------------------------
907
- structured_risk = None
908
- try:
909
- if vlm_raw:
910
- structured_risk = run_llm_on_vlm(vlm_raw)
911
- elif vlm_features:
912
- structured_risk = run_llm_on_vlm(vlm_features)
913
- else:
914
- # Fallback if VLM failed: produce conservative defaults
915
- structured_risk = {
916
- "risk_score": 0.0,
917
- "jaundice_probability": 0.0,
918
- "anemia_probability": 0.0,
919
- "hydration_issue_probability": 0.0,
920
- "neurological_issue_probability": 0.0,
921
- "summary": "",
922
- "recommendation": "",
923
- "confidence": 0.0
924
- }
925
- screenings_db[screening_id].setdefault("ai_results", {})
926
- screenings_db[screening_id]["ai_results"].update({"structured_risk": structured_risk})
927
- except Exception as e:
928
- logger.exception("LLM processing failed")
929
- screenings_db[screening_id].setdefault("ai_results", {})
930
- screenings_db[screening_id]["ai_results"].update({"llm_error": str(e)})
931
- structured_risk = {
932
- "risk_score": 0.0,
933
- "jaundice_probability": 0.0,
934
- "anemia_probability": 0.0,
935
- "hydration_issue_probability": 0.0,
936
- "neurological_issue_probability": 0.0,
937
- "summary": "",
938
- "recommendation": "",
939
- "confidence": 0.0
940
- }
941
-
942
- # Use structured_risk for summary recommendations & simple disease inference placeholders
943
- hem = screenings_db[screening_id]["ai_results"].get("medical_insights", {}).get("hemoglobin_estimate", None)
944
- bil = screenings_db[screening_id]["ai_results"].get("medical_insights", {}).get("bilirubin_estimate", None)
945
-
946
- # Keep older ai_results shape for backward compatibility (if you want)
947
- screenings_db[screening_id].setdefault("ai_results", {})
948
- screenings_db[screening_id]["ai_results"].update({
949
- "processing_time_ms": 1200
950
- })
951
-
952
- # disease_predictions & recommendations can be built from structured_risk if needed
953
- disease_predictions = [
954
- {
955
- "condition": "Anemia-like-signs", # internal tag (not surfaced in LLM summary)
956
- "risk_level": "Medium" if structured_risk.get("anemia_probability", 0.0) > 0.5 else "Low",
957
- "probability": structured_risk.get("anemia_probability", 0.0),
958
- "confidence": structured_risk.get("confidence", 0.0)
959
- },
960
- {
961
- "condition": "Jaundice-like-signs",
962
- "risk_level": "Medium" if structured_risk.get("jaundice_probability", 0.0) > 0.5 else "Low",
963
- "probability": structured_risk.get("jaundice_probability", 0.0),
964
- "confidence": structured_risk.get("confidence", 0.0)
965
- }
966
- ]
967
-
968
- recommendations = {
969
- "action_needed": "consult" if structured_risk.get("risk_score", 0.0) > 30.0 else "monitor",
970
- "message_english": structured_risk.get("recommendation", "") or f"Please follow up with a health professional if concerns persist.",
971
- "message_hindi": "" # could be auto-translated if desired
972
- }
973
-
974
- screenings_db[screening_id].update({
975
- "status": "completed",
976
- "disease_predictions": disease_predictions,
977
- "recommendations": recommendations
978
- })
979
-
980
- logger.info("[process_screening] Completed %s", screening_id)
981
- except Exception as e:
982
- traceback.print_exc()
983
- if screening_id in screenings_db:
984
- screenings_db[screening_id]["status"] = "failed"
985
- screenings_db[screening_id]["error"] = str(e)
986
- else:
987
- logger.error("[process_screening] Failed for unknown screening %s: %s", screening_id, str(e))
988
 
989
- # -----------------------
990
- # Run server (for local debugging)
991
- # -----------------------
992
  if __name__ == "__main__":
993
  import uvicorn
994
- uvicorn.run("app:app", host="0.0.0.0", port=7860, reload=False)
 
 
1
  """
2
+ Elderly HealthWatch AI Backend (FastAPI) - Refactored
3
+ Simplified architecture with same API routes for frontend compatibility.
 
 
 
 
 
 
 
 
 
 
 
 
4
  """
5
 
6
  import io
 
18
  from fastapi.middleware.cors import CORSMiddleware
19
  from PIL import Image
20
  import numpy as np
21
+ import cv2
22
 
 
23
  try:
24
+ from gradio_client import Client, handle_file
25
  GRADIO_AVAILABLE = True
26
  except Exception:
27
  GRADIO_AVAILABLE = False
28
 
29
+ # ============================================================================
30
+ # Configuration
31
+ # ============================================================================
32
  logging.basicConfig(level=logging.INFO)
33
  logger = logging.getLogger("elderly_healthwatch")
34
 
 
35
  GRADIO_VLM_SPACE = os.getenv("GRADIO_SPACE", "developer0hye/Qwen3-VL-8B-Instruct")
36
  LLM_GRADIO_SPACE = os.getenv("LLM_GRADIO_SPACE", "Tonic/med-gpt-oss-20b-demo")
37
  HF_TOKEN = os.getenv("HF_TOKEN", None)
38
 
 
39
# Prompt sent to the VLM when the caller does not supply one.
DEFAULT_VLM_PROMPT = (
    "From the provided face/eye images, compute the required screening features "
    "(pallor, sclera yellowness, redness, mobility metrics, quality checks) "
    "and output a clean JSON feature vector only."
)

# System-level instruction forcing the remote LLM to emit JSON only.
LLM_SYSTEM_PROMPT = (
    "System: This assistant MUST ONLY OUTPUT a single valid JSON object as its response — "
    "no prose, no explanations, no code fences, no annotations."
)

# Developer-level instruction pinning the exact JSON schema expected by
# extract_json_from_llm_output.
LLM_DEVELOPER_PROMPT = (
    "Developer: Output ONLY a single valid JSON object with keys: risk_score, "
    "jaundice_probability, anemia_probability, hydration_issue_probability, "
    "neurological_issue_probability, summary, recommendation, confidence. "
    "Do NOT include any extra fields or natural language outside the JSON object."
)

# Scratch directory for uploaded images; created eagerly at import time.
TMP_DIR = "/tmp/elderly_healthwatch"
os.makedirs(TMP_DIR, exist_ok=True)

# In-memory database keyed by screening_id (contents are lost on restart).
screenings_db: Dict[str, Dict[str, Any]] = {}
62
+
63
+ # ============================================================================
64
+ # Face Detection Setup
65
+ # ============================================================================
66
+ def setup_face_detector():
67
+ """Initialize face detector (MTCNN or OpenCV fallback)"""
68
+ # Try facenet-pytorch MTCNN
69
  try:
70
+ from facenet_pytorch import MTCNN
71
+ return MTCNN(keep_all=False, device="cpu"), "facenet_pytorch"
72
  except Exception:
73
+ pass
74
+
75
+ # Try classic MTCNN
 
 
 
 
 
 
 
 
 
 
 
76
  try:
77
+ from mtcnn import MTCNN
78
+ return MTCNN(), "mtcnn"
79
+ except Exception:
80
+ pass
81
+
82
+ # OpenCV Haar cascade fallback
83
+ try:
84
+ face_path = os.path.join(cv2.data.haarcascades, "haarcascade_frontalface_default.xml")
85
+ eye_path = os.path.join(cv2.data.haarcascades, "haarcascade_eye.xml")
86
+ if os.path.exists(face_path) and os.path.exists(eye_path):
87
  return {
88
  "impl": "opencv",
89
+ "face_cascade": cv2.CascadeClassifier(face_path),
90
+ "eye_cascade": cv2.CascadeClassifier(eye_path)
91
+ }, "opencv"
92
  except Exception:
93
  pass
94
+
95
+ return None, None
 
 
 
 
 
 
 
 
 
 
96
 
97
# Detector chosen once at import time; detector_type is one of
# "facenet_pytorch", "mtcnn", "opencv", or None when nothing is installed.
face_detector, detector_type = setup_face_detector()
 
98
 
99
+ # ============================================================================
100
+ # Utility Functions
101
+ # ============================================================================
102
  def load_image_from_bytes(bytes_data: bytes) -> Image.Image:
103
  return Image.open(io.BytesIO(bytes_data)).convert("RGB")
104
 
105
def normalize_probability(val: Optional[float]) -> float:
    """Map *val* onto [0, 1]; values above 1 are interpreted as percentages.

    None maps to 0.0; anything above 100% saturates at 1.0 and negatives
    clamp to 0.0.
    """
    if val is None:
        return 0.0
    scaled = val / 100.0 if val > 1.0 else val
    return max(0.0, min(1.0, scaled))
114
+
115
def normalize_risk_score(val: Optional[float]) -> float:
    """Clamp a risk score into the 0-100 range, rounded to two decimals.

    Values at or below 1.0 are treated as fractions and scaled by 100;
    None maps to 0.0.
    """
    if val is None:
        return 0.0
    score = val * 100.0 if val <= 1.0 else val
    clamped = min(100.0, max(0.0, score))
    return round(clamped, 2)
122
+
123
+ # ============================================================================
124
+ # Face Detection Functions
125
+ # ============================================================================
126
+ def detect_face_and_eyes(pil_img: Image.Image) -> Dict[str, Any]:
127
+ """Detect face and eyes, return quality metrics"""
128
+ if face_detector is None:
129
+ return {
130
+ "face_detected": False,
131
+ "face_confidence": 0.0,
132
+ "eye_openness_score": 0.0,
133
+ "left_eye": None,
134
+ "right_eye": None
135
+ }
136
+
137
+ img_arr = np.asarray(pil_img)
138
+
139
+ # Facenet-pytorch MTCNN
140
+ if detector_type == "facenet_pytorch":
141
+ try:
142
+ boxes, probs, landmarks = face_detector.detect(pil_img, landmarks=True)
143
+ if boxes is None or len(boxes) == 0:
144
+ return {"face_detected": False, "face_confidence": 0.0, "eye_openness_score": 0.0,
145
+ "left_eye": None, "right_eye": None}
146
+
147
+ confidence = float(probs[0]) if probs is not None else 0.0
148
+ lm = landmarks[0] if landmarks is not None else None
149
+ left_eye = right_eye = None
150
+
151
+ if lm is not None and len(lm) >= 2:
152
+ left_eye = {"x": float(lm[0][0]), "y": float(lm[0][1])}
153
+ right_eye = {"x": float(lm[1][0]), "y": float(lm[1][1])}
154
+
155
+ return {
156
+ "face_detected": True,
157
+ "face_confidence": confidence,
158
+ "eye_openness_score": min(max(confidence * 1.15, 0.0), 1.0),
159
+ "left_eye": left_eye,
160
+ "right_eye": right_eye
161
+ }
162
+ except Exception as e:
163
+ logger.exception("Facenet MTCNN detection failed")
164
+ return {"face_detected": False, "face_confidence": 0.0, "eye_openness_score": 0.0,
165
+ "left_eye": None, "right_eye": None}
166
+
167
+ # Classic MTCNN
168
+ elif detector_type == "mtcnn":
169
+ try:
170
+ detections = face_detector.detect_faces(img_arr)
171
+ if not detections:
172
+ return {"face_detected": False, "face_confidence": 0.0, "eye_openness_score": 0.0,
173
+ "left_eye": None, "right_eye": None}
174
+
175
+ face = detections[0]
176
+ keypoints = face.get("keypoints", {})
177
+ confidence = float(face.get("confidence", 0.0))
178
+
179
+ return {
180
+ "face_detected": True,
181
+ "face_confidence": confidence,
182
+ "eye_openness_score": min(max(confidence * 1.15, 0.0), 1.0),
183
+ "left_eye": keypoints.get("left_eye"),
184
+ "right_eye": keypoints.get("right_eye")
185
+ }
186
+ except Exception as e:
187
+ logger.exception("Classic MTCNN detection failed")
188
+ return {"face_detected": False, "face_confidence": 0.0, "eye_openness_score": 0.0,
189
+ "left_eye": None, "right_eye": None}
190
+
191
+ # OpenCV fallback
192
+ elif detector_type == "opencv":
193
+ try:
194
+ gray = cv2.cvtColor(img_arr, cv2.COLOR_RGB2GRAY)
195
+ faces = face_detector["face_cascade"].detectMultiScale(
196
+ gray, scaleFactor=1.1, minNeighbors=4, minSize=(60, 60)
197
+ )
198
+
199
+ if len(faces) == 0:
200
+ return {"face_detected": False, "face_confidence": 0.0, "eye_openness_score": 0.0,
201
+ "left_eye": None, "right_eye": None}
202
+
203
+ (x, y, w, h) = faces[0]
204
+ roi_gray = gray[y:y+h, x:x+w]
205
+ eyes = face_detector["eye_cascade"].detectMultiScale(
206
+ roi_gray, scaleFactor=1.1, minNeighbors=5, minSize=(20, 10)
207
+ )
208
+
209
+ eye_openness = 1.0 if len(eyes) >= 1 else 0.0
210
+ left_eye = None
211
+
212
+ if len(eyes) >= 1:
213
+ ex, ey, ew, eh = eyes[0]
214
+ left_eye = {"x": float(x + ex + ew/2), "y": float(y + ey + eh/2)}
215
+
216
+ confidence = min(1.0, (w*h) / (img_arr.shape[0]*img_arr.shape[1]) * 4.0)
217
+
218
+ return {
219
+ "face_detected": True,
220
+ "face_confidence": confidence,
221
+ "eye_openness_score": eye_openness,
222
+ "left_eye": left_eye,
223
+ "right_eye": None
224
+ }
225
+ except Exception as e:
226
+ logger.exception("OpenCV detection failed")
227
+ return {"face_detected": False, "face_confidence": 0.0, "eye_openness_score": 0.0,
228
+ "left_eye": None, "right_eye": None}
229
+
230
+ return {"face_detected": False, "face_confidence": 0.0, "eye_openness_score": 0.0,
231
+ "left_eye": None, "right_eye": None}
232
+
233
+ # ============================================================================
234
+ # JSON Extraction from LLM Output
235
+ # ============================================================================
236
+ def extract_json_from_llm_output(raw_text: str) -> Dict[str, Any]:
237
+ """Extract and normalize JSON from LLM output using regex"""
238
  match = re.search(r"\{[\s\S]*\}", raw_text)
239
  if not match:
240
  raise ValueError("No JSON-like block found in LLM output")
241
+
242
  block = match.group(0)
243
+
244
+ def find_number(key: str) -> Optional[float]:
 
 
 
 
 
 
245
  patterns = [
246
+ rf'"{key}"\s*:\s*["\']?\s*([-+]?\d+(\.\d+)?)\s*%?\s*["\']?',
247
  rf"'{key}'\s*:\s*['\"]?\s*([-+]?\d+(\.\d+)?)\s*%?\s*['\"]?",
248
+ rf'\b{key}\b\s*:\s*["\']?\s*([-+]?\d+(\.\d+)?)\s*%?\s*["\']?',
 
 
249
  ]
250
  for pat in patterns:
251
  m = re.search(pat, block, flags=re.IGNORECASE)
252
+ if m and m.group(1):
253
+ try:
254
+ return float(m.group(1).replace("%", "").strip())
255
+ except Exception:
256
+ pass
 
 
 
 
 
 
 
 
 
 
257
  return None
258
+
259
+ def find_text(key: str) -> str:
 
260
  m = re.search(rf'"{key}"\s*:\s*"([^"]*)"', block, flags=re.IGNORECASE)
261
  if m:
262
  return m.group(1).strip()
263
  m = re.search(rf"'{key}'\s*:\s*'([^']*)'", block, flags=re.IGNORECASE)
264
  if m:
265
  return m.group(1).strip()
 
266
  m = re.search(rf'\b{key}\b\s*:\s*([^\n,}}]+)', block, flags=re.IGNORECASE)
267
  if m:
268
  return m.group(1).strip().strip('",')
269
  return ""
270
+
271
+ return {
272
+ "risk_score": normalize_risk_score(find_number("risk_score")),
273
+ "jaundice_probability": round(normalize_probability(find_number("jaundice_probability")), 4),
274
+ "anemia_probability": round(normalize_probability(find_number("anemia_probability")), 4),
275
+ "hydration_issue_probability": round(normalize_probability(find_number("hydration_issue_probability")), 4),
276
+ "neurological_issue_probability": round(normalize_probability(find_number("neurological_issue_probability")), 4),
277
+ "confidence": round(normalize_probability(find_number("confidence")), 4),
278
+ "summary": find_text("summary"),
279
+ "recommendation": find_text("recommendation")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
280
  }
 
281
 
282
+ # ============================================================================
283
+ # VLM & LLM Integration
284
+ # ============================================================================
285
+ def get_gradio_client(space: str) -> Client:
286
+ """Get Gradio client with optional auth"""
287
  if not GRADIO_AVAILABLE:
288
+ raise RuntimeError("gradio_client not installed")
289
+ return Client(space, hf_token=HF_TOKEN) if HF_TOKEN else Client(space)
290
+
291
def call_vlm(face_path: str, eye_path: str, prompt: Optional[str] = None) -> Tuple[Optional[Dict], str]:
    """Query the remote VLM Space with both images.

    Returns (parsed_features, raw_text): parsed_features is a dict when the
    reply contains parseable JSON, otherwise None; raw_text is always the
    textual reply.
    """
    effective_prompt = prompt or DEFAULT_VLM_PROMPT

    if not (os.path.exists(face_path) and os.path.exists(eye_path)):
        raise FileNotFoundError("Face or eye image path missing")

    client = get_gradio_client(GRADIO_VLM_SPACE)
    message = {"text": effective_prompt, "files": [handle_file(face_path), handle_file(eye_path)]}

    try:
        logger.info("Calling VLM Space: %s", GRADIO_VLM_SPACE)
        result = client.predict(message=message, history=[], api_name="/chat_fn")
    except Exception as e:
        logger.exception("VLM call failed")
        raise RuntimeError(f"VLM call failed: {e}")

    # Normalize the Space's reply into a dict-like payload.
    if isinstance(result, (list, tuple)):
        payload = result[0]  # NOTE(review): assumes a non-empty sequence — confirm
    elif isinstance(result, dict):
        payload = result
    else:
        payload = {"text": str(result)}

    raw_text = payload.get("text") or payload.get("output") or json.dumps(payload)

    # Best effort: parse the whole reply as JSON, else the outermost {...} span.
    parsed: Optional[Dict] = None
    try:
        candidate = json.loads(raw_text)
        parsed = candidate if isinstance(candidate, dict) else None
    except Exception:
        start = raw_text.find("{")
        end = raw_text.rfind("}")
        if start != -1 and end > start:
            try:
                candidate = json.loads(raw_text[start:end + 1])
                parsed = candidate if isinstance(candidate, dict) else None
            except Exception:
                parsed = None

    return parsed, raw_text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
337
 
338
def call_llm(vlm_output: Any) -> Dict[str, Any]:
    """Call LLM with VLM output and return structured risk assessment.

    Sends the VLM text (or JSON-serialized features) to the remote Gradio
    LLM Space with strict JSON-only prompting, then parses the reply with
    extract_json_from_llm_output. Raises RuntimeError on any failure.
    """
    if not GRADIO_AVAILABLE:
        raise RuntimeError("gradio_client not installed")

    client = get_gradio_client(LLM_GRADIO_SPACE)

    # Prepare input: pass strings through unchanged, serialize anything else.
    vlm_text = vlm_output if isinstance(vlm_output, str) else json.dumps(vlm_output, default=str)

    instruction = (
        "\n\nSTRICT INSTRUCTIONS:\n"
        "1) OUTPUT ONLY a single valid JSON object — no prose, no code fences.\n"
        "2) Include keys: risk_score, jaundice_probability, anemia_probability, "
        "hydration_issue_probability, neurological_issue_probability, summary, recommendation, confidence.\n"
        "3) Use numeric values for probabilities (0-1) and risk_score (0-100).\n"
        "4) Use neutral wording in summary/recommendation.\n\n"
        "VLM Output:\n" + vlm_text + "\n"
    )

    # Call with safe defaults
    try:
        logger.info("Calling LLM Space: %s", LLM_GRADIO_SPACE)
        result = client.predict(
            input_data=instruction,
            max_new_tokens=1024.0,  # Gradio numeric inputs arrive as floats
            model_identity=os.getenv("LLM_MODEL_IDENTITY", "GPT-Tonic"),
            system_prompt=LLM_SYSTEM_PROMPT,
            developer_prompt=LLM_DEVELOPER_PROMPT,
            reasoning_effort="medium",
            temperature=0.2,
            top_p=0.9,
            top_k=50,
            repetition_penalty=1.0,
            api_name="/chat"
        )

        # The Space may return structured data or plain text; keep both as text.
        text_out = json.dumps(result) if isinstance(result, (dict, list)) else str(result)
        logger.info("LLM raw output:\n%s", text_out)

        parsed = extract_json_from_llm_output(text_out)
        logger.info("LLM parsed JSON:\n%s", json.dumps(parsed, indent=2))

        return parsed

    except Exception as e:
        logger.exception("LLM call failed")
        raise RuntimeError(f"LLM call failed: {e}")
386
+
387
# ============================================================================
# Background Processing
# ============================================================================
async def process_screening(screening_id: str):
    """Main processing pipeline for one screening.

    Steps: local face-detection quality metrics, then VLM feature
    extraction, then LLM risk structuring; all outcomes (including
    failures) are written back into screenings_db[screening_id]. Runs as
    a FastAPI background task, so errors are recorded instead of raised.
    """
    try:
        if screening_id not in screenings_db:
            logger.error("Screening %s not found", screening_id)
            return

        screenings_db[screening_id]["status"] = "processing"
        logger.info("Starting processing for %s", screening_id)

        entry = screenings_db[screening_id]
        face_path = entry["face_image_path"]
        eye_path = entry["eye_image_path"]

        # Load images and get quality metrics
        face_img = Image.open(face_path).convert("RGB")
        detection_result = detect_face_and_eyes(face_img)

        quality_metrics = {
            "face_detected": detection_result["face_detected"],
            "face_confidence": round(detection_result["face_confidence"], 3),
            # Coarse two-level score driven solely by detection success.
            "face_quality_score": 0.85 if detection_result["face_detected"] else 0.45,
            "eye_coords": {
                "left_eye": detection_result["left_eye"],
                "right_eye": detection_result["right_eye"]
            },
            # Grayscale mean/variance used as brightness and blur proxies.
            "face_brightness": int(np.mean(np.asarray(face_img.convert("L")))),
            "face_blur_estimate": int(np.var(np.asarray(face_img.convert("L"))))
        }
        screenings_db[screening_id]["quality_metrics"] = quality_metrics

        # Call VLM in a worker thread (gradio_client is blocking)
        vlm_features, vlm_raw = await asyncio.to_thread(call_vlm, face_path, eye_path)

        # Call LLM — prefer the raw VLM text, fall back to parsed features
        llm_input = vlm_raw if vlm_raw else (vlm_features if vlm_features else "{}")
        structured_risk = await asyncio.to_thread(call_llm, llm_input)

        # Store results
        screenings_db[screening_id]["ai_results"] = {
            "vlm_features": vlm_features,
            "vlm_raw": vlm_raw,
            "structured_risk": structured_risk,
            "processing_time_ms": 1200  # fixed placeholder, not measured
        }

        # Build disease predictions
        disease_predictions = [
            {
                "condition": "Anemia-like-signs",
                "risk_level": "Medium" if structured_risk["anemia_probability"] > 0.5 else "Low",
                "probability": structured_risk["anemia_probability"],
                "confidence": structured_risk["confidence"]
            },
            {
                "condition": "Jaundice-like-signs",
                "risk_level": "Medium" if structured_risk["jaundice_probability"] > 0.5 else "Low",
                "probability": structured_risk["jaundice_probability"],
                "confidence": structured_risk["confidence"]
            }
        ]

        recommendations = {
            # risk_score is on a 0-100 scale (see normalize_risk_score).
            "action_needed": "consult" if structured_risk["risk_score"] > 30.0 else "monitor",
            "message_english": structured_risk["recommendation"] or "Please follow up with a health professional if concerns persist.",
            "message_hindi": ""
        }

        screenings_db[screening_id].update({
            "status": "completed",
            "disease_predictions": disease_predictions,
            "recommendations": recommendations
        })

        logger.info("Completed processing for %s", screening_id)

    except Exception as e:
        logger.exception("Processing failed for %s", screening_id)
        if screening_id in screenings_db:
            screenings_db[screening_id]["status"] = "failed"
            screenings_db[screening_id]["error"] = str(e)
471
+
472
# ============================================================================
# FastAPI App & Routes
# ============================================================================
app = FastAPI(title="Elderly HealthWatch AI Backend")
# Wide-open CORS so any web/mobile frontend origin may call the API.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)
483
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
484
@app.get("/")
async def read_root():
    """Root endpoint: return a simple service identification banner."""
    return {"message": "Elderly HealthWatch AI Backend"}
487
 
488
@app.get("/health")
async def health_check():
    """Liveness probe.

    Reports the active face-detector backend and whether the gradio_client
    library (used to reach the remote VLM/LLM Spaces) imported successfully.
    """
    return {
        "status": "healthy",
        # detector_type is set during startup; "none" when no detector loaded.
        "detector": detector_type or "none",
        # True only if gradio_client imported at module load (GRADIO_AVAILABLE).
        "vlm_available": GRADIO_AVAILABLE,
        "vlm_space": GRADIO_VLM_SPACE,
        "llm_space": LLM_GRADIO_SPACE
    }
497
 
498
@app.post("/api/v1/validate-eye-photo")
async def validate_eye_photo(image: UploadFile = File(...)):
    """Validate eye photo quality.

    Runs face/eye detection on the uploaded image and checks that the eyes
    are sufficiently open (openness score >= 0.3). Returns bilingual
    (English/Hindi) guidance messages plus the detected eye landmarks.

    Raises:
        HTTPException 400: the uploaded file is empty.
        HTTPException 500: no face detector is configured, or an unexpected
            processing error occurred.
    """
    if face_detector is None:
        raise HTTPException(status_code=500, detail="No face detector available")

    try:
        content = await image.read()
        if not content:
            raise HTTPException(status_code=400, detail="Empty file")

        pil_img = load_image_from_bytes(content)
        result = detect_face_and_eyes(pil_img)

        if not result["face_detected"]:
            return {
                "valid": False,
                "face_detected": False,
                "eye_openness_score": 0.0,
                "message_english": "No face detected. Please ensure your face is clearly visible.",
                "message_hindi": "कोई चेहरा नहीं मिला। कृपया सुनिश्चित करें कि आपका चेहरा स्पष्ट रूप से दिखाई दे।"
            }

        # Threshold chosen by the original author; 0.3 = minimally open eyes.
        is_valid = result["eye_openness_score"] >= 0.3

        return {
            "valid": is_valid,
            "face_detected": True,
            "eye_openness_score": round(result["eye_openness_score"], 2),
            "message_english": "Photo looks good! Eyes are properly open." if is_valid
            else "Eyes appear closed. Please open your eyes wide and try again.",
            "message_hindi": "फोटो अच्छी है! आंखें ठीक से खुली हैं।" if is_valid
            else "आंखें बंद दिखाई दे रही हैं। कृपया अपनी आंखें चौड़ी खोलें।",
            "eye_landmarks": {
                "left_eye": result["left_eye"],
                "right_eye": result["right_eye"]
            }
        }

    except HTTPException:
        # Bug fix: without this pass-through the 400 "Empty file" exception
        # raised above was caught by the broad handler below and re-raised
        # as a generic 500. Let FastAPI's own exceptions propagate intact.
        raise
    except Exception as e:
        logger.exception("Validation failed")
        raise HTTPException(status_code=500, detail=str(e))
 
 
 
540
 
541
@app.post("/api/v1/upload")
async def upload_images(
    background_tasks: BackgroundTasks,
    face_image: UploadFile = File(...),
    eye_image: UploadFile = File(...)
):
    """Upload face/eye images and enqueue background processing.

    Persists both images under TMP_DIR, registers a "queued" screening
    record in the in-memory store, and schedules process_screening().
    Returns the new screening_id.
    """
    try:
        screening_id = str(uuid.uuid4())

        face_path = os.path.join(TMP_DIR, f"{screening_id}_face.jpg")
        eye_path = os.path.join(TMP_DIR, f"{screening_id}_eye.jpg")

        # Save both uploads to disk so the background task can read them.
        for upload, dest in ((face_image, face_path), (eye_image, eye_path)):
            payload = await upload.read()
            with open(dest, "wb") as fh:
                fh.write(payload)

        screenings_db[screening_id] = {
            "id": screening_id,
            "timestamp": datetime.utcnow().isoformat() + "Z",
            "face_image_path": face_path,
            "eye_image_path": eye_path,
            "status": "queued",
            "ai_results": {},
            "disease_predictions": [],
            "recommendations": {}
        }

        background_tasks.add_task(process_screening, screening_id)

        return {"screening_id": screening_id}

    except Exception as e:
        logger.exception("Upload failed")
        raise HTTPException(status_code=500, detail=str(e))
578
 
579
@app.post("/api/v1/analyze/{screening_id}")
async def analyze_screening(screening_id: str, background_tasks: BackgroundTasks):
    """Re-enqueue an existing screening for analysis.

    Returns 404 for unknown ids; a no-op message when already processing.
    """
    record = screenings_db.get(screening_id)
    if record is None:
        raise HTTPException(status_code=404, detail="Screening not found")

    if record["status"] == "processing":
        return {"message": "Already processing"}

    record["status"] = "queued"
    background_tasks.add_task(process_screening, screening_id)

    return {"message": "Analysis enqueued"}
592
 
593
@app.get("/api/v1/status/{screening_id}")
async def get_status(screening_id: str):
    """Report processing status with a coarse progress percentage."""
    if screening_id not in screenings_db:
        raise HTTPException(status_code=404, detail="Screening not found")

    status = screenings_db[screening_id]["status"]
    # Coarse mapping: completed=100, processing=50, anything else (queued/failed)=0.
    if status == "completed":
        progress = 100
    elif status == "processing":
        progress = 50
    else:
        progress = 0

    return {"screening_id": screening_id, "status": status, "progress": progress}
603
 
604
@app.get("/api/v1/results/{screening_id}")
async def get_results(screening_id: str):
    """Return the full stored screening record, or 404 if unknown."""
    try:
        return screenings_db[screening_id]
    except KeyError:
        raise HTTPException(status_code=404, detail="Screening not found")
611
 
612
@app.get("/api/v1/history/{user_id}")
async def get_history(user_id: str):
    """List all stored screenings whose user_id matches the given id."""
    matching = [
        record for record in screenings_db.values()
        if record.get("user_id") == user_id
    ]
    return {"screenings": matching}
617
 
 
 
 
618
@app.post("/api/v1/get-vitals")
async def get_vitals_from_upload(
    face_image: UploadFile = File(...),
    eye_image: UploadFile = File(...)
):
    """Synchronous VLM + LLM pipeline.

    Saves the uploaded face/eye images to temporary files, runs the remote
    VLM then LLM once, and returns the raw and structured results directly.
    Nothing is persisted in screenings_db.

    Raises:
        HTTPException 500: gradio_client is unavailable or processing failed.
    """
    if not GRADIO_AVAILABLE:
        raise HTTPException(status_code=500, detail="VLM/LLM not available")

    uid = str(uuid.uuid4())
    face_path = os.path.join(TMP_DIR, f"{uid}_face.jpg")
    eye_path = os.path.join(TMP_DIR, f"{uid}_eye.jpg")

    try:
        with open(face_path, "wb") as f:
            f.write(await face_image.read())
        with open(eye_path, "wb") as f:
            f.write(await eye_image.read())

        # Run the blocking gradio_client calls off the event loop.
        vlm_features, vlm_raw = await asyncio.to_thread(call_vlm, face_path, eye_path)

        # Prefer raw VLM text; fall back to parsed features, then empty JSON.
        llm_input = vlm_raw if vlm_raw else (vlm_features if vlm_features else "{}")
        structured_risk = await asyncio.to_thread(call_llm, llm_input)

        return {
            "vlm_features": vlm_features,
            "vlm_raw": vlm_raw,
            "structured_risk": structured_risk
        }

    except Exception as e:
        logger.exception("Get vitals failed")
        raise HTTPException(status_code=500, detail=str(e))
    finally:
        # Fix: these temp files were never deleted, leaking disk space on
        # every call (unlike /upload, no record retains these paths).
        for path in (face_path, eye_path):
            try:
                os.remove(path)
            except OSError:
                pass
650
 
651
@app.post("/api/v1/get-vitals/{screening_id}")
async def get_vitals_for_screening(screening_id: str):
    """Re-run the VLM + LLM pipeline on an already-uploaded screening.

    Looks up the stored image paths, re-invokes the remote models, merges
    the output into the record's ai_results, and returns the fresh results.
    """
    if screening_id not in screenings_db:
        raise HTTPException(status_code=404, detail="Screening not found")

    entry = screenings_db[screening_id]
    face_path = entry.get("face_image_path")
    eye_path = entry.get("eye_image_path")

    images_present = (
        face_path and os.path.exists(face_path)
        and eye_path and os.path.exists(eye_path)
    )
    if not images_present:
        raise HTTPException(status_code=400, detail="Images missing")

    try:
        # Blocking remote calls run in a worker thread.
        vlm_features, vlm_raw = await asyncio.to_thread(call_vlm, face_path, eye_path)

        # Prefer raw VLM text, then parsed features, then empty JSON object.
        llm_input = vlm_raw or (vlm_features or "{}")
        structured_risk = await asyncio.to_thread(call_llm, llm_input)

        entry.setdefault("ai_results", {}).update({
            "vlm_features": vlm_features,
            "vlm_raw": vlm_raw,
            "structured_risk": structured_risk,
            "last_vitals_run": datetime.utcnow().isoformat() + "Z"
        })

        return {
            "screening_id": screening_id,
            "vlm_features": vlm_features,
            "vlm_raw": vlm_raw,
            "structured_risk": structured_risk
        }

    except Exception as e:
        logger.exception("Get vitals for screening failed")
        raise HTTPException(status_code=500, detail=str(e))
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
686
 
 
 
 
687
  if __name__ == "__main__":
688
  import uvicorn
689
+ uvicorn.run("app:app", host="0.0.0.0", port=7860, reload=