dpv007 commited on
Commit
7dedfff
·
verified ·
1 Parent(s): a83b25f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +111 -791
app.py CHANGED
@@ -1,4 +1,3 @@
1
- # app.py
2
  """
3
  Elderly HealthWatch AI Backend (FastAPI)
4
  Pipeline:
@@ -15,6 +14,7 @@ Notes:
15
  * always returns raw VLM output in API responses,
16
  * extracts JSON from VLM via regex when possible, and
17
  * sends only the face image to the VLM (not the eye image).
 
18
  """
19
 
20
  import io
@@ -51,6 +51,7 @@ logger = logging.getLogger("elderly_healthwatch")
51
  GRADIO_VLM_SPACE = os.getenv("GRADIO_SPACE", "developer0hye/Qwen3-VL-8B-Instruct")
52
  LLM_GRADIO_SPACE = os.getenv("LLM_GRADIO_SPACE", "Tonic/med-gpt-oss-20b-demo")
53
  HF_TOKEN = os.getenv("HF_TOKEN", None)
 
54
 
55
  # Default VLM prompt
56
  DEFAULT_VLM_PROMPT = (
@@ -245,6 +246,74 @@ def extract_json_via_regex(raw_text: str) -> Dict[str, Any]:
245
  }
246
  return out
247
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
248
  # -----------------------
249
  # Gradio / VLM helper (sends only face image, returns meta)
250
  # -----------------------
@@ -256,58 +325,77 @@ def get_gradio_client_for_space(space: str) -> Client:
256
  return Client(space)
257
 
258
  def run_vlm_and_get_features(face_path: str, eye_path: Optional[str] = None, prompt: Optional[str] = None,
259
- raise_on_file_delivery_failure: bool = False
 
260
  ) -> Tuple[Optional[Dict[str, Any]], str, Dict[str, Any]]:
261
  """
262
- Synchronous call to remote VLM (gradio /chat_fn). Sends ONLY the face image file.
 
263
  Returns tuple: (parsed_features_dict_or_None, raw_text_response_str, meta)
264
  meta includes:
265
  - vlm_file_delivery_ok (bool) # expects ≥1 file acknowledged (face)
266
  - vlm_files_seen (int or None)
267
  - vlm_raw_len (int)
268
  - vlm_out_object (short repr)
 
269
  """
270
  prompt = prompt or DEFAULT_VLM_PROMPT
271
 
272
 
273
  if not os.path.exists(face_path):
274
  raise FileNotFoundError(f"Face image not found at: {face_path}")
275
- if not os.path.exists(eye_path):
276
  raise FileNotFoundError(f"Eye image not found at: {eye_path}")
277
 
278
  face_size = os.path.getsize(face_path)
279
- eye_size = os.path.getsize(eye_path)
280
- logger.info(f"VLM input files - Face: {face_size} bytes, Eye: {eye_size} bytes")
281
 
282
- if face_size == 0 or eye_size == 0:
283
- raise ValueError("One or both images are empty (0 bytes)")
284
 
285
  if not GRADIO_AVAILABLE:
286
  raise RuntimeError("gradio_client not available in this environment.")
287
 
288
- client = get_gradio_client_for_space(GRADIO_VLM_SPACE)
289
-
290
- # Verify files can be opened as images
291
  try:
292
  Image.open(face_path).verify()
293
- Image.open(eye_path).verify()
294
- logger.info("Both images verified as valid")
295
  except Exception as e:
296
- raise ValueError(f"Invalid image file(s): {e}")
297
 
298
- message = {"text": prompt, "files": [handle_file(face_path), handle_file(eye_path)]}
299
-
300
- logger.info(f"Calling VLM with message structure: text={len(prompt)} chars, files=2")
301
  client = get_gradio_client_for_space(GRADIO_VLM_SPACE)
302
- # NOTE: only send face image to the Space
303
-
304
- message = {"text": prompt, "files": [handle_file(face_path)]}
 
 
 
 
305
 
306
- meta: Dict[str, Any] = {"vlm_file_delivery_ok": False, "vlm_files_seen": None, "vlm_raw_len": 0, "vlm_out_object": None}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
307
 
308
  # SINGLE CALL (no retries)
309
  try:
310
- logger.info("Calling VLM Space %s with 1 file (face only)", GRADIO_VLM_SPACE)
311
  result = client.predict(message=message, history=[], api_name="/chat_fn")
312
  except Exception as e:
313
  logger.exception("VLM call failed (no retries)")
@@ -407,772 +495,4 @@ def run_llm_on_vlm(vlm_features_or_raw: Any,
407
  Call the remote LLM Space's /chat endpoint with defensive input handling and a single retry.
408
  - Logs the VLM raw string and the chosen payload.
409
  - Sends cleaned JSON (json.dumps(vlm_features)) if vlm_features_or_raw is dict, else sends raw string.
410
- - Uses regex to extract the final JSON from LLM raw output.
411
- """
412
- if not GRADIO_AVAILABLE:
413
- raise RuntimeError("gradio_client not installed. Add gradio_client to requirements.txt")
414
-
415
- # Try to import AppError for specific handling; fallback to Exception if unavailable
416
- try:
417
- from gradio_client import AppError # type: ignore
418
- except Exception:
419
- AppError = Exception # fallback
420
-
421
- client = get_gradio_client_for_space(LLM_GRADIO_SPACE)
422
- model_identity = model_identity or LLM_MODEL_IDENTITY
423
- system_prompt = system_prompt or LLM_SYSTEM_PROMPT
424
- developer_prompt = developer_prompt or LLM_DEVELOPER_PROMPT
425
-
426
- # Decide what to send to LLM and log the raw input
427
- if isinstance(vlm_features_or_raw, str):
428
- vlm_raw_str = vlm_features_or_raw
429
- logger.info("LLM input will be RAW VLM STRING (len=%d)", len(vlm_raw_str or ""))
430
- vlm_json_str_to_send = vlm_raw_str if vlm_raw_str and vlm_raw_str.strip() else "{}"
431
- else:
432
- vlm_raw_str = json.dumps(vlm_features_or_raw, ensure_ascii=False) if vlm_features_or_raw else "{}"
433
- logger.info("LLM input will be CLEANED VLM JSON (len=%d)", len(vlm_raw_str))
434
- vlm_json_str_to_send = vlm_raw_str
435
-
436
- # Build instruction payload
437
- instruction = (
438
- "\n\nSTRICT INSTRUCTIONS (READ CAREFULLY):\n"
439
- "1) OUTPUT ONLY a single valid JSON object and nothing else — no prose, no explanation, no code fences.\n"
440
- "2) The JSON MUST include these keys: risk_score, jaundice_probability, anemia_probability, "
441
- "hydration_issue_probability, neurological_issue_probability, summary, recommendation, confidence.\n"
442
- "3) Use numeric values for probabilities (0..1) and for risk_score (0..100). Use strings for summary and recommendation.\n"
443
- "4) Do NOT mention disease names in summary or recommendation; use neutral wording only.\n"
444
- "If you cannot estimate a value, set it to null.\n\n"
445
- "Now, based on the VLM output below, produce ONLY the JSON object described above.\n\n"
446
- "===BEGIN VLM OUTPUT===\n"
447
- f"{vlm_json_str_to_send}\n"
448
- "===END VLM OUTPUT===\n\n"
449
- )
450
-
451
- # Defensive coercion / clamps
452
- try_max_new_tokens = int(max_new_tokens) if max_new_tokens is not None else 1024
453
- if try_max_new_tokens <= 0:
454
- try_max_new_tokens = 1024
455
-
456
- try_temperature = float(temperature) if temperature is not None else 0.0
457
- # Some Spaces validate temperature >= 0.1
458
- if try_temperature < 0.1:
459
- try_temperature = 0.1
460
-
461
- predict_kwargs = dict(
462
- input_data=instruction,
463
- max_new_tokens=float(try_max_new_tokens),
464
- model_identity=model_identity,
465
- system_prompt=system_prompt,
466
- developer_prompt=developer_prompt,
467
- reasoning_effort=reasoning_effort,
468
- temperature=float(try_temperature),
469
- top_p=0.9,
470
- top_k=50,
471
- repetition_penalty=1.0,
472
- api_name="/chat"
473
- )
474
-
475
- last_exc = None
476
- for attempt in (1, 2):
477
- try:
478
- logger.info("Calling LLM Space %s (attempt %d) with temperature=%s, max_new_tokens=%s",
479
- LLM_GRADIO_SPACE, attempt, predict_kwargs.get("temperature"), predict_kwargs.get("max_new_tokens"))
480
- result = client.predict(**predict_kwargs)
481
-
482
- # normalize to string
483
- if isinstance(result, (dict, list)):
484
- text_out = json.dumps(result)
485
- else:
486
- text_out = str(result)
487
-
488
- if not text_out or len(text_out.strip()) == 0:
489
- raise RuntimeError("LLM returned empty response")
490
-
491
- logger.info("LLM raw output (len=%d):\n%s", len(text_out or ""), (text_out[:2000] + "...") if len(text_out) > 2000 else text_out)
492
-
493
- # parse with regex extractor (may raise)
494
- parsed = None
495
- try:
496
- parsed = extract_json_via_regex(text_out)
497
- except Exception:
498
- # fallback: attempt json.loads naive
499
- try:
500
- parsed = json.loads(text_out)
501
- if not isinstance(parsed, dict):
502
- parsed = None
503
- except Exception:
504
- parsed = None
505
-
506
- if parsed is None:
507
- raise ValueError("Failed to extract JSON from LLM output")
508
-
509
- # pretty log parsed JSON
510
- try:
511
- logger.info("LLM parsed JSON:\n%s", json.dumps(parsed, indent=2, ensure_ascii=False))
512
- except Exception:
513
- logger.info("LLM parsed JSON (raw dict): %s", str(parsed))
514
-
515
- # defensive clamps (same as extractor expectations)
516
- def safe_prob(val):
517
- try:
518
- v = float(val)
519
- return max(0.0, min(1.0, v))
520
- except Exception:
521
- return 0.0
522
-
523
- for k in [
524
- "jaundice_probability",
525
- "anemia_probability",
526
- "hydration_issue_probability",
527
- "neurological_issue_probability"
528
- ]:
529
- parsed[k] = safe_prob(parsed.get(k, 0.0))
530
-
531
- try:
532
- rs = float(parsed.get("risk_score", 0.0))
533
- parsed["risk_score"] = round(max(0.0, min(100.0, rs)), 2)
534
- except Exception:
535
- parsed["risk_score"] = 0.0
536
-
537
- parsed["confidence"] = safe_prob(parsed.get("confidence", 0.0))
538
- parsed["summary"] = str(parsed.get("summary", "") or "").strip()
539
- parsed["recommendation"] = str(parsed.get("recommendation", "") or "").strip()
540
-
541
- for k in [
542
- "jaundice_probability",
543
- "anemia_probability",
544
- "hydration_issue_probability",
545
- "neurological_issue_probability",
546
- "confidence",
547
- "risk_score"
548
- ]:
549
- parsed[f"{k}_was_missing"] = False
550
-
551
- return parsed
552
-
553
- except AppError as app_e:
554
- logger.exception("LLM AppError (remote validation failed) on attempt %d: %s", attempt, str(app_e))
555
- last_exc = app_e
556
- if attempt == 1:
557
- predict_kwargs["temperature"] = 0.2
558
- predict_kwargs["max_new_tokens"] = float(512)
559
- logger.info("Retrying LLM call with temperature=0.2 and max_new_tokens=512")
560
- continue
561
- else:
562
- raise RuntimeError(f"LLM call failed (AppError): {app_e}")
563
- except Exception as e:
564
- logger.exception("LLM call failed on attempt %d: %s", attempt, str(e))
565
- last_exc = e
566
- if attempt == 1:
567
- predict_kwargs["temperature"] = 0.2
568
- predict_kwargs["max_new_tokens"] = float(512)
569
- continue
570
- raise RuntimeError(f"LLM call failed: {e}")
571
-
572
- raise RuntimeError(f"LLM call ultimately failed: {last_exc}")
573
-
574
- # -----------------------
575
- # API endpoints
576
- # -----------------------
577
- @app.get("/")
578
- async def read_root():
579
- return {"message": "Elderly HealthWatch AI Backend"}
580
-
581
- @app.get("/health")
582
- async def health_check():
583
- impl = None
584
- if mtcnn is None:
585
- impl = "none"
586
- elif isinstance(mtcnn, dict) and mtcnn.get("impl") == "opencv":
587
- impl = "opencv_haar_fallback"
588
- else:
589
- impl = _MTCNN_IMPL
590
- return {
591
- "status": "healthy",
592
- "detector": impl,
593
- "vlm_available": GRADIO_AVAILABLE,
594
- "vlm_space": GRADIO_VLM_SPACE,
595
- "llm_space": LLM_GRADIO_SPACE
596
- }
597
-
598
- @app.post("/api/v1/validate-eye-photo")
599
- async def validate_eye_photo(image: UploadFile = File(...)):
600
- if mtcnn is None:
601
- raise HTTPException(status_code=500, detail="No face detector available in this deployment.")
602
- try:
603
- content = await image.read()
604
- if not content:
605
- raise HTTPException(status_code=400, detail="Empty file uploaded.")
606
- pil_img = load_image_from_bytes(content)
607
- img_arr = np.asarray(pil_img) # RGB
608
-
609
- if not isinstance(mtcnn, dict) and _MTCNN_IMPL == "facenet_pytorch":
610
- try:
611
- boxes, probs, landmarks = mtcnn.detect(pil_img, landmarks=True)
612
- if boxes is None or len(boxes) == 0:
613
- return {"valid": False, "face_detected": False, "eye_openness_score": 0.0,
614
- "message_english": "No face detected. Please ensure your face is clearly visible in the frame.",
615
- "message_hindi": "कोई चेहरा नहीं मिला। कृपया सुनिश्चित करें कि आपका चेहरा फ्रेम में स्पष्ट रूप से दिखाई दे रहा है।"}
616
- prob = float(probs[0]) if probs is not None else 0.0
617
- lm = landmarks[0] if landmarks is not None else None
618
- if lm is not None and len(lm) >= 2:
619
- left_eye = {"x": float(lm[0][0]), "y": float(lm[0][1])}
620
- right_eye = {"x": float(lm[1][0]), "y": float(lm[1][1])}
621
- else:
622
- left_eye = right_eye = None
623
- eye_openness_score = estimate_eye_openness_from_detection(prob)
624
- is_valid = eye_openness_score >= 0.3
625
- return {"valid": bool(is_valid), "face_detected": True, "eye_openness_score": round(eye_openness_score, 2),
626
- "message_english": "Photo looks good! Eyes are properly open." if is_valid else "Eyes appear to be closed or partially closed. Please open your eyes wide and try again.",
627
- "message_hindi": "फोटो अच्छी है! आंखें ठीक से खुली हैं।" if is_valid else "आंखें बंद या आंशिक रूप से बंद दिखाई दे रही हैं। कृपया अपनी आंखें चौड़ी खोलें और पुनः प्रयास करें。",
628
- "eye_landmarks": {"left_eye": left_eye, "right_eye": right_eye}}
629
- except Exception:
630
- traceback.print_exc()
631
- raise HTTPException(status_code=500, detail="Face detector failed during inference.")
632
-
633
- if not isinstance(mtcnn, dict) and _MTCNN_IMPL == "mtcnn":
634
- try:
635
- detections = mtcnn.detect_faces(img_arr)
636
- except Exception:
637
- detections = mtcnn.detect_faces(pil_img)
638
- if not detections:
639
- return {"valid": False, "face_detected": False, "eye_openness_score": 0.0,
640
- "message_english": "No face detected. Please ensure your face is clearly visible in the frame.",
641
- "message_hindi": "कोई चेहरा नहीं मिला। कृपया सुनिश्चित करें कि आपका चेहरा फ्रेम में स्पष्ट रूप से दिखाई दे रहा है।"}
642
- face = detections[0]
643
- keypoints = face.get("keypoints", {})
644
- left_eye = keypoints.get("left_eye")
645
- right_eye = keypoints.get("right_eye")
646
- confidence = float(face.get("confidence", 0.0))
647
- eye_openness_score = estimate_eye_openness_from_detection(confidence)
648
- is_valid = eye_openness_score >= 0.3
649
- return {"valid": bool(is_valid), "face_detected": True, "eye_openness_score": round(eye_openness_score, 2),
650
- "message_english": "Photo looks good! Eyes are properly open." if is_valid else "Eyes appear to be closed or partially closed. Please open your eyes wide and try again.",
651
- "message_hindi": "फोटो अच्छी है! आंखें ठीक से खुली हैं।" if is_valid else "आंखें बंद या आंशिक रूप से बंद दिखाई दे रही हैं। कृपया अपनी आंखें चौड़ी खोलें और पुनः प्रयास करें。",
652
- "eye_landmarks": {"left_eye": left_eye, "right_eye": right_eye}}
653
-
654
- if isinstance(mtcnn, dict) and mtcnn.get("impl") == "opencv":
655
- try:
656
- gray = cv2.cvtColor(img_arr, cv2.COLOR_RGB2GRAY)
657
- face_cascade = mtcnn["face_cascade"]
658
- eye_cascade = mtcnn["eye_cascade"]
659
- faces = face_cascade.detectMultiScale(gray, scaleFactor=1.1, minNeighbors=4, minSize=(60, 60))
660
- if len(faces) == 0:
661
- return {"valid": False, "face_detected": False, "eye_openness_score": 0.0,
662
- "message_english": "No face detected. Please ensure your face is clearly visible in the frame.",
663
- "message_hindi": "कोई चेहरा नहीं मिला। कृपया सुनिश्चित करें कि आपका चेहरा फ्रेम में स्पष्ट रूप से दिखाई दे रहा है।"}
664
- (x, y, w, h) = faces[0]
665
- roi_gray = gray[y:y+h, x:x+w]
666
- eyes = eye_cascade.detectMultiScale(roi_gray, scaleFactor=1.1, minNeighbors=5, minSize=(20, 10))
667
- eye_openness_score = 1.0 if len(eyes) >= 1 else 0.0
668
- is_valid = eye_openness_score >= 0.3
669
- left_eye = None
670
- right_eye = None
671
- if len(eyes) >= 1:
672
- ex, ey, ew, eh = eyes[0]
673
- cx = float(x + ex + ew/2)
674
- cy = float(y + ey + eh/2)
675
- left_eye = {"x": cx, "y": cy}
676
- return {"valid": bool(is_valid), "face_detected": True, "eye_openness_score": round(eye_openness_score, 2),
677
- "message_english": "Photo looks good! Eyes are detected." if is_valid else "Eyes not detected. Please open your eyes wide and try again.",
678
- "message_hindi": "फोटो अच्छी है! आंखें मिलीं।" if is_valid else "आंखें नहीं मिलीं। कृपया अपनी आंखें चौड़ी खोलें और पुनः प्रयास करें。",
679
- "eye_landmarks": {"left_eye": left_eye, "right_eye": right_eye}}
680
- except Exception:
681
- traceback.print_exc()
682
- raise HTTPException(status_code=500, detail="OpenCV fallback detector failed.")
683
-
684
- raise HTTPException(status_code=500, detail="Invalid detector configuration.")
685
- except HTTPException:
686
- raise
687
- except Exception as e:
688
- traceback.print_exc()
689
- return {"valid": False, "face_detected": False, "eye_openness_score": 0.0,
690
- "message_english": "Error processing image. Please try again.",
691
- "message_hindi": "छवि प्रोसेस करने में त्रुटि। कृपया पुनः प्रयास करें।",
692
- "error": str(e)}
693
-
694
- @app.post("/api/v1/upload")
695
- async def upload_images(
696
- background_tasks: BackgroundTasks,
697
- face_image: UploadFile = File(...),
698
- eye_image: UploadFile = File(...)
699
- ):
700
- """
701
- Save images and enqueue background processing. VLM -> LLM runs inside process_screening.
702
- """
703
- try:
704
- screening_id = str(uuid.uuid4())
705
- now = datetime.utcnow().isoformat() + "Z"
706
- tmp_dir = "/tmp/elderly_healthwatch"
707
- os.makedirs(tmp_dir, exist_ok=True)
708
- face_path = os.path.join(tmp_dir, f"{screening_id}_face.jpg")
709
- eye_path = os.path.join(tmp_dir, f"{screening_id}_eye.jpg")
710
- face_bytes = await face_image.read()
711
- eye_bytes = await eye_image.read()
712
- with open(face_path, "wb") as f:
713
- f.write(face_bytes)
714
- with open(eye_path, "wb") as f:
715
- f.write(eye_bytes)
716
- screenings_db[screening_id] = {
717
- "id": screening_id,
718
- "timestamp": now,
719
- "face_image_path": face_path,
720
- "eye_image_path": eye_path,
721
- "status": "queued",
722
- "quality_metrics": {},
723
- "ai_results": {},
724
- "disease_predictions": [],
725
- "recommendations": {}
726
- }
727
- background_tasks.add_task(process_screening, screening_id)
728
- return {"screening_id": screening_id}
729
- except Exception as e:
730
- traceback.print_exc()
731
- raise HTTPException(status_code=500, detail=f"Failed to upload images: {e}")
732
-
733
- @app.post("/api/v1/analyze/{screening_id}")
734
- async def analyze_screening(screening_id: str, background_tasks: BackgroundTasks):
735
- if screening_id not in screenings_db:
736
- raise HTTPException(status_code=404, detail="Screening not found")
737
- if screenings_db[screening_id].get("status") == "processing":
738
- return {"message": "Already processing"}
739
- screenings_db[screening_id]["status"] = "queued"
740
- background_tasks.add_task(process_screening, screening_id)
741
- return {"message": "Analysis enqueued"}
742
-
743
- @app.get("/api/v1/status/{screening_id}")
744
- async def get_status(screening_id: str):
745
- if screening_id not in screenings_db:
746
- raise HTTPException(status_code=404, detail="Screening not found")
747
- status = screenings_db[screening_id].get("status", "unknown")
748
- progress = 50 if status == "processing" else (100 if status == "completed" else 0)
749
- return {"screening_id": screening_id, "status": status, "progress": progress}
750
-
751
- @app.get("/api/v1/results/{screening_id}")
752
- async def get_results(screening_id: str):
753
- if screening_id not in screenings_db:
754
- raise HTTPException(status_code=404, detail="Screening not found")
755
- # Ensure vlm_raw is always present in ai_results for debugging
756
- entry = screenings_db[screening_id]
757
- entry.setdefault("ai_results", {})
758
- entry["ai_results"].setdefault("vlm_raw", entry.get("ai_results", {}).get("vlm_raw", ""))
759
- return entry
760
-
761
- @app.get("/api/v1/history/{user_id}")
762
- async def get_history(user_id: str):
763
- history = [s for s in screenings_db.values() if s.get("user_id") == user_id]
764
- return {"screenings": history}
765
-
766
- # -----------------------
767
- # Immediate VLM -> LLM routes (return vitals in one call)
768
- # -----------------------
769
- @app.post("/api/v1/get-vitals")
770
- async def get_vitals_from_upload(
771
- face_image: UploadFile = File(...),
772
- eye_image: UploadFile = File(...)
773
- ):
774
- """
775
- Run VLM -> LLM pipeline synchronously (but off the event loop) and return:
776
- { vlm_parsed_features, vlm_raw_output, llm_structured_risk }
777
- Note: VLM will receive only the face image (not the eye image).
778
- """
779
- if not GRADIO_AVAILABLE:
780
- raise HTTPException(status_code=500, detail="VLM/LLM client not available in this deployment.")
781
-
782
- # save files to a temp directory
783
- try:
784
- tmp_dir = "/tmp/elderly_healthwatch"
785
- os.makedirs(tmp_dir, exist_ok=True)
786
- uid = str(uuid.uuid4())
787
- face_path = os.path.join(tmp_dir, f"{uid}_face.jpg")
788
- eye_path = os.path.join(tmp_dir, f"{uid}_eye.jpg")
789
- face_bytes = await face_image.read()
790
- eye_bytes = await eye_image.read()
791
- with open(face_path, "wb") as f:
792
- f.write(face_bytes)
793
- with open(eye_path, "wb") as f:
794
- f.write(eye_bytes)
795
- except Exception as e:
796
- logger.exception("Failed saving uploaded images")
797
- raise HTTPException(status_code=500, detail=f"Failed saving images: {e}")
798
-
799
- try:
800
- # Run VLM (off the event loop) - returns (features, raw, meta)
801
- vlm_features, vlm_raw, vlm_meta = await asyncio.to_thread(run_vlm_and_get_features, face_path, eye_path)
802
-
803
- # Log VLM outputs
804
- logger.info("get_vitals_from_upload - VLM raw (snippet): %s", (vlm_raw[:500] + "...") if vlm_raw else "<EMPTY>")
805
- logger.info("get_vitals_from_upload - VLM parsed features: %s", json.dumps(vlm_features, indent=2, ensure_ascii=False) if vlm_features else "None")
806
- logger.info("get_vitals_from_upload - VLM meta: %s", json.dumps(vlm_meta, ensure_ascii=False))
807
-
808
- # Decide what to feed to LLM: prefer cleaned JSON if available, else raw VLM string
809
- if vlm_features:
810
- llm_input = json.dumps(vlm_features, ensure_ascii=False)
811
- logger.info("Feeding CLEANED VLM JSON to LLM (len=%d).", len(llm_input))
812
- else:
813
- llm_input = vlm_raw if vlm_raw and vlm_raw.strip() else "{}"
814
- logger.info("Feeding RAW VLM STRING to LLM (len=%d).", len(llm_input))
815
-
816
- # Run LLM (off the event loop)
817
- structured_risk = await asyncio.to_thread(run_llm_on_vlm, llm_input)
818
-
819
- # Return merged result (includes raw VLM output + meta for debugging)
820
- return {
821
- "vlm_raw_output": vlm_raw,
822
- "vlm_parsed_features": vlm_features,
823
- "vlm_meta": vlm_meta,
824
- "llm_structured_risk": structured_risk
825
- }
826
- except Exception as e:
827
- logger.exception("get_vitals_from_upload pipeline failed")
828
- raise HTTPException(status_code=500, detail=f"Pipeline failed: {e}")
829
-
830
- @app.post("/api/v1/get-vitals/{screening_id}")
831
- async def get_vitals_for_screening(screening_id: str):
832
- """
833
- Re-run VLM->LLM on images already stored for `screening_id` in screenings_db.
834
- Useful for re-processing or debugging.
835
- Note: VLM will receive only the face image (not the eye image).
836
- """
837
- if screening_id not in screenings_db:
838
- raise HTTPException(status_code=404, detail="Screening not found")
839
-
840
- entry = screenings_db[screening_id]
841
- face_path = entry.get("face_image_path")
842
- eye_path = entry.get("eye_image_path")
843
- if not (face_path and os.path.exists(face_path) and eye_path and os.path.exists(eye_path)):
844
- raise HTTPException(status_code=400, detail="Stored images missing for this screening")
845
-
846
- try:
847
- # Run VLM off the event loop (returns features, raw, meta)
848
- vlm_features, vlm_raw, vlm_meta = await asyncio.to_thread(run_vlm_and_get_features, face_path, eye_path)
849
-
850
- logger.info("get_vitals_for_screening(%s) - VLM raw (snippet): %s", screening_id, (vlm_raw[:500] + "...") if vlm_raw else "<EMPTY>")
851
- logger.info("get_vitals_for_screening(%s) - VLM parsed features: %s", screening_id, json.dumps(vlm_features, indent=2, ensure_ascii=False) if vlm_features else "None")
852
- logger.info("get_vitals_for_screening(%s) - VLM meta: %s", screening_id, json.dumps(vlm_meta, ensure_ascii=False))
853
-
854
- if vlm_features:
855
- llm_input = json.dumps(vlm_features, ensure_ascii=False)
856
- logger.info("Feeding CLEANED VLM JSON to LLM (len=%d).", len(llm_input))
857
- else:
858
- llm_input = vlm_raw if vlm_raw and vlm_raw.strip() else "{}"
859
- logger.info("Feeding RAW VLM STRING to LLM (len=%d).", len(llm_input))
860
-
861
- structured_risk = await asyncio.to_thread(run_llm_on_vlm, llm_input)
862
-
863
- # Optionally store this run's outputs back into the DB for inspection
864
- entry.setdefault("ai_results", {})
865
- entry["ai_results"].update({
866
- "vlm_parsed_features": vlm_features,
867
- "vlm_raw": vlm_raw,
868
- "vlm_meta": vlm_meta,
869
- "structured_risk": structured_risk,
870
- "last_vitals_run": datetime.utcnow().isoformat() + "Z"
871
- })
872
-
873
- return {
874
- "screening_id": screening_id,
875
- "vlm_raw_output": vlm_raw,
876
- "vlm_parsed_features": vlm_features,
877
- "vlm_meta": vlm_meta,
878
- "llm_structured_risk": structured_risk
879
- }
880
- except Exception as e:
881
- logger.exception("get_vitals_for_screening pipeline failed")
882
- raise HTTPException(status_code=500, detail=f"Pipeline failed: {e}")
883
-
884
- # -----------------------
885
- # URL-based vitals endpoint (optional)
886
- # -----------------------
887
- class ImageUrls(BaseModel):
888
- face_image_url: HttpUrl
889
- eye_image_url: HttpUrl
890
-
891
- import httpx # make sure to add httpx to requirements
892
-
893
- # helper: download URL to file with safety checks
894
- async def download_image_to_path(url: str, dest_path: str, max_bytes: int = 5_000_000, timeout_seconds: int = 10) -> None:
895
- """
896
- Download an image from `url` and save to dest_path.
897
- Guards:
898
- - timeout
899
- - max bytes
900
- - basic content-type check (image/*)
901
- Raises HTTPException on failure.
902
- """
903
- try:
904
- async with httpx.AsyncClient(timeout=timeout_seconds, follow_redirects=True) as client:
905
- resp = await client.get(url, timeout=timeout_seconds)
906
- resp.raise_for_status()
907
-
908
- content_type = resp.headers.get("Content-Type", "")
909
- if not content_type.startswith("image/"):
910
- raise ValueError(f"URL does not appear to be an image (Content-Type={content_type})")
911
-
912
- total = 0
913
- with open(dest_path, "wb") as f:
914
- async for chunk in resp.aiter_bytes():
915
- if not chunk:
916
- continue
917
- total += len(chunk)
918
- if total > max_bytes:
919
- raise ValueError(f"Image exceeds max allowed size ({max_bytes} bytes)")
920
- f.write(chunk)
921
- except httpx.HTTPStatusError as e:
922
- raise HTTPException(status_code=400, detail=f"Failed to fetch image: {e.response.status_code} {str(e)}")
923
- except Exception as e:
924
- raise HTTPException(status_code=400, detail=f"Failed to download image: {str(e)}")
925
-
926
- @app.post("/api/v1/get-vitals-by-url")
927
- async def get_vitals_from_urls(payload: ImageUrls = Body(...)):
928
- """
929
- Download face and eye images from given URLs, then run the same VLM -> LLM pipeline and return results.
930
- Note: VLM will receive only the face image (not the eye image).
931
- Body: { "face_image_url": "...", "eye_image_url": "..." }
932
- """
933
- if not GRADIO_AVAILABLE:
934
- raise HTTPException(status_code=500, detail="VLM/LLM client not available in this deployment.")
935
-
936
- # prepare tmp paths
937
- try:
938
- tmp_dir = "/tmp/elderly_healthwatch"
939
- os.makedirs(tmp_dir, exist_ok=True)
940
- uid = str(uuid.uuid4())
941
- face_path = os.path.join(tmp_dir, f"{uid}_face.jpg")
942
- eye_path = os.path.join(tmp_dir, f"{uid}_eye.jpg")
943
- except Exception as e:
944
- logger.exception("Failed to prepare temp paths")
945
- raise HTTPException(status_code=500, detail=f"Server error preparing temp files: {e}")
946
-
947
- # download images (with guards)
948
- try:
949
- await download_image_to_path(str(payload.face_image_url), face_path)
950
- await download_image_to_path(str(payload.eye_image_url), eye_path)
951
- except HTTPException:
952
- raise
953
- except Exception as e:
954
- logger.exception("Downloading images failed")
955
- raise HTTPException(status_code=400, detail=f"Failed to download images: {e}")
956
-
957
- # run existing pipeline (off the event loop)
958
- try:
959
- vlm_features, vlm_raw, vlm_meta = await asyncio.to_thread(run_vlm_and_get_features, face_path, eye_path)
960
-
961
- logger.info("get_vitals_from_urls - VLM raw (snippet): %s", (vlm_raw[:500] + "...") if vlm_raw else "<EMPTY>")
962
- logger.info("get_vitals_from_urls - VLM parsed features: %s", json.dumps(vlm_features, indent=2, ensure_ascii=False) if vlm_features else "None")
963
- logger.info("get_vitals_from_urls - VLM meta: %s", json.dumps(vlm_meta, ensure_ascii=False))
964
-
965
- if vlm_features:
966
- llm_input = json.dumps(vlm_features, ensure_ascii=False)
967
- logger.info("Feeding CLEANED VLM JSON to LLM (len=%d).", len(llm_input))
968
- else:
969
- llm_input = vlm_raw if vlm_raw and vlm_raw.strip() else "{}"
970
- logger.info("Feeding RAW VLM STRING to LLM (len=%d).", len(llm_input))
971
-
972
- structured_risk = await asyncio.to_thread(run_llm_on_vlm, llm_input)
973
-
974
- return {
975
- "vlm_raw_output": vlm_raw,
976
- "vlm_parsed_features": vlm_features,
977
- "vlm_meta": vlm_meta,
978
- "llm_structured_risk": structured_risk
979
- }
980
- except Exception as e:
981
- logger.exception("get_vitals_by_url pipeline failed")
982
- raise HTTPException(status_code=500, detail=f"Pipeline failed: {e}")
983
-
984
- # -----------------------
985
- # Main background pipeline (upload -> process_screening)
986
- # -----------------------
987
- async def process_screening(screening_id: str):
988
- """
989
- Main pipeline:
990
- - load images
991
- - quick detector-based quality metrics
992
- - run VLM -> vlm_features (dict or None) + vlm_raw (string) + vlm_meta
993
- - run LLM on vlm_features (preferred) or vlm_raw -> structured risk JSON
994
- - merge results into ai_results and finish
995
- """
996
- try:
997
- if screening_id not in screenings_db:
998
- logger.error("[process_screening] screening %s not found", screening_id)
999
- return
1000
- screenings_db[screening_id]["status"] = "processing"
1001
- logger.info("[process_screening] Starting %s", screening_id)
1002
-
1003
- entry = screenings_db[screening_id]
1004
- face_path = entry.get("face_image_path")
1005
- eye_path = entry.get("eye_image_path")
1006
-
1007
- if not (face_path and os.path.exists(face_path)):
1008
- raise RuntimeError("Face image missing")
1009
- if not (eye_path and os.path.exists(eye_path)):
1010
- raise RuntimeError("Eye image missing")
1011
-
1012
- face_img = Image.open(face_path).convert("RGB")
1013
- eye_img = Image.open(eye_path).convert("RGB")
1014
-
1015
- # Basic detection + quality metrics (facenet/mtcnn/opencv)
1016
- face_detected = False
1017
- face_confidence = 0.0
1018
- left_eye_coord = right_eye_coord = None
1019
-
1020
- if mtcnn is not None and not isinstance(mtcnn, dict) and (_MTCNN_IMPL == "facenet_pytorch" or _MTCNN_IMPL == "mtcnn"):
1021
- try:
1022
- if _MTCNN_IMPL == "facenet_pytorch":
1023
- boxes, probs, landmarks = mtcnn.detect(face_img, landmarks=True)
1024
- if boxes is not None and len(boxes) > 0:
1025
- face_detected = True
1026
- face_confidence = float(probs[0]) if probs is not None else 0.0
1027
- if landmarks is not None:
1028
- lm = landmarks[0]
1029
- if len(lm) >= 2:
1030
- left_eye_coord = {"x": float(lm[0][0]), "y": float(lm[0][1])}
1031
- right_eye_coord = {"x": float(lm[1][0]), "y": float(lm[1][1])}
1032
- else:
1033
- arr = np.asarray(face_img)
1034
- detections = mtcnn.detect_faces(arr)
1035
- if detections:
1036
- face_detected = True
1037
- face_confidence = float(detections[0].get("confidence", 0.0))
1038
- k = detections[0].get("keypoints", {})
1039
- left_eye_coord = k.get("left_eye")
1040
- right_eye_coord = k.get("right_eye")
1041
- except Exception:
1042
- traceback.print_exc()
1043
-
1044
- if isinstance(mtcnn, dict) and mtcnn.get("impl") == "opencv":
1045
- try:
1046
- arr = np.asarray(face_img)
1047
- gray = cv2.cvtColor(arr, cv2.COLOR_RGB2GRAY)
1048
- face_cascade = mtcnn["face_cascade"]
1049
- eye_cascade = mtcnn["eye_cascade"]
1050
- faces = face_cascade.detectMultiScale(gray, scaleFactor=1.1, minNeighbors=4, minSize=(60, 60))
1051
- if len(faces) > 0:
1052
- face_detected = True
1053
- (x, y, w, h) = faces[0]
1054
- face_confidence = min(1.0, (w*h) / (arr.shape[0]*arr.shape[1]) * 4.0)
1055
- roi_gray = gray[y:y+h, x:x+w]
1056
- eyes = eye_cascade.detectMultiScale(roi_gray, scaleFactor=1.1, minNeighbors=5, minSize=(20, 10))
1057
- if len(eyes) >= 1:
1058
- ex, ey, ew, eh = eyes[0]
1059
- left_eye_coord = {"x": float(x + ex + ew/2), "y": float(y + ey + eh/2)}
1060
- except Exception:
1061
- traceback.print_exc()
1062
-
1063
- face_quality_score = 0.85 if face_detected and face_confidence > 0.6 else 0.45
1064
- quality_metrics = {
1065
- "face_detected": face_detected,
1066
- "face_confidence": round(face_confidence, 3),
1067
- "face_quality_score": round(face_quality_score, 2),
1068
- "eye_coords": {"left_eye": left_eye_coord, "right_eye": right_eye_coord},
1069
- "face_brightness": int(np.mean(np.asarray(face_img.convert("L")))),
1070
- "face_blur_estimate": int(np.var(np.asarray(face_img.convert("L"))))
1071
- }
1072
- screenings_db[screening_id]["quality_metrics"] = quality_metrics
1073
-
1074
- # --------------------------
1075
- # RUN VLM -> get vlm_features + vlm_raw + vlm_meta
1076
- # --------------------------
1077
- vlm_features = None
1078
- vlm_raw = None
1079
- vlm_meta = {}
1080
- try:
1081
- vlm_features, vlm_raw, vlm_meta = run_vlm_and_get_features(face_path, eye_path)
1082
- screenings_db[screening_id].setdefault("ai_results", {})
1083
- screenings_db[screening_id]["ai_results"].update({
1084
- "vlm_parsed_features": vlm_features,
1085
- "vlm_raw": vlm_raw,
1086
- "vlm_meta": vlm_meta
1087
- })
1088
- except Exception as e:
1089
- logger.exception("VLM feature extraction failed")
1090
- screenings_db[screening_id].setdefault("ai_results", {})
1091
- screenings_db[screening_id]["ai_results"].update({"vlm_error": str(e)})
1092
- vlm_features = None
1093
- vlm_raw = ""
1094
- vlm_meta = {"error": str(e)}
1095
-
1096
- # Log VLM outputs in pipeline context
1097
- logger.info("process_screening(%s) - VLM raw (snippet): %s", screening_id, (vlm_raw[:500] + "...") if vlm_raw else "<EMPTY>")
1098
- logger.info("process_screening(%s) - VLM parsed features: %s", screening_id, json.dumps(vlm_features, indent=2, ensure_ascii=False) if vlm_features else "None")
1099
- logger.info("process_screening(%s) - VLM meta: %s", screening_id, json.dumps(vlm_meta, ensure_ascii=False))
1100
-
1101
- # --------------------------
1102
- # RUN LLM on vlm_parsed (preferred) or vlm_raw -> structured risk JSON
1103
- # --------------------------
1104
- structured_risk = None
1105
- try:
1106
- if vlm_features:
1107
- # prefer cleaned JSON
1108
- llm_input = json.dumps(vlm_features, ensure_ascii=False)
1109
- else:
1110
- # fallback to raw string (may be empty)
1111
- llm_input = vlm_raw if vlm_raw and vlm_raw.strip() else "{}"
1112
-
1113
- structured_risk = run_llm_on_vlm(llm_input)
1114
- screenings_db[screening_id].setdefault("ai_results", {})
1115
- screenings_db[screening_id]["ai_results"].update({"structured_risk": structured_risk})
1116
- except Exception as e:
1117
- logger.exception("LLM processing failed")
1118
- screenings_db[screening_id].setdefault("ai_results", {})
1119
- screenings_db[screening_id]["ai_results"].update({"llm_error": str(e)})
1120
- structured_risk = {
1121
- "risk_score": 0.0,
1122
- "jaundice_probability": 0.0,
1123
- "anemia_probability": 0.0,
1124
- "hydration_issue_probability": 0.0,
1125
- "neurological_issue_probability": 0.0,
1126
- "summary": "",
1127
- "recommendation": "",
1128
- "confidence": 0.0
1129
- }
1130
-
1131
- # Use structured_risk for summary recommendations & simple disease inference placeholders
1132
- screenings_db[screening_id].setdefault("ai_results", {})
1133
- screenings_db[screening_id]["ai_results"].update({
1134
- "processing_time_ms": 1200
1135
- })
1136
-
1137
- disease_predictions = [
1138
- {
1139
- "condition": "Anemia-like-signs",
1140
- "risk_level": "Medium" if structured_risk.get("anemia_probability", 0.0) > 0.5 else "Low",
1141
- "probability": structured_risk.get("anemia_probability", 0.0),
1142
- "confidence": structured_risk.get("confidence", 0.0)
1143
- },
1144
- {
1145
- "condition": "Jaundice-like-signs",
1146
- "risk_level": "Medium" if structured_risk.get("jaundice_probability", 0.0) > 0.5 else "Low",
1147
- "probability": structured_risk.get("jaundice_probability", 0.0),
1148
- "confidence": structured_risk.get("confidence", 0.0)
1149
- }
1150
- ]
1151
-
1152
- recommendations = {
1153
- "action_needed": "consult" if structured_risk.get("risk_score", 0.0) > 30.0 else "monitor",
1154
- "message_english": structured_risk.get("recommendation", "") or f"Please follow up with a health professional if concerns persist.",
1155
- "message_hindi": ""
1156
- }
1157
-
1158
- screenings_db[screening_id].update({
1159
- "status": "completed",
1160
- "disease_predictions": disease_predictions,
1161
- "recommendations": recommendations
1162
- })
1163
-
1164
- logger.info("[process_screening] Completed %s", screening_id)
1165
- except Exception as e:
1166
- traceback.print_exc()
1167
- if screening_id in screenings_db:
1168
- screenings_db[screening_id]["status"] = "failed"
1169
- screenings_db[screening_id]["error"] = str(e)
1170
- else:
1171
- logger.error("[process_screening] Failed for unknown screening %s: %s", screening_id, str(e))
1172
-
1173
# -----------------------
# Run server (for local debugging)
# -----------------------
if __name__ == "__main__":
    import uvicorn
    # Bind on all interfaces; 7860 is the conventional Hugging Face Spaces port.
    # reload=False: this entry point is for plain local runs, not dev hot-reload.
    uvicorn.run("app:app", host="0.0.0.0", port=7860, reload=False)
 
 
1
  """
2
  Elderly HealthWatch AI Backend (FastAPI)
3
  Pipeline:
 
14
  * always returns raw VLM output in API responses,
15
  * extracts JSON from VLM via regex when possible, and
16
  * sends only the face image to the VLM (not the eye image).
17
+ * uploads face image to temp hosting and uses URL instead of file path
18
  """
19
 
20
  import io
 
51
  GRADIO_VLM_SPACE = os.getenv("GRADIO_SPACE", "developer0hye/Qwen3-VL-8B-Instruct")
52
  LLM_GRADIO_SPACE = os.getenv("LLM_GRADIO_SPACE", "Tonic/med-gpt-oss-20b-demo")
53
  HF_TOKEN = os.getenv("HF_TOKEN", None)
54
USE_IMAGE_URLS = True  # Always use URLs instead of files for VLM
# NOTE(review): run_vlm_and_get_features() defaults to use_url=False and this
# flag is not referenced in the visible code — confirm the caller actually
# consults USE_IMAGE_URLS, otherwise this is dead configuration.
55
 
56
  # Default VLM prompt
57
  DEFAULT_VLM_PROMPT = (
 
246
  }
247
  return out
248
 
249
+ # -----------------------
250
+ # Image upload to temp hosting
251
+ # -----------------------
252
+ import httpx # make sure to add httpx to requirements
253
+ import base64
254
+
255
# helper: upload image to temporary hosting and get URL
async def upload_image_to_temp_host(image_path: str) -> str:
    """
    Upload an image to a temporary hosting service (tmpfiles.org, ~24h retention).

    Args:
        image_path: Local filesystem path of the image to upload.

    Returns:
        Public direct-download URL of the uploaded image.

    Raises:
        HTTPException: status 500 if the upload fails for any reason.

    Alternative services: catbox.moe, 0x0.st, etc.
    """
    try:
        with open(image_path, "rb") as f:
            # Give the multipart part an explicit filename so the host keeps
            # the original extension (helps downstream content-type sniffing).
            files = {"file": (os.path.basename(image_path), f)}
            async with httpx.AsyncClient(timeout=30.0) as client:
                # tmpfiles.org: free temporary host, ~24 hour retention.
                response = await client.post("https://tmpfiles.org/api/v1/upload", files=files)
                response.raise_for_status()
                result = response.json()

        # tmpfiles.org returns: {"status": "success", "data": {"url": "..."}}
        if result.get("status") == "success":
            url = result["data"]["url"]
            # Convert the landing-page URL to a direct-download URL.
            # Replace only the FIRST occurrence: a filename/path segment that
            # happens to contain "tmpfiles.org/" must not be rewritten too.
            url = url.replace("tmpfiles.org/", "tmpfiles.org/dl/", 1)
            logger.info(f"Image uploaded successfully: {url}")
            return url
        raise ValueError(f"Upload failed: {result}")
    except Exception as e:
        logger.exception(f"Failed to upload image to temp host: {e}")
        raise HTTPException(status_code=500, detail=f"Failed to upload image: {e}")
283
+
284
# helper: download URL to file with safety checks
def _cleanup_partial_download(path: str) -> None:
    """Best-effort removal of a partially written download artifact."""
    try:
        if os.path.exists(path):
            os.remove(path)
    except OSError:
        # Cleanup is advisory only; the original error is what matters.
        pass

async def download_image_to_path(url: str, dest_path: str, max_bytes: int = 5_000_000, timeout_seconds: int = 10) -> None:
    """
    Download an image from `url` and save it to `dest_path`.

    Guards:
      - request timeout
      - maximum size, enforced WHILE streaming, so an oversized response is
        aborted mid-transfer instead of after it has been fully downloaded
      - basic Content-Type check (must be image/*)

    Raises:
        HTTPException: status 400 on any fetch/validation failure. Any
        partially written destination file is removed before raising.
    """
    try:
        async with httpx.AsyncClient(timeout=timeout_seconds, follow_redirects=True) as client:
            # client.stream() leaves the body unread until iterated, unlike
            # client.get() which buffers the whole payload first and would
            # defeat the max_bytes guard below.
            async with client.stream("GET", url) as resp:
                resp.raise_for_status()

                content_type = resp.headers.get("Content-Type", "")
                if not content_type.startswith("image/"):
                    raise ValueError(f"URL does not appear to be an image (Content-Type={content_type})")

                total = 0
                with open(dest_path, "wb") as f:
                    async for chunk in resp.aiter_bytes():
                        if not chunk:
                            continue
                        total += len(chunk)
                        if total > max_bytes:
                            raise ValueError(f"Image exceeds max allowed size ({max_bytes} bytes)")
                        f.write(chunk)
    except httpx.HTTPStatusError as e:
        _cleanup_partial_download(dest_path)
        raise HTTPException(status_code=400, detail=f"Failed to fetch image: {e.response.status_code} {str(e)}")
    except Exception as e:
        _cleanup_partial_download(dest_path)
        raise HTTPException(status_code=400, detail=f"Failed to download image: {str(e)}")
316
+
317
  # -----------------------
318
  # Gradio / VLM helper (sends only face image, returns meta)
319
  # -----------------------
 
325
  return Client(space)
326
 
327
  def run_vlm_and_get_features(face_path: str, eye_path: Optional[str] = None, prompt: Optional[str] = None,
328
+ raise_on_file_delivery_failure: bool = False,
329
+ use_url: bool = False
330
  ) -> Tuple[Optional[Dict[str, Any]], str, Dict[str, Any]]:
331
  """
332
+ Synchronous call to remote VLM (gradio /chat_fn). Sends ONLY the face image.
333
+ If use_url=True, uploads image to temp host and sends URL instead of file path.
334
  Returns tuple: (parsed_features_dict_or_None, raw_text_response_str, meta)
335
  meta includes:
336
  - vlm_file_delivery_ok (bool) # expects ≥1 file acknowledged (face)
337
  - vlm_files_seen (int or None)
338
  - vlm_raw_len (int)
339
  - vlm_out_object (short repr)
340
+ - face_url (str, if use_url=True)
341
  """
342
  prompt = prompt or DEFAULT_VLM_PROMPT
343
 
344
 
345
  if not os.path.exists(face_path):
346
  raise FileNotFoundError(f"Face image not found at: {face_path}")
347
+ if eye_path and not os.path.exists(eye_path):
348
  raise FileNotFoundError(f"Eye image not found at: {eye_path}")
349
 
350
  face_size = os.path.getsize(face_path)
351
+ logger.info(f"VLM input file - Face: {face_size} bytes")
 
352
 
353
+ if face_size == 0:
354
+ raise ValueError("Face image is empty (0 bytes)")
355
 
356
  if not GRADIO_AVAILABLE:
357
  raise RuntimeError("gradio_client not available in this environment.")
358
 
359
+ # Verify file can be opened as image
 
 
360
  try:
361
  Image.open(face_path).verify()
362
+ logger.info("Face image verified as valid")
 
363
  except Exception as e:
364
+ raise ValueError(f"Invalid image file: {e}")
365
 
 
 
 
366
  client = get_gradio_client_for_space(GRADIO_VLM_SPACE)
367
+
368
+ meta: Dict[str, Any] = {
369
+ "vlm_file_delivery_ok": False,
370
+ "vlm_files_seen": None,
371
+ "vlm_raw_len": 0,
372
+ "vlm_out_object": None
373
+ }
374
 
375
+ # Upload to temp host if use_url=True
376
+ if use_url:
377
+ try:
378
+ # Run async upload in sync context using asyncio
379
+ loop = asyncio.new_event_loop()
380
+ asyncio.set_event_loop(loop)
381
+ face_url = loop.run_until_complete(upload_image_to_temp_host(face_path))
382
+ loop.close()
383
+
384
+ meta["face_url"] = face_url
385
+ logger.info(f"Using image URL for VLM: {face_url}")
386
+
387
+ # Pass URL directly to Gradio client using handle_file
388
+ message = {"text": prompt, "files": [handle_file(face_url)]}
389
+ except Exception as e:
390
+ logger.exception("Failed to upload image to temp host")
391
+ raise RuntimeError(f"Image upload failed: {e}")
392
+ else:
393
+ # Original behavior: use file path
394
+ message = {"text": prompt, "files": [handle_file(face_path)]}
395
 
396
  # SINGLE CALL (no retries)
397
  try:
398
+ logger.info("Calling VLM Space %s with %s", GRADIO_VLM_SPACE, "URL" if use_url else "file")
399
  result = client.predict(message=message, history=[], api_name="/chat_fn")
400
  except Exception as e:
401
  logger.exception("VLM call failed (no retries)")
 
495
  Call the remote LLM Space's /chat endpoint with defensive input handling and a single retry.
496
  - Logs the VLM raw string and the chosen payload.
497
  - Sends cleaned JSON (json.dumps(vlm_features)) if vlm_features_or_raw is dict, else sends raw string.
498
+ - Uses regex to extract the final JSON from