Spaces:

Stroke-ia
/

API

Sleeping

API

File size: 8,389 Bytes

f9414c6

from fastapi import FastAPI, UploadFile, File, HTTPException, Security, Depends
from fastapi.security.api_key import APIKeyHeader
from fastapi.responses import JSONResponse, StreamingResponse
import uvicorn
import logging
import io
import os
from typing import Tuple, Optional

import numpy as np
from PIL import Image
import cv2

# ML
from ultralytics import YOLO
import mediapipe as mp

# ==========================
# 🔑 Sécurité : API Key
# ==========================
API_KEY = "1234"  # ⚠️ change avant de partager
api_key_header = APIKeyHeader(name="X-API-Key")

def verify_api_key(api_key: str = Security(api_key_header)):
    if api_key != API_KEY:
        raise HTTPException(status_code=403, detail="Forbidden")
    return api_key

# ==========================
# 📝 Logger
# ==========================
logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s - %(levelname)s - %(message)s"
)
logger = logging.getLogger("stroke-api")

# ==========================
# 🚀 App
# ==========================
app = FastAPI(
    title="Stroke Detection API",
    version="1.2.0",
    description="""
    🚑 Stroke Detection API using YOLOv8 + Face Detection (MediaPipe)

    ⚠️ **Disclaimer**: Research/demo only — not a medical device.
    """
)

# ==========================
# 📦 Chargement modèles
# ==========================
try:
    model = YOLO("best.pt")
    logger.info("✅ YOLO model loaded.")
except Exception as e:
    logger.exception("❌ Failed to load YOLO model")
    raise RuntimeError(f"Model loading failed: {e}")

mp_face_detection = mp.solutions.face_detection

# ==========================
# 🔧 Utilitaires
# ==========================
ALLOWED_EXT = (".png", ".jpg", ".jpeg")
ALLOWED_MIME = {"image/png", "image/jpeg"}
MAX_BYTES = 8 * 1024 * 1024  # 8 MB
CROP_ON_FACE = True          # recadrer sur le visage détecté

def _validate_file(file: UploadFile, raw: bytes):
    # extension
    if not file.filename.lower().endswith(ALLOWED_EXT):
        raise HTTPException(status_code=400, detail="Invalid file extension. Use .png/.jpg/.jpeg")
    # MIME
    if (file.content_type or "").lower() not in ALLOWED_MIME:
        # On continue si extension OK mais content_type vide côté client
        if file.content_type:
            raise HTTPException(status_code=400, detail="Invalid content-type. Use image/png or image/jpeg")
    # taille
    if len(raw) > MAX_BYTES:
        raise HTTPException(status_code=413, detail=f"Image too large. Max {MAX_BYTES//(1024*1024)} MB")

def _read_image_to_numpy(raw: bytes) -> np.ndarray:
    try:
        img = Image.open(io.BytesIO(raw)).convert("RGB")
        return np.array(img)
    except Exception:
        raise HTTPException(status_code=400, detail="Unreadable image file")

def _largest_face_bbox(np_img: np.ndarray, min_conf: float = 0.6) -> Optional[Tuple[int,int,int,int]]:
    """
    Retourne (x1,y1,x2,y2) du plus grand visage détecté, ou None.
    """
    h, w = np_img.shape[:2]
    with mp_face_detection.FaceDetection(min_detection_confidence=min_conf) as fd:
        results = fd.process(cv2.cvtColor(np_img, cv2.COLOR_RGB2BGR))
        if not results.detections:
            return None
        boxes = []
        for det in results.detections:
            rel = det.location_data.relative_bounding_box
            x1 = int(max(0, rel.xmin) * w)
            y1 = int(max(0, rel.ymin) * h)
            x2 = int(min(1.0, rel.xmin + rel.width) * w)
            y2 = int(min(1.0, rel.ymin + rel.height) * h)
            boxes.append((x1, y1, x2, y2))
        # choisir le plus grand
        boxes.sort(key=lambda b: (b[2]-b[0])*(b[3]-b[1]), reverse=True)
        return boxes[0] if boxes else None

def _crop_to_bbox(np_img: np.ndarray, bbox: Tuple[int,int,int,int], margin: float = 0.15) -> np.ndarray:
    h, w = np_img.shape[:2]
    x1, y1, x2, y2 = bbox
    bw, bh = x2 - x1, y2 - y1
    # marge autour du visage
    dx, dy = int(bw * margin), int(bh * margin)
    X1 = max(0, x1 - dx)
    Y1 = max(0, y1 - dy)
    X2 = min(w, x2 + dx)
    Y2 = min(h, y2 + dy)
    return np_img[Y1:Y2, X1:X2].copy()

def _annotate_face_box(np_img: np.ndarray, bbox: Tuple[int,int,int,int]) -> np.ndarray:
    annotated = cv2.cvtColor(np_img, cv2.COLOR_RGB2BGR).copy()
    x1, y1, x2, y2 = bbox
    cv2.rectangle(annotated, (x1, y1), (x2, y2), (0, 255, 0), 2)  # couleur par défaut
    return annotated

# ==========================
# 🩺 Healthcheck
# ==========================
@app.get("/health")
async def health():
    return {"status": "ok", "model_loaded": True}

# ==========================
# 📦 Endpoint JSON
# ==========================
@app.post("/v1/predict/")
async def predict(
    file: UploadFile = File(...),
    api_key: str = Depends(verify_api_key)
):
    raw = await file.read()
    _validate_file(file, raw)

    try:
        np_img = _read_image_to_numpy(raw)

        # 1) Détection visage obligatoire
        face_bbox = _largest_face_bbox(np_img)
        if face_bbox is None:
            return JSONResponse(
                status_code=422,
                content={"status": "error", "message": "Aucun visage humain détecté. Veuillez centrer le visage."}
            )

        # 2) Option : recadrer sur le visage pour améliorer la détection
        input_img = _crop_to_bbox(np_img, face_bbox) if CROP_ON_FACE else np_img

        # 3) YOLO inference (en mémoire)
        results = model.predict(source=input_img, verbose=False)

        output = []
        for r in results:
            for box in r.boxes:
                output.append({
                    "class": r.names[int(box.cls[0].item())],
                    "confidence": float(box.conf[0].item()),
                    "bbox": box.xyxy[0].tolist()
                })

        logger.info(f"/predict {file.filename} -> {len(output)} detections (face ok)")
        return JSONResponse(content={
            "status": "ok",
            "face_detected": True,
            "face_bbox": list(map(int, face_bbox)),
            "predictions": output
        })

    except HTTPException:
        raise
    except Exception as e:
        logger.exception("Error in /v1/predict")
        raise HTTPException(status_code=500, detail=str(e))

# ==========================
# 🖼️ Endpoint Image (annotée)
# ==========================
@app.post("/v1/predict_image/")
async def predict_image(
    file: UploadFile = File(...),
    api_key: str = Depends(verify_api_key)
):
    raw = await file.read()
    _validate_file(file, raw)

    try:
        np_img = _read_image_to_numpy(raw)

        # 1) Détection visage
        face_bbox = _largest_face_bbox(np_img)
        if face_bbox is None:
            return JSONResponse(
                status_code=422,
                content={"status": "error", "message": "Aucun visage humain détecté. Veuillez centrer le visage."}
            )

        # 2) Recadrer sur le visage (optionnel)
        input_img = _crop_to_bbox(np_img, face_bbox) if CROP_ON_FACE else np_img

        # 3) YOLO
        results = model.predict(source=input_img, verbose=False)

        # 4) Annotations YOLO
        yolo_annot = results[0].plot()  # BGR
        yolo_annot = cv2.cvtColor(yolo_annot, cv2.COLOR_BGR2RGB)

        # 5) Si on n’a pas recadré, on dessine aussi le cadre visage sur l’image d’origine
        if not CROP_ON_FACE:
            annotated = _annotate_face_box(np_img, face_bbox)
            # fusion simple : ici on retourne juste l’annot YOLO (non redimensionnée)
            out_rgb = annotated
        else:
            # On retourne l’image annotée sur le crop visage
            out_rgb = yolo_annot

        # 6) Retour en PNG (stream)
        pil_img = Image.fromarray(out_rgb)
        buf = io.BytesIO()
        pil_img.save(buf, format="PNG")
        buf.seek(0)

        logger.info(f"/predict_image {file.filename} -> face ok + image annotée")
        return StreamingResponse(buf, media_type="image/png")

    except HTTPException:
        raise
    except Exception as e:
        logger.exception("Error in /v1/predict_image")
        raise HTTPException(status_code=500, detail=str(e))

# ==========================
# 🚀 Lancement local
# ==========================
if __name__ == "__main__":
    # Sur HF Spaces, c’est Gradio/Space qui lance; localement :
    uvicorn.run(app, host="0.0.0.0", port=7860)