File size: 8,389 Bytes
f9414c6 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 |
from fastapi import FastAPI, UploadFile, File, HTTPException, Security, Depends
from fastapi.security.api_key import APIKeyHeader
from fastapi.responses import JSONResponse, StreamingResponse
import uvicorn
import logging
import io
import os
from typing import Tuple, Optional
import numpy as np
from PIL import Image
import cv2
# ML
from ultralytics import YOLO
import mediapipe as mp
# ==========================
# 🔑 Sécurité : API Key
# ==========================
API_KEY = "1234" # ⚠️ change avant de partager
api_key_header = APIKeyHeader(name="X-API-Key")
def verify_api_key(api_key: str = Security(api_key_header)):
if api_key != API_KEY:
raise HTTPException(status_code=403, detail="Forbidden")
return api_key
# ==========================
# 📝 Logger
# ==========================
logging.basicConfig(
level=logging.INFO,
format="%(asctime)s - %(levelname)s - %(message)s"
)
logger = logging.getLogger("stroke-api")
# ==========================
# 🚀 App
# ==========================
app = FastAPI(
title="Stroke Detection API",
version="1.2.0",
description="""
🚑 Stroke Detection API using YOLOv8 + Face Detection (MediaPipe)
⚠️ **Disclaimer**: Research/demo only — not a medical device.
"""
)
# ==========================
# 📦 Chargement modèles
# ==========================
try:
model = YOLO("best.pt")
logger.info("✅ YOLO model loaded.")
except Exception as e:
logger.exception("❌ Failed to load YOLO model")
raise RuntimeError(f"Model loading failed: {e}")
mp_face_detection = mp.solutions.face_detection
# ==========================
# 🔧 Utilitaires
# ==========================
ALLOWED_EXT = (".png", ".jpg", ".jpeg")
ALLOWED_MIME = {"image/png", "image/jpeg"}
MAX_BYTES = 8 * 1024 * 1024 # 8 MB
CROP_ON_FACE = True # recadrer sur le visage détecté
def _validate_file(file: UploadFile, raw: bytes):
# extension
if not file.filename.lower().endswith(ALLOWED_EXT):
raise HTTPException(status_code=400, detail="Invalid file extension. Use .png/.jpg/.jpeg")
# MIME
if (file.content_type or "").lower() not in ALLOWED_MIME:
# On continue si extension OK mais content_type vide côté client
if file.content_type:
raise HTTPException(status_code=400, detail="Invalid content-type. Use image/png or image/jpeg")
# taille
if len(raw) > MAX_BYTES:
raise HTTPException(status_code=413, detail=f"Image too large. Max {MAX_BYTES//(1024*1024)} MB")
def _read_image_to_numpy(raw: bytes) -> np.ndarray:
try:
img = Image.open(io.BytesIO(raw)).convert("RGB")
return np.array(img)
except Exception:
raise HTTPException(status_code=400, detail="Unreadable image file")
def _largest_face_bbox(np_img: np.ndarray, min_conf: float = 0.6) -> Optional[Tuple[int,int,int,int]]:
"""
Retourne (x1,y1,x2,y2) du plus grand visage détecté, ou None.
"""
h, w = np_img.shape[:2]
with mp_face_detection.FaceDetection(min_detection_confidence=min_conf) as fd:
results = fd.process(cv2.cvtColor(np_img, cv2.COLOR_RGB2BGR))
if not results.detections:
return None
boxes = []
for det in results.detections:
rel = det.location_data.relative_bounding_box
x1 = int(max(0, rel.xmin) * w)
y1 = int(max(0, rel.ymin) * h)
x2 = int(min(1.0, rel.xmin + rel.width) * w)
y2 = int(min(1.0, rel.ymin + rel.height) * h)
boxes.append((x1, y1, x2, y2))
# choisir le plus grand
boxes.sort(key=lambda b: (b[2]-b[0])*(b[3]-b[1]), reverse=True)
return boxes[0] if boxes else None
def _crop_to_bbox(np_img: np.ndarray, bbox: Tuple[int,int,int,int], margin: float = 0.15) -> np.ndarray:
h, w = np_img.shape[:2]
x1, y1, x2, y2 = bbox
bw, bh = x2 - x1, y2 - y1
# marge autour du visage
dx, dy = int(bw * margin), int(bh * margin)
X1 = max(0, x1 - dx)
Y1 = max(0, y1 - dy)
X2 = min(w, x2 + dx)
Y2 = min(h, y2 + dy)
return np_img[Y1:Y2, X1:X2].copy()
def _annotate_face_box(np_img: np.ndarray, bbox: Tuple[int,int,int,int]) -> np.ndarray:
annotated = cv2.cvtColor(np_img, cv2.COLOR_RGB2BGR).copy()
x1, y1, x2, y2 = bbox
cv2.rectangle(annotated, (x1, y1), (x2, y2), (0, 255, 0), 2) # couleur par défaut
return annotated
# ==========================
# 🩺 Healthcheck
# ==========================
@app.get("/health")
async def health():
return {"status": "ok", "model_loaded": True}
# ==========================
# 📦 Endpoint JSON
# ==========================
@app.post("/v1/predict/")
async def predict(
file: UploadFile = File(...),
api_key: str = Depends(verify_api_key)
):
raw = await file.read()
_validate_file(file, raw)
try:
np_img = _read_image_to_numpy(raw)
# 1) Détection visage obligatoire
face_bbox = _largest_face_bbox(np_img)
if face_bbox is None:
return JSONResponse(
status_code=422,
content={"status": "error", "message": "Aucun visage humain détecté. Veuillez centrer le visage."}
)
# 2) Option : recadrer sur le visage pour améliorer la détection
input_img = _crop_to_bbox(np_img, face_bbox) if CROP_ON_FACE else np_img
# 3) YOLO inference (en mémoire)
results = model.predict(source=input_img, verbose=False)
output = []
for r in results:
for box in r.boxes:
output.append({
"class": r.names[int(box.cls[0].item())],
"confidence": float(box.conf[0].item()),
"bbox": box.xyxy[0].tolist()
})
logger.info(f"/predict {file.filename} -> {len(output)} detections (face ok)")
return JSONResponse(content={
"status": "ok",
"face_detected": True,
"face_bbox": list(map(int, face_bbox)),
"predictions": output
})
except HTTPException:
raise
except Exception as e:
logger.exception("Error in /v1/predict")
raise HTTPException(status_code=500, detail=str(e))
# ==========================
# 🖼️ Endpoint Image (annotée)
# ==========================
@app.post("/v1/predict_image/")
async def predict_image(
file: UploadFile = File(...),
api_key: str = Depends(verify_api_key)
):
raw = await file.read()
_validate_file(file, raw)
try:
np_img = _read_image_to_numpy(raw)
# 1) Détection visage
face_bbox = _largest_face_bbox(np_img)
if face_bbox is None:
return JSONResponse(
status_code=422,
content={"status": "error", "message": "Aucun visage humain détecté. Veuillez centrer le visage."}
)
# 2) Recadrer sur le visage (optionnel)
input_img = _crop_to_bbox(np_img, face_bbox) if CROP_ON_FACE else np_img
# 3) YOLO
results = model.predict(source=input_img, verbose=False)
# 4) Annotations YOLO
yolo_annot = results[0].plot() # BGR
yolo_annot = cv2.cvtColor(yolo_annot, cv2.COLOR_BGR2RGB)
# 5) Si on n’a pas recadré, on dessine aussi le cadre visage sur l’image d’origine
if not CROP_ON_FACE:
annotated = _annotate_face_box(np_img, face_bbox)
# fusion simple : ici on retourne juste l’annot YOLO (non redimensionnée)
out_rgb = annotated
else:
# On retourne l’image annotée sur le crop visage
out_rgb = yolo_annot
# 6) Retour en PNG (stream)
pil_img = Image.fromarray(out_rgb)
buf = io.BytesIO()
pil_img.save(buf, format="PNG")
buf.seek(0)
logger.info(f"/predict_image {file.filename} -> face ok + image annotée")
return StreamingResponse(buf, media_type="image/png")
except HTTPException:
raise
except Exception as e:
logger.exception("Error in /v1/predict_image")
raise HTTPException(status_code=500, detail=str(e))
# ==========================
# 🚀 Lancement local
# ==========================
if __name__ == "__main__":
# Sur HF Spaces, c’est Gradio/Space qui lance; localement :
uvicorn.run(app, host="0.0.0.0", port=7860)
|