AliZak committed on
Commit
62064b6
·
verified ·
1 Parent(s): ffe6db7

Uploaded the base files

Browse files
Files changed (3) hide show
  1. Dockerfile +19 -0
  2. perception_roi_server.py +789 -0
  3. requirements.txt +5 -0
Dockerfile ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
FROM python:3.10-slim

# Keep the image lean and logs immediate: no .pyc files, unbuffered stdout.
ENV PYTHONDONTWRITEBYTECODE=1
ENV PYTHONUNBUFFERED=1

# ffmpeg is required by perception_roi_server.py to transcode outputs to H.264.
RUN apt-get update \
    && apt-get install -y --no-install-recommends ffmpeg \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /app

# Install dependencies first so this layer is cached across code-only changes.
COPY requirements.txt /app/requirements.txt
RUN pip install --no-cache-dir -r /app/requirements.txt

COPY perception_roi_server.py /app/perception_roi_server.py

# Default port expected by the hosting platform.
EXPOSE 7860

CMD ["python", "/app/perception_roi_server.py", "--host", "0.0.0.0", "--port", "7860"]
perception_roi_server.py ADDED
@@ -0,0 +1,789 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ ROI-aware compression server (FastAPI)
4
+ - Uploads a video and prompt
5
+ - Runs YOLOv8x detection + simple tracking
6
+ - Produces 3 outputs: overlay (tracking), compressed, ROI-preserved
7
+ - Serves MJPEG stream of live overlay
8
+
9
+ Endpoints:
10
+ POST /track/async
11
+ POST /process/compress/{job_id}
12
+ GET /process/status/{job_id}
13
+ GET /process/video/overlay/{job_id}
14
+ GET /process/video/compressed/{job_id}
15
+ GET /process/video/roi/{job_id}
16
+ GET /detect/stream/{job_id}
17
+ """
18
+
19
+ import os
20
+ import uuid
21
+ import time
22
+ import math
23
+ import threading
24
+ import shutil
25
+ import subprocess
26
+ from dataclasses import dataclass, field
27
+ from typing import Dict, List, Optional, Any
28
+
29
+ import cv2
30
+ import numpy as np
31
+ from fastapi import FastAPI, UploadFile, File, Form, HTTPException
32
+ from fastapi.middleware.cors import CORSMiddleware
33
+ from fastapi.responses import FileResponse, StreamingResponse, JSONResponse
34
+ from ultralytics import YOLO
35
+
36
# Detection configuration, overridable via environment variables.
DEFAULT_WEIGHTS = os.environ.get("YOLO_WEIGHTS", "yolov8s.pt")  # YOLO weights file/name
DEFAULT_CONF = float(os.environ.get("YOLO_CONF", "0.25"))  # confidence threshold
DEFAULT_DEVICE = os.environ.get("YOLO_DEVICE", "auto")  # inference device ("auto", "cpu", "cuda", ...)
FAST_DETECT_SCALE = float(os.environ.get("FAST_DETECT_SCALE", "0.65"))  # frame downscale factor in fast mode
FAST_DETECT_IMGSZ = int(os.environ.get("FAST_DETECT_IMGSZ", "512"))  # YOLO inference imgsz in fast mode

app = FastAPI(title="ROI Compression Server", version="1.0.0")
# Fully permissive CORS so browser frontends on any origin can call the API.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=False,
    allow_methods=["*"],
    allow_headers=["*"],
)
50
+
51
_model_lock = threading.Lock()
# Cache of loaded models keyed by weights path. The original single-slot
# cache ignored `weights` after the first load, silently returning the
# first model for any later weights request.
_models: Dict[str, YOLO] = {}
_model: Optional[YOLO] = None  # kept for backward compatibility (first model loaded)


def get_model(weights: str) -> YOLO:
    """Return a process-wide YOLO model for *weights*, loading it at most once.

    Thread-safe; distinct weights paths get distinct cached models.
    """
    global _model
    with _model_lock:
        model = _models.get(weights)
        if model is None:
            model = YOLO(weights)
            _models[weights] = model
            if _model is None:
                _model = model
        return model
60
+
61
+
62
+ def _parse_queries(q: str) -> List[str]:
63
+ if not q:
64
+ return []
65
+ parts = [p.strip().lower() for p in q.replace("\n", ",").split(",")]
66
+ return [p for p in parts if p]
67
+
68
+
69
+ def _keep_det(label: str, queries: List[str]) -> bool:
70
+ if not queries:
71
+ return True
72
+ l = (label or "").strip().lower()
73
+ if not l:
74
+ return False
75
+ return any((q == l) or (q in l) or (l in q) for q in queries)
76
+
77
+
78
def _yolo_detect_frame(
    model: YOLO,
    frame_bgr: np.ndarray,
    conf: float,
    queries: List[str],
    device: str,
    fast_mode: bool = False,
) -> List[Dict[str, Any]]:
    """Run YOLO on one BGR frame and return filtered detections.

    Returns a list of dicts with keys "bbox_xyxy" (original-frame pixel
    coordinates), "label" and "score". In fast mode the frame is
    downscaled before inference and boxes are scaled back up.
    """
    scale = 1.0
    if fast_mode:
        scale = max(0.1, min(1.0, float(FAST_DETECT_SCALE)))
    if scale < 1.0:
        h, w = frame_bgr.shape[:2]
        # Keep at least 64px per side so tiny frames stay usable.
        sw, sh = max(64, int(w * scale)), max(64, int(h * scale))
        small = cv2.resize(frame_bgr, (sw, sh), interpolation=cv2.INTER_AREA)
        img = cv2.cvtColor(small, cv2.COLOR_BGR2RGB)
    else:
        img = cv2.cvtColor(frame_bgr, cv2.COLOR_BGR2RGB)

    pred_kwargs = {"conf": conf, "verbose": False}
    if fast_mode:
        pred_kwargs["imgsz"] = FAST_DETECT_IMGSZ
    if device and str(device).lower() != "auto":
        pred_kwargs["device"] = device
    if fast_mode and str(device).lower() != "cpu":
        # Half precision is only meaningful off-CPU.
        pred_kwargs["half"] = True
    try:
        res = model.predict(img, **pred_kwargs)
    except Exception as e:
        msg = str(e)
        # CUDA-specific failures get one retry on CPU; anything else propagates.
        if ("cuda" in msg.lower()) and (str(device).lower() != "cpu"):
            pred_kwargs["device"] = "cpu"
            res = model.predict(img, **pred_kwargs)
        else:
            raise
    if not res:
        return []
    r0 = res[0]
    # Class-name map may live on the result or the model depending on version.
    names = getattr(r0, "names", None) or getattr(model, "names", None) or {}
    boxes = []
    if r0.boxes is None:
        return boxes
    for b in r0.boxes:
        try:
            xyxy = b.xyxy[0].cpu().numpy().tolist()
            if scale < 1.0:
                # Map box coordinates back to original-frame pixels.
                inv = 1.0 / scale
                xyxy = [v * inv for v in xyxy]
            score = float(b.conf[0].cpu().numpy())
            cls_i = int(b.cls[0].cpu().numpy())
            label = str(names.get(cls_i, cls_i))
            if not _keep_det(label, queries):
                continue
            boxes.append({"bbox_xyxy": xyxy, "label": label, "score": score})
        except Exception:
            # Skip malformed individual boxes rather than failing the frame.
            continue
    return boxes
135
+
136
+
137
def _draw_boxes(frame_bgr: np.ndarray, dets: List[Dict[str, Any]]) -> np.ndarray:
    """Return a copy of the frame with detection boxes and captions drawn."""
    canvas = frame_bgr.copy()
    green = (0, 255, 0)
    for det in dets:
        box = det.get("bbox_xyxy")
        if not (isinstance(box, (list, tuple)) and len(box) == 4):
            continue
        x1, y1, x2, y2 = (int(max(0, coord)) for coord in box)
        label = str(det.get("label", ""))
        score = det.get("score", None)
        tid = det.get("track_id", None)
        tag = f"#{tid}" if isinstance(tid, int) else ""
        if isinstance(score, (float, int)):
            caption = f"{label}{tag} {score:.2f}"
        else:
            caption = f"{label}{tag}"
        cv2.rectangle(canvas, (x1, y1), (x2, y2), green, 2)
        if caption:
            # Keep the caption on-screen even when the box touches the top edge.
            cv2.putText(canvas, caption, (x1, max(12, y1 - 6)), cv2.FONT_HERSHEY_SIMPLEX, 0.5, green, 1, cv2.LINE_AA)
    return canvas
153
+
154
+
155
+ def _iou_xyxy(a: List[float], b: List[float]) -> float:
156
+ ax1, ay1, ax2, ay2 = a
157
+ bx1, by1, bx2, by2 = b
158
+ inter_x1 = max(ax1, bx1)
159
+ inter_y1 = max(ay1, by1)
160
+ inter_x2 = min(ax2, bx2)
161
+ inter_y2 = min(ay2, by2)
162
+ if inter_x2 <= inter_x1 or inter_y2 <= inter_y1:
163
+ return 0.0
164
+ inter = (inter_x2 - inter_x1) * (inter_y2 - inter_y1)
165
+ area_a = max(0.0, (ax2 - ax1)) * max(0.0, (ay2 - ay1))
166
+ area_b = max(0.0, (bx2 - bx1)) * max(0.0, (by2 - by1))
167
+ denom = area_a + area_b - inter
168
+ if denom <= 0:
169
+ return 0.0
170
+ return float(inter / denom)
171
+
172
+
173
def _assign_tracks(dets: List[Dict[str, Any]], tracker: Dict[str, Any], iou_thresh: float = 0.3) -> List[Dict[str, Any]]:
    """Greedy IoU matching of detections against the previous frame's tracks.

    Mutates each detection in place by adding a "track_id", updates
    tracker["tracks"]/"next_id", and returns the detections.
    """
    previous = tracker.get("tracks", [])
    claimed = set()
    assigned = []
    for det in dets:
        box = det.get("bbox_xyxy")
        det_label = str(det.get("label", ""))
        match_idx = None
        match_iou = 0.0
        if isinstance(box, (list, tuple)) and len(box) == 4:
            for idx, track in enumerate(previous):
                if idx in claimed:
                    continue
                # Never associate across different labels.
                if det_label and track.get("label") and track.get("label") != det_label:
                    continue
                overlap = _iou_xyxy(box, track.get("bbox_xyxy", [0, 0, 0, 0]))
                if overlap > match_iou:
                    match_iou = overlap
                    match_idx = idx
        if match_idx is not None and match_iou >= iou_thresh:
            det["track_id"] = int(previous[match_idx].get("id"))
            claimed.add(match_idx)
        else:
            # No match: mint a new id.
            det["track_id"] = int(tracker.get("next_id", 1))
            tracker["next_id"] = int(det["track_id"]) + 1
        assigned.append(det)
    tracker["tracks"] = [
        {"id": int(d.get("track_id")), "bbox_xyxy": d.get("bbox_xyxy"), "label": d.get("label", "")}
        for d in assigned
    ]
    return assigned
204
+
205
+
206
+ def _ensure_even(v: int, min_v: int = 64) -> int:
207
+ v = max(min_v, int(v))
208
+ return v - (v % 2)
209
+
210
+
211
+ def _compute_target_params(w: int, h: int, fps: float, bandwidth_kbps: int, target_fps: int, target_w: int, target_h: int, scale: float):
212
+ fps = max(1.0, float(fps or 1.0))
213
+ budget = max(100, int(bandwidth_kbps or 1500))
214
+ base_kbps_720p30 = 2500.0
215
+ base_kbps_orig = base_kbps_720p30 * (float(w) * float(h) * fps) / (1280.0 * 720.0 * 30.0)
216
+ if not math.isfinite(base_kbps_orig) or base_kbps_orig <= 0:
217
+ base_kbps_orig = base_kbps_720p30
218
+ if target_w and target_h:
219
+ tw, th = int(target_w), int(target_h)
220
+ else:
221
+ scale = float(scale or 1.0)
222
+ if scale < 0.1:
223
+ scale = 0.1
224
+ if scale > 1.0:
225
+ scale = 1.0
226
+ tw, th = int(w * scale), int(h * scale)
227
+ tfps = int(target_fps or fps)
228
+ scale_r = min(1.0, math.sqrt(budget / base_kbps_orig))
229
+ tw = min(tw, int(w * scale_r))
230
+ th = min(th, int(h * scale_r))
231
+ tfps = min(int(fps), tfps)
232
+ tw = _ensure_even(max(64, tw))
233
+ th = _ensure_even(max(64, th))
234
+ tfps = max(1, tfps)
235
+ frame_step = max(1, int(round(fps / max(1, tfps))))
236
+ return tw, th, tfps, frame_step
237
+
238
+
239
def _open_writer(path: str, w: int, h: int, fps: float) -> Optional[cv2.VideoWriter]:
    """Open a cv2.VideoWriter at *path*, or return None on any failure.

    Deliberately forces the software-friendly 'mp4v' codec: hardware H.264
    writers fail on some systems, and the final browser-friendly H.264 file
    is produced later by _transcode_h264 via ffmpeg.
    """
    if w <= 0 or h <= 0:
        return None
    try:
        fourcc = cv2.VideoWriter_fourcc(*"mp4v")
        writer = cv2.VideoWriter(path, fourcc, float(fps or 30.0), (int(w), int(h)))
        if writer is not None and writer.isOpened():
            return writer
    except Exception:
        pass
    return None
260
+
261
+
262
+ def _ffmpeg_available() -> bool:
263
+ return shutil.which("ffmpeg") is not None
264
+
265
+
266
+ def _transcode_h264(src_path: str) -> Optional[str]:
267
+ if not src_path or not os.path.exists(src_path):
268
+ return None
269
+ if not _ffmpeg_available():
270
+ return None
271
+ dst_path = os.path.splitext(src_path)[0] + "_h264.mp4"
272
+ cmd = [
273
+ "ffmpeg",
274
+ "-y",
275
+ "-i",
276
+ src_path,
277
+ "-c:v",
278
+ "libx264",
279
+ "-preset",
280
+ "veryfast",
281
+ "-pix_fmt",
282
+ "yuv420p",
283
+ dst_path,
284
+ ]
285
+ try:
286
+ subprocess.run(cmd, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
287
+ if os.path.exists(dst_path) and os.path.getsize(dst_path) > 1024:
288
+ return dst_path
289
+ except Exception:
290
+ return None
291
+ return None
292
+
293
+
294
def _apply_roi_overlay(frame_bgr: np.ndarray, dets: List[Dict[str, Any]], target_w: int, target_h: int) -> np.ndarray:
    """Degrade the background by down/up-scaling, keeping ROIs at full quality.

    The whole frame is resized down to (target_w, target_h) and back up,
    then each (slightly padded) detection box is pasted back from the
    original frame at native resolution.
    """
    h, w = frame_bgr.shape[:2]
    downscaled = cv2.resize(frame_bgr, (int(target_w), int(target_h)), interpolation=cv2.INTER_AREA)
    degraded = cv2.resize(downscaled, (int(w), int(h)), interpolation=cv2.INTER_LINEAR)
    result = degraded.copy()
    margin = max(2, int(min(w, h) * 0.005))
    for det in dets:
        box = det.get("bbox_xyxy")
        if not (isinstance(box, (list, tuple)) and len(box) == 4):
            continue
        x1, y1, x2, y2 = (int(c) for c in box)
        x1 = max(0, x1 - margin)
        y1 = max(0, y1 - margin)
        x2 = min(w, x2 + margin)
        y2 = min(h, y2 + margin)
        if x2 > x1 and y2 > y1:
            result[y1:y2, x1:x2] = frame_bgr[y1:y2, x1:x2]
    return result
313
+
314
+
315
@dataclass
class Job:
    """Mutable state for one upload -> track -> compress pipeline run.

    Shared between request handlers and background worker threads; fields
    other than the immutable `id`/`video_path` are guarded by `lock`.
    """

    id: str  # short hex job identifier
    video_path: str  # path of the uploaded source video
    created: float = field(default_factory=time.time)  # creation time (epoch seconds)
    status: str = "tracking"  # tracking -> tracked -> compressing -> completed | error
    error: Optional[str] = None  # error message when status == "error"
    fps: float = 30.0  # source video fps (filled in by _process_job)
    w: int = 0  # source width in pixels
    h: int = 0  # source height in pixels
    frame_step: int = 1  # process every Nth source frame
    target_fps: int = 15  # output fps after bandwidth clamping
    target_width: int = 0  # output width (0 = derive from scale)
    target_height: int = 0  # output height (0 = derive from scale)
    bandwidth_kbps: int = 1500  # bitrate budget driving down-scaling
    conf: float = DEFAULT_CONF  # YOLO confidence threshold
    weights: str = DEFAULT_WEIGHTS  # YOLO weights path/name
    device: str = DEFAULT_DEVICE  # inference device ("auto", "cpu", ...)
    fast_mode: bool = False  # downscale + half precision for speed
    queries: List[str] = field(default_factory=list)  # lowercase label filters
    overlay_video_path: Optional[str] = None  # tracked-overlay output video
    compressed_video_path: Optional[str] = None  # uniformly compressed output video
    roi_video_path: Optional[str] = None  # ROI-preserving output video
    det_by_frame: Dict[int, List[Dict[str, Any]]] = field(default_factory=dict)  # frame index -> detections
    latest_jpeg: Optional[bytes] = None  # last overlay frame for the MJPEG stream
    latest_compressed_jpeg: Optional[bytes] = None  # last compressed preview frame
    latest_roi_jpeg: Optional[bytes] = None  # last ROI preview frame
    lock: threading.Lock = field(default_factory=threading.Lock)  # guards mutable fields
    tracker_state: Dict[str, Any] = field(default_factory=lambda: {"next_id": 1, "tracks": []})  # IoU tracker memory


# In-memory job registry (process-local; all jobs are lost on restart).
jobs: Dict[str, Job] = {}
347
+
348
+
349
def _process_job(job: Job):
    """Background worker: run detection + tracking over the whole video.

    Writes a boxed overlay video at source resolution, records per-frame
    detections in job.det_by_frame for the later compression pass, and
    keeps job.latest_jpeg updated for the live MJPEG preview. On any
    failure, sets job.status = "error" with the message in job.error.
    """
    try:
        model = get_model(job.weights)
        cap = cv2.VideoCapture(job.video_path)
        if not cap.isOpened():
            raise RuntimeError("Could not open video.")
        fps = float(cap.get(cv2.CAP_PROP_FPS) or 30.0)
        w = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH) or 0)
        h = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT) or 0)

        # Negotiate output geometry/fps under the job's bandwidth budget.
        tw, th, tfps, frame_step = _compute_target_params(
            w=w,
            h=h,
            fps=fps,
            bandwidth_kbps=job.bandwidth_kbps,
            target_fps=job.target_fps,
            target_w=job.target_width,
            target_h=job.target_height,
            scale=max(0.25, min(1.0, (job.target_width / w) if (job.target_width and w) else 1.0)),
        )

        os.makedirs("outputs", exist_ok=True)
        overlay_path = os.path.join("outputs", f"{job.id}_overlay.mp4")
        # The overlay keeps source resolution; only fps is reduced.
        overlay_writer = _open_writer(overlay_path, w, h, tfps)

        with job.lock:
            job.fps = fps
            job.w = w
            job.h = h
            job.frame_step = frame_step
            job.target_fps = tfps
            job.target_width = tw
            job.target_height = th
            job.overlay_video_path = overlay_path if overlay_writer is not None else None
            job.status = "tracking"

        frame_idx = 0
        tracker = job.tracker_state
        while True:
            ok, frame = cap.read()
            if not ok:
                break
            # Subsample frames to hit the target fps.
            if frame_idx % frame_step != 0:
                frame_idx += 1
                continue

            dets = _yolo_detect_frame(model, frame, conf=job.conf, queries=job.queries, device=job.device, fast_mode=job.fast_mode)
            # If the detector supplied no track ids, run the in-house IoU
            # tracker; otherwise mirror its ids into the tracker state.
            if dets and not any("track_id" in d for d in dets):
                dets = _assign_tracks(dets, tracker)
            elif dets:
                tracker["tracks"] = [
                    {"id": int(d.get("track_id")), "bbox_xyxy": d.get("bbox_xyxy"), "label": d.get("label", "")}
                    for d in dets
                ]
                max_id = max((int(d.get("track_id", 0)) for d in dets), default=0)
                tracker["next_id"] = max(tracker.get("next_id", 1), max_id + 1)

            with job.lock:
                job.det_by_frame[int(frame_idx)] = dets

            overlay = _draw_boxes(frame, dets)
            # Cache a JPEG of the latest overlay frame for the MJPEG stream.
            ok2, jpg = cv2.imencode(".jpg", overlay, [int(cv2.IMWRITE_JPEG_QUALITY), 80])
            if ok2:
                with job.lock:
                    job.latest_jpeg = jpg.tobytes()

            if overlay_writer is not None:
                overlay_writer.write(overlay)

            frame_idx += 1

        cap.release()
        if overlay_writer is not None:
            try:
                overlay_writer.release()
            except Exception:
                pass

        # Prefer a browser-friendly H.264 transcode when ffmpeg is available.
        h264_overlay = _transcode_h264(overlay_path) if overlay_writer is not None else None
        with job.lock:
            if h264_overlay:
                job.overlay_video_path = h264_overlay
            job.status = "tracked"
    except Exception as e:
        with job.lock:
            job.status = "error"
            job.error = str(e)
436
+
437
+
438
def _compress_job(job: Job, bandwidth_kbps: int, target_fps: int, target_w: int, target_h: int, resolution_scale: float):
    """Background worker: produce compressed and ROI-preserved output videos.

    Re-reads the source video and reuses the detections recorded by
    _process_job (job.det_by_frame); frames without a recorded entry reuse
    the most recent detections. Updates job.latest_*_jpeg previews for the
    MJPEG streams. On failure, sets job.status = "error".
    """
    try:
        cap = cv2.VideoCapture(job.video_path)
        if not cap.isOpened():
            raise RuntimeError("Could not open video.")
        fps = float(cap.get(cv2.CAP_PROP_FPS) or 30.0)
        w = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH) or 0)
        h = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT) or 0)

        # Negotiate output size/fps under the requested bandwidth budget.
        tw, th, tfps, frame_step = _compute_target_params(
            w=w,
            h=h,
            fps=fps,
            bandwidth_kbps=bandwidth_kbps,
            target_fps=target_fps,
            target_w=target_w,
            target_h=target_h,
            scale=resolution_scale,
        )

        os.makedirs("outputs", exist_ok=True)
        compressed_path = os.path.join("outputs", f"{job.id}_compressed_rt.mp4")
        roi_path = os.path.join("outputs", f"{job.id}_roi_rt.mp4")

        # Compressed output is downscaled; ROI output keeps source resolution.
        compressed_writer = _open_writer(compressed_path, tw, th, tfps)
        roi_writer = _open_writer(roi_path, w, h, tfps)

        with job.lock:
            job.status = "compressing"
            job.bandwidth_kbps = int(bandwidth_kbps)
            job.target_fps = int(tfps)
            job.target_width = int(tw)
            job.target_height = int(th)

        frame_idx = 0
        last_dets: List[Dict[str, Any]] = []
        while True:
            ok, frame = cap.read()
            if not ok:
                break
            if frame_idx % frame_step != 0:
                frame_idx += 1
                continue

            # Reuse tracked detections; fall back to the last known ones.
            dets = job.det_by_frame.get(int(frame_idx))
            if dets is None:
                dets = last_dets
            else:
                last_dets = dets

            compressed_frame = None
            roi_frame = None

            if compressed_writer is not None:
                try:
                    compressed_frame = cv2.resize(frame, (tw, th), interpolation=cv2.INTER_AREA)
                    compressed_writer.write(compressed_frame)
                except Exception:
                    compressed_frame = None

            if roi_writer is not None:
                try:
                    roi_frame = _apply_roi_overlay(frame, dets, tw, th)
                    roi_writer.write(roi_frame)
                except Exception:
                    roi_frame = None

            # Cache JPEG previews for the MJPEG streaming endpoints (best effort).
            try:
                if compressed_frame is not None:
                    okc, jpgc = cv2.imencode(".jpg", compressed_frame, [int(cv2.IMWRITE_JPEG_QUALITY), 80])
                    if okc:
                        with job.lock:
                            job.latest_compressed_jpeg = jpgc.tobytes()
                if roi_frame is not None:
                    okr, jpgr = cv2.imencode(".jpg", roi_frame, [int(cv2.IMWRITE_JPEG_QUALITY), 80])
                    if okr:
                        with job.lock:
                            job.latest_roi_jpeg = jpgr.tobytes()
            except Exception:
                pass

            frame_idx += 1

        cap.release()
        for wtr in (compressed_writer, roi_writer):
            if wtr is not None:
                try:
                    wtr.release()
                except Exception:
                    pass

        # Prefer browser-friendly H.264 transcodes when ffmpeg is available.
        h264_compressed = _transcode_h264(compressed_path) if compressed_writer is not None else None
        h264_roi = _transcode_h264(roi_path) if roi_writer is not None else None

        with job.lock:
            if h264_compressed:
                job.compressed_video_path = h264_compressed
            else:
                job.compressed_video_path = compressed_path if os.path.exists(compressed_path) else job.compressed_video_path
            if h264_roi:
                job.roi_video_path = h264_roi
            else:
                job.roi_video_path = roi_path if os.path.exists(roi_path) else job.roi_video_path
            job.status = "completed"
    except Exception as e:
        with job.lock:
            job.status = "error"
            job.error = str(e)
546
+
547
+
548
@app.post("/track/async")
async def track_async(
    video: UploadFile = File(...),
    queries: str = Form(""),
    conf: float = Form(DEFAULT_CONF),
    weights: str = Form(DEFAULT_WEIGHTS),
    device: str = Form(""),
    fast_mode: bool = Form(False),
    bandwidth_kbps: int = Form(1500),
    target_fps: int = Form(15),
    target_width: int = Form(0),
    target_height: int = Form(0),
    # NOTE(review): resolution_scale is accepted here but not used by this
    # endpoint — only /process/compress honours it. Confirm intended.
    resolution_scale: float = Form(1.0),
):
    """Accept a video upload and start detection + tracking in the background.

    Saves the upload, registers a Job, runs a best-effort detection on the
    first frame so the MJPEG preview has content immediately, then launches
    the tracking worker thread. Returns the job id plus URLs for status,
    live stream, and the three output videos.
    """
    job_id = uuid.uuid4().hex[:12]
    os.makedirs("uploads", exist_ok=True)
    dst = os.path.join("uploads", f"{job_id}_{os.path.basename(video.filename or 'input.mp4')}")
    data = await video.read()
    with open(dst, "wb") as f:
        f.write(data)

    job = Job(
        id=job_id,
        video_path=dst,
        status="tracking",
        conf=float(conf),
        weights=str(weights),
        device=str(device).strip() or DEFAULT_DEVICE,
        queries=_parse_queries(queries),
        fast_mode=bool(fast_mode),
        target_fps=int(target_fps or 15),
        bandwidth_kbps=int(bandwidth_kbps or 1500),
        target_width=int(target_width or 0),
        target_height=int(target_height or 0),
    )
    jobs[job_id] = job

    # Best-effort first-frame detection so the MJPEG stream has an initial
    # image before the worker thread produces one; failures are ignored.
    try:
        cap = cv2.VideoCapture(dst)
        ok, frame0 = cap.read()
        cap.release()
        if ok and frame0 is not None:
            model = get_model(job.weights)
            det0 = _yolo_detect_frame(model, frame0, conf=job.conf, queries=job.queries, device=job.device, fast_mode=job.fast_mode)
            det0 = _assign_tracks(det0, job.tracker_state)
            with job.lock:
                job.det_by_frame[0] = det0
            vis0 = _draw_boxes(frame0, det0)
            ok2, jpg = cv2.imencode(".jpg", vis0, [int(cv2.IMWRITE_JPEG_QUALITY), 80])
            if ok2:
                with job.lock:
                    job.latest_jpeg = jpg.tobytes()
    except Exception:
        pass

    t = threading.Thread(target=_process_job, args=(job,), daemon=True)
    t.start()

    return JSONResponse({
        "job_id": job_id,
        "status_url": f"/process/status/{job_id}",
        "stream_url": f"/detect/stream/{job_id}",
        "overlay_video_url": f"/process/video/overlay/{job_id}",
        "compressed_video_url": f"/process/video/compressed/{job_id}",
        "roi_video_url": f"/process/video/roi/{job_id}",
    })
615
+
616
+
617
@app.post("/process/compress/{job_id}")
async def process_compress(
    job_id: str,
    bandwidth_kbps: int = Form(1500),
    target_fps: int = Form(15),
    target_width: int = Form(0),
    target_height: int = Form(0),
    resolution_scale: float = Form(1.0),
):
    """Kick off the compression pass for a job whose tracking has finished."""
    job = jobs.get(job_id)
    if job is None:
        raise HTTPException(status_code=404, detail="Unknown job_id")
    with job.lock:
        if job.status in ("tracking", "compressing"):
            raise HTTPException(status_code=409, detail="Job still running")
        if job.status not in ("tracked", "completed"):
            raise HTTPException(status_code=409, detail="Tracking not ready")

    worker = threading.Thread(
        target=_compress_job,
        args=(job, int(bandwidth_kbps), int(target_fps), int(target_width), int(target_height), float(resolution_scale)),
        daemon=True,
    )
    worker.start()
    return JSONResponse({"job_id": job_id, "status": "compressing"})
642
+
643
+
644
@app.get("/process/status/{job_id}")
def process_status(job_id: str):
    """Report a job's current status and negotiated output parameters."""
    job = jobs.get(job_id)
    if job is None:
        raise HTTPException(status_code=404, detail="Unknown job_id")
    with job.lock:
        snapshot = {
            "job_id": job.id,
            "status": job.status,
            "error": job.error,
            "target_width": job.target_width,
            "target_height": job.target_height,
            "target_fps": job.target_fps,
            "bandwidth_kbps": job.bandwidth_kbps,
        }
    return snapshot
659
+
660
+
661
+ def _mjpeg_generator(job: Job):
662
+ boundary = b"--frame"
663
+ while True:
664
+ with job.lock:
665
+ jpg = job.latest_jpeg
666
+ status = job.status
667
+ err = job.error
668
+ if err:
669
+ break
670
+ if jpg:
671
+ yield boundary + b"\r\n"
672
+ yield b"Content-Type: image/jpeg\r\n"
673
+ yield f"Content-Length: {len(jpg)}\r\n\r\n".encode("ascii")
674
+ yield jpg + b"\r\n"
675
+ time.sleep(0.15)
676
+ if status in ("completed", "error"):
677
+ time.sleep(0.5)
678
+ break
679
+
680
+
681
+ def _mjpeg_generator_compressed(job: Job):
682
+ boundary = b"--frame"
683
+ while True:
684
+ with job.lock:
685
+ jpg = job.latest_compressed_jpeg
686
+ status = job.status
687
+ err = job.error
688
+ if err:
689
+ break
690
+ if jpg:
691
+ yield boundary + b"\r\n"
692
+ yield b"Content-Type: image/jpeg\r\n"
693
+ yield f"Content-Length: {len(jpg)}\r\n\r\n".encode("ascii")
694
+ yield jpg + b"\r\n"
695
+ time.sleep(0.15)
696
+ if status in ("completed", "error"):
697
+ time.sleep(0.5)
698
+ break
699
+
700
+
701
+ def _mjpeg_generator_roi(job: Job):
702
+ boundary = b"--frame"
703
+ while True:
704
+ with job.lock:
705
+ jpg = job.latest_roi_jpeg
706
+ status = job.status
707
+ err = job.error
708
+ if err:
709
+ break
710
+ if jpg:
711
+ yield boundary + b"\r\n"
712
+ yield b"Content-Type: image/jpeg\r\n"
713
+ yield f"Content-Length: {len(jpg)}\r\n\r\n".encode("ascii")
714
+ yield jpg + b"\r\n"
715
+ time.sleep(0.15)
716
+ if status in ("completed", "error"):
717
+ time.sleep(0.5)
718
+ break
719
+
720
+
721
@app.get("/detect/stream/{job_id}")
def detect_stream(job_id: str):
    """Live MJPEG stream of the tracking overlay for a job."""
    job = jobs.get(job_id)
    if job is None:
        raise HTTPException(status_code=404, detail="Unknown job_id")
    media = "multipart/x-mixed-replace; boundary=frame"
    return StreamingResponse(_mjpeg_generator(job), media_type=media)
727
+
728
+
729
@app.get("/process/stream/compressed/{job_id}")
def process_stream_compressed(job_id: str):
    """Live MJPEG stream of the compressed preview frames for a job."""
    job = jobs.get(job_id)
    if job is None:
        raise HTTPException(status_code=404, detail="Unknown job_id")
    media = "multipart/x-mixed-replace; boundary=frame"
    return StreamingResponse(_mjpeg_generator_compressed(job), media_type=media)
735
+
736
+
737
@app.get("/process/stream/roi/{job_id}")
def process_stream_roi(job_id: str):
    """Live MJPEG stream of the ROI-preserved preview frames for a job."""
    job = jobs.get(job_id)
    if job is None:
        raise HTTPException(status_code=404, detail="Unknown job_id")
    media = "multipart/x-mixed-replace; boundary=frame"
    return StreamingResponse(_mjpeg_generator_roi(job), media_type=media)
743
+
744
+
745
def _serve_video_or_source(job: "Job", candidate: Optional[str]) -> FileResponse:
    """Serve *candidate* when it exists and is plausibly non-empty (> 1 KiB);
    otherwise fall back to the original uploaded video. Factored out of three
    previously copy-pasted endpoints."""
    path = job.video_path
    if candidate and os.path.exists(candidate) and os.path.getsize(candidate) > 1024:
        path = candidate
    return FileResponse(path, media_type="video/mp4")


@app.get("/process/video/overlay/{job_id}")
def process_video_overlay(job_id: str):
    """Download the tracking-overlay video (source video as fallback)."""
    job = jobs.get(job_id)
    if not job:
        raise HTTPException(status_code=404, detail="Unknown job_id")
    return _serve_video_or_source(job, job.overlay_video_path)


@app.get("/process/video/compressed/{job_id}")
def process_video_compressed(job_id: str):
    """Download the compressed video (source video as fallback)."""
    job = jobs.get(job_id)
    if not job:
        raise HTTPException(status_code=404, detail="Unknown job_id")
    return _serve_video_or_source(job, job.compressed_video_path)


@app.get("/process/video/roi/{job_id}")
def process_video_roi(job_id: str):
    """Download the ROI-preserved video (source video as fallback)."""
    job = jobs.get(job_id)
    if not job:
        raise HTTPException(status_code=404, detail="Unknown job_id")
    return _serve_video_or_source(job, job.roi_video_path)
770
+
771
+
772
if __name__ == "__main__":
    import argparse
    import uvicorn

    p = argparse.ArgumentParser()
    p.add_argument("--host", default="127.0.0.1")
    p.add_argument("--port", default=8000, type=int)
    p.add_argument("--weights", default=DEFAULT_WEIGHTS)
    p.add_argument("--device", default=DEFAULT_DEVICE)
    args = p.parse_args()

    # NOTE(review): rebinding these globals happens after the Job dataclass
    # defaults were already evaluated at class-creation time, so --weights /
    # --device do not change Job's field defaults — only code that reads the
    # module globals afterwards. Confirm this is intended.
    DEFAULT_WEIGHTS = args.weights
    DEFAULT_DEVICE = args.device
    # Warm the model cache before accepting requests.
    get_model(args.weights)

    # Environment variables take precedence over CLI flags (container-friendly).
    # NOTE(review): args.host always has a value thanks to the argparse
    # default, so the `or "0.0.0.0"` fallback here is dead code.
    host = os.environ.get("HOST", args.host or "0.0.0.0")
    port = int(os.environ.get("PORT", args.port))
    uvicorn.run(app, host=host, port=port)
requirements.txt ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
# Pinned runtime dependencies for perception_roi_server.py
fastapi==0.115.2
uvicorn[standard]==0.30.6
ultralytics==8.3.34
opencv-python-headless==4.10.0.84
numpy==1.26.4