Spaces:

Arko007
/

maritime

Sleeping

File size: 20,534 Bytes

# processing.py
"""
SUB-SENTINEL processing pipeline (Groq-first, Ultralytics fallback).

Exports:
  enhance_image(raw_bytes) -> (base64_str, np.ndarray)
  run_detection(rgb, sonar_data=None, conf_thresh=0.40) -> list[dict]
  build_heatmap(rgb) -> base64_str
  fuse_sonar_overlay(rgb, sonar_data) -> base64_str
  generate_vector_sketch(detections) -> str (base64 zlib JSON)

Environment:
  DETECTION_BACKEND = "groq" | "ultralytics" | "auto"  (default "auto")
  DETECTION_MODEL   = path to model / compiled groq artifact or ultralytics model id (default "yolov8m.pt")
  GROQ_API_KEY      = optional API key for Groq LLM (if you want LLM postprocessing)
"""
import os
import io
import json
import zlib
import base64
import logging
from typing import Optional, List, Dict, Any

import cv2
import numpy as np
from PIL import Image
from skimage.metrics import structural_similarity as ssim

logger = logging.getLogger(__name__)
logger.addHandler(logging.NullHandler())

# Config
DEFAULT_DETECTION_MODEL = os.getenv("DETECTION_MODEL", "yolov8m.pt")
DETECTION_BACKEND = os.getenv("DETECTION_BACKEND", "auto").lower()  # "groq", "ultralytics", "auto"
GROQ_API_KEY = os.getenv("GROQ_API_KEY") or os.getenv("groq")  # read common variants

# Maritime label mapping (COCO -> maritime)
_LABEL_MAP: Dict[str, str] = {
    "person": "Diver/Swimmer",
    "boat": "Surface/Sub Threat",
    "ship": "Surface/Sub Threat",
    "submarine": "Surface/Sub Threat",
    "surfboard": "Surface/Sub Threat",
    # extend as needed
}

# --------------------------- utilities -------------------------------------
def _array_to_base64(img_array: np.ndarray, fmt: str = "PNG") -> str:
    pil_img = Image.fromarray(img_array.astype(np.uint8))
    buf = io.BytesIO()
    fmt_upper = fmt.upper()
    pil_img.save(buf, format=fmt_upper, quality=90)
    encoded = base64.b64encode(buf.getvalue()).decode("utf-8")
    mime = "image/png" if fmt_upper == "PNG" else "image/jpeg"
    return f"data:{mime};base64,{encoded}"


def _bytes_to_array(raw_bytes: bytes) -> np.ndarray:
    nparr = np.frombuffer(raw_bytes, np.uint8)
    bgr = cv2.imdecode(nparr, cv2.IMREAD_COLOR)
    if bgr is None:
        raise ValueError("OpenCV could not decode the image.")
    return cv2.cvtColor(bgr, cv2.COLOR_BGR2RGB)


def _ensure_int_box(box: List[float]) -> List[int]:
    return [int(round(v)) for v in box]


# ------------------------ enhancement engines -------------------------------
def _clahe_enhance(rgb: np.ndarray) -> np.ndarray:
    lab = cv2.cvtColor(rgb, cv2.COLOR_RGB2LAB)
    l, a, b = cv2.split(lab)
    clahe = cv2.createCLAHE(clipLimit=2.5, tileGridSize=(8, 8))
    l = clahe.apply(l)
    a = np.clip(a.astype(np.int16) - 5, 0, 255).astype(np.uint8)
    b = np.clip(b.astype(np.int16) + 10, 0, 255).astype(np.uint8)
    merged = cv2.merge([l, a, b])
    return cv2.cvtColor(merged, cv2.COLOR_LAB2RGB)


def _funiegan_enhance(rgb: np.ndarray) -> Optional[np.ndarray]:
    weights_path = "weights/funiegan.onnx"
    if not os.path.exists(weights_path):
        return None
    try:
        net = cv2.dnn.readNetFromONNX(weights_path)
        h, w = rgb.shape[:2]
        resized = cv2.resize(rgb, (256, 256)).astype(np.float32) / 127.5 - 1.0
        blob = cv2.dnn.blobFromImage(resized)
        net.setInput(blob)
        out = net.forward()
        out_img = ((out[0].transpose(1, 2, 0) + 1.0) * 127.5).clip(0, 255).astype(np.uint8)
        return cv2.resize(out_img, (w, h))
    except Exception as exc:
        logger.warning("FUnIE-GAN inference failed (%s); falling back.", exc)
        return None


def enhance_image(raw_bytes: bytes, prefer_funiegan: bool = True) -> tuple[str, np.ndarray]:
    rgb = _bytes_to_array(raw_bytes)
    enhanced = None
    if prefer_funiegan:
        enhanced = _funiegan_enhance(rgb)
    if enhanced is None:
        enhanced = _clahe_enhance(rgb)
    return _array_to_base64(enhanced, fmt="JPEG"), rgb


# ------------------------- forensic heatmap --------------------------------
def build_heatmap(rgb: np.ndarray) -> str:
    gray = cv2.cvtColor(rgb, cv2.COLOR_RGB2GRAY)
    blurred = cv2.GaussianBlur(gray, (15, 15), 0)
    try:
        _, ssim_map = ssim(gray, blurred, full=True, data_range=255)
    except Exception:
        diff = cv2.absdiff(gray, blurred).astype(np.float32) / 255.0
        ssim_map = 1.0 - diff
    ssim_norm = ((ssim_map + 1.0) / 2.0 * 255.0).clip(0, 255).astype(np.uint8)
    colormap = cv2.COLORMAP_RdYlGn if hasattr(cv2, "COLORMAP_RdYlGn") else cv2.COLORMAP_JET
    heatmap_bgr = cv2.applyColorMap(ssim_norm, colormap)
    rgb_bgr = cv2.cvtColor(rgb, cv2.COLOR_RGB2BGR)
    overlay = cv2.addWeighted(rgb_bgr, 0.55, heatmap_bgr, 0.45, 0)
    overlay_rgb = cv2.cvtColor(overlay, cv2.COLOR_BGR2RGB)
    return _array_to_base64(overlay_rgb, fmt="PNG")


# ------------------------- detection helpers --------------------------------
def _local_texture_authenticity(patch: np.ndarray) -> float:
    if patch is None or patch.size == 0:
        return 0.0
    gray = cv2.cvtColor(patch, cv2.COLOR_RGB2GRAY) if patch.ndim == 3 else patch
    var = cv2.Laplacian(gray, cv2.CV_64F).var()
    norm = (var - 10.0) / (200.0 - 10.0)
    return float(np.clip(norm, 0.0, 1.0))


# ---------------------- Groq runtime backend (placeholder) ------------------
def _run_detection_groq(rgb: np.ndarray, compiled_model_path: str, conf_thresh: float) -> List[Dict[str, Any]]:
    """
    Placeholder Groq runner. Replace with your project's Groq runtime/SDK calls.

    Recommended flow:
      - import the Groq runtime installed in your environment (API differs by Groq release)
      - load compiled artifact or use a long-lived runner
      - prepare input (resize / normalize) exactly as the compiled model expects
      - run inference and parse outputs into COCO-like detections:
            [ {"class": "person", "conf": 0.82, "bbox":[x1,y1,x2,y2]}, ... ]
    If Groq runtime isn't installed, this function raises and the pipeline will fallback.
    """
    # Try to import a Groq runtime package (NAME VARIES). This is intentionally guarded.
    try:
        # Example placeholder import; replace with your runtime import
        import groq_runtime  # <<-- REPLACE with actual Groq runtime package for your compiled model
    except Exception as exc:
        raise RuntimeError("Groq runtime not installed") from exc

    # PSEUDOCODE (replace with your actual runtime usage):
    try:
        # runner = groq_runtime.Runner(compiled_model_path)
        # model_input = cv2.resize(rgb, (MODEL_W, MODEL_H)).astype(np.float32) / 255.0
        # batch = np.expand_dims(model_input, axis=0)
        # outputs = runner.run(batch)
        # parse outputs -> parsed_detections
        parsed_detections: List[Dict[str, Any]] = []
        # -----> Replace the pseudocode above with real runtime calls and parsing
        return parsed_detections
    except Exception as exc:
        raise RuntimeError("Groq model execution failed") from exc


# -------------------- Groq LLM refinement (optional) ------------------------
def refine_with_groq_llm(detections: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
    """
    (Optional) Use a Groq LLM to refine/correct YOLO outputs (label mapping, merge boxes, etc.)
    This function is intentionally conservative: if no GROQ_API_KEY or client, it returns original detections.

    To enable: install the Groq client/SDK for LLM usage and replace the body below
    with a real call. Keep the function robust: always return a list of detections.
    """
    if not GROQ_API_KEY or not detections:
        return detections

    # >>> EXAMPLE (COMMENTED) - Replace with your Groq LLM client usage <<<
    # try:
    #     import groq
    #     client = groq.Client(api_key=GROQ_API_KEY)
    #     prompt = "You are a maritime analyst. Given these detections (JSON), correct labels and return JSON list."
    #     response = client.chat.completions.create(
    #         model="llama-3-small", messages=[{"role":"user","content":prompt + json.dumps(detections)}], temperature=0.2
    #     )
    #     refined = json.loads(response.choices[0].message.content)
    #     return refined
    # except Exception as e:
    #     logger.warning("Groq LLM refine failed: %s", e)
    #     return detections

    # By default, return unchanged (safe!)
    return detections


# ------------------------- unified detection (Groq -> Ultralytics) ----------
def run_detection(rgb: np.ndarray,
                  sonar_data: Optional[Dict[str, Any]] = None,
                  conf_thresh: float = 0.40,
                  allowed_only: Optional[List[str]] = None) -> List[Dict[str, Any]]:
    """
    Try configured backend(s) and return enriched detection dicts:
      {
        "class": str,
        "mapped_label": str,
        "confidence": float,
        "forensic_confidence": "HIGH|MEDIUM|LOW",
        "bbox": [x1,y1,x2,y2],
        "hallucinated": bool
      }
    """
    allowed = set(allowed_only) if allowed_only else set(_LABEL_MAP.keys())
    backend_choice = DETECTION_BACKEND
    model_path = os.getenv("DETECTION_MODEL", DEFAULT_DETECTION_MODEL)

    # 1) Try Groq compiled runtime if requested or auto
    if backend_choice in ("groq", "auto"):
        try:
            groq_dets = _run_detection_groq(rgb, model_path, conf_thresh)
            if groq_dets:
                enriched: List[Dict[str, Any]] = []
                h, w = rgb.shape[:2]
                for d in groq_dets:
                    cls_name = d.get("class", "unknown")
                    conf = float(d.get("conf", 0.0))
                    if conf < conf_thresh or cls_name not in allowed:
                        continue
                    x1, y1, x2, y2 = _ensure_int_box(d.get("bbox", [0, 0, 0, 0]))
                    patch = rgb[y1:y2, x1:x2] if y2 > y1 and x2 > x1 else None
                    texture = _local_texture_authenticity(patch)
                    combined = 0.6 * conf + 0.4 * texture
                    forensic = "HIGH" if combined > 0.75 else "MEDIUM" if combined > 0.55 else "LOW"
                    hallucinated = (conf > 0.6 and texture < 0.25)
                    enriched.append({
                        "class": cls_name,
                        "mapped_label": _LABEL_MAP.get(cls_name, cls_name),
                        "confidence": round(conf, 4),
                        "forensic_confidence": forensic,
                        "bbox": [x1, y1, x2, y2],
                        "hallucinated": hallucinated,
                    })
                if enriched:
                    # Optional LLM refine step (won't run unless GROQ_API_KEY & client wired)
                    return refine_with_groq_llm(enriched)
        except Exception as exc:
            logger.info("Groq backend not used: %s", exc)

    # 2) Fallback to Ultralytics (YOLO)
    try:
        from ultralytics import YOLO  # type: ignore
    except Exception as exc:
        logger.warning("ultralytics not available (%s); detection disabled.", exc)
        return []

    try:
        model = YOLO(model_path)
        results = model(rgb, verbose=False)
    except Exception as exc:
        logger.warning("Ultralytics model load/inference failed (%s).", exc)
        return []

    detections: List[Dict[str, Any]] = []
    h, w = rgb.shape[:2]
    for result in results:
        boxes = getattr(result, "boxes", None)
        if boxes is None:
            continue
        for box in boxes:
            try:
                conf = float(box.conf[0]) if hasattr(box.conf, "__len__") else float(box.conf)
                if conf < conf_thresh:
                    continue
                cls_id = int(box.cls[0]) if hasattr(box.cls, "__len__") else int(box.cls)
                cls_name = model.names.get(cls_id, str(cls_id)) if hasattr(model, "names") else str(cls_id)
                xyxy = box.xyxy[0] if hasattr(box.xyxy, "__len__") and len(box.xyxy) > 0 else None
                if xyxy is None:
                    continue
                x1, y1, x2, y2 = (int(round(float(v))) for v in xyxy)
                if cls_name not in allowed:
                    continue
                patch = rgb[y1:y2, x1:x2] if y2 > y1 and x2 > x1 else None
                texture_score = _local_texture_authenticity(patch)
                combined = 0.6 * conf + 0.4 * texture_score
                forensic = "HIGH" if combined > 0.75 else "MEDIUM" if combined > 0.55 else "LOW"
                hallucinated = (conf > 0.6 and texture_score < 0.25)
                detections.append({
                    "class": cls_name,
                    "mapped_label": _LABEL_MAP.get(cls_name, cls_name),
                    "confidence": round(conf, 4),
                    "forensic_confidence": forensic,
                    "bbox": [x1, y1, x2, y2],
                    "hallucinated": hallucinated,
                })
            except Exception as exc:
                logger.debug("Skipping a box due to error: %s", exc)
                continue

    # Optional LLM refinement (no-op unless you wire in GROQ LLM client)
    detections = refine_with_groq_llm(detections)

    # Sonar-guided hallucination placeholders when no vision detections
    if sonar_data and not detections:
        contours = sonar_data.get("contours", [])
        for c in contours:
            pts = []
            for nx, ny in c:
                px = int(np.clip(nx, 0.0, 1.0) * w)
                py = int(np.clip(ny, 0.0, 1.0) * h)
                pts.append([px, py])
            if len(pts) < 3:
                continue
            pts_np = np.array(pts, dtype=np.int32)
            x, y, ww, hh = cv2.boundingRect(pts_np)
            detections.append({
                "class": "sonar_contact",
                "mapped_label": "Sonar Contact (hallucinated)",
                "confidence": 0.0,
                "forensic_confidence": "LOW",
                "bbox": [int(x), int(y), int(x + ww), int(y + hh)],
                "hallucinated": True,
                "sonar_polygon": pts,
            })

    return detections


# -------------------- whisper-link / vector sketch --------------------------
def generate_vector_sketch(detections: List[Dict[str, Any]], max_bytes: int = 1024) -> str:
    sketch = {"detections": []}
    for d in detections:
        x1, y1, x2, y2 = d.get("bbox", [0, 0, 0, 0])
        w = max(1, x2 - x1)
        h = max(1, y2 - y1)
        cx = x1 + w / 2.0
        cy = y1 + h / 2.0
        sketch["detections"].append({
            "label": d.get("mapped_label", d.get("class")),
            "conf": float(d.get("confidence", 0.0)),
            "center": [float(cx), float(cy)],
            "size": [float(w), float(h)],
            "hallucinated": bool(d.get("hallucinated", False)),
        })
    raw = json.dumps(sketch, separators=(",", ":"), ensure_ascii=False).encode("utf-8")
    compressed = zlib.compress(raw, level=9)
    if len(compressed) > max_bytes:
        summary = {"summary": [{"label": x["label"], "conf": x["conf"]} for x in sketch["detections"]]}
        compressed = zlib.compress(json.dumps(summary, separators=(",", ":")).encode("utf-8"), level=9)
    return base64.b64encode(compressed).decode("utf-8")


# --------------------- sonar overlay / wireframe ---------------------------
def fuse_sonar_overlay(rgb: np.ndarray, sonar_data: Optional[Dict[str, Any]] = None) -> str:
    """
    Draw sonar overlay with radar rings and sweep wedge.
    sonar_data can contain:
      - angle: center angle in degrees (0 = right, 90 = up)
      - sweep: sweep half-width in degrees
      - max_range: radius for wedge (in px)
      - contours: list of normalized contour polygons
    """
    if rgb is None:
        raise ValueError("rgb image is required")

    # OpenCV drawing expects BGR. Convert, draw, then convert back.
    bgr = cv2.cvtColor(rgb, cv2.COLOR_RGB2BGR)
    h, w = bgr.shape[:2]
    center = (w // 2, h // 2)
    radius_limit = min(center)

    # draw concentric rings
    for r in range(50, max(60, radius_limit), 60):
        if r >= radius_limit:
            break
        cv2.circle(bgr, center, r, (0, 255, 0), 1)

    # parameters from sonar_data or defaults
    angle = float(sonar_data.get("angle", 0)) if sonar_data else 0.0
    sweep = float(sonar_data.get("sweep", 20)) if sonar_data else 20.0
    max_r = int(sonar_data.get("max_range", radius_limit * 0.9)) if sonar_data else int(radius_limit * 0.9)

    # make a translucent wedge for the sweep
    overlay = bgr.copy()
    start_angle = angle - sweep / 2.0
    end_angle = angle + sweep / 2.0

    # build polygon points (center + arc)
    points = [center]
    for ang in np.linspace(start_angle, end_angle, num=40):
        rad = np.deg2rad(ang)
        x = int(center[0] + max_r * np.cos(rad))
        y = int(center[1] - max_r * np.sin(rad))  # coordinate system: y down => subtract
        points.append((x, y))

    pts = np.array(points, dtype=np.int32)
    cv2.fillPoly(overlay, [pts], (0, 255, 0))
    fused = cv2.addWeighted(bgr, 1.0, overlay, 0.20, 0)

    # optional: draw a sweep outline
    cv2.polylines(fused, [pts], isClosed=False, color=(0, 255, 0), thickness=1)

    # Keep original contour logic also
    if sonar_data:
        contours = sonar_data.get("contours", [])
        for c in contours:
            pts_contour = []
            for nx, ny in c:
                px = int(np.clip(nx, 0.0, 1.0) * (w - 1))
                py = int(np.clip(ny, 0.0, 1.0) * (h - 1))
                pts_contour.append([px, py])

            if len(pts_contour) >= 2:
                pts_np = np.array(pts_contour, dtype=np.int32)
                cv2.polylines(fused, [pts_np], True, (0, 255, 255), 2)

    final_rgb = cv2.cvtColor(fused, cv2.COLOR_BGR2RGB)
    return _array_to_base64(final_rgb, fmt="PNG")


# --------------------------- SITREP helper ---------------------------------
# ===================== 🔥 NEW VISUAL FEATURES ==============================

def draw_detection_boxes(rgb: np.ndarray, detections: List[Dict[str, Any]]) -> str:
    """
    Draw bounding boxes on image (for frontend display)
    """
    img = rgb.copy()

    for det in detections:
        x1, y1, x2, y2 = det["bbox"]
        label = f"{det['mapped_label']} {int(det['confidence']*100)}%"

        # Box
        cv2.rectangle(img, (x1, y1), (x2, y2), (255, 50, 50), 2)

        # Text
        cv2.putText(
            img,
            label,
            (x1, y1 - 10),
            cv2.FONT_HERSHEY_SIMPLEX,
            0.5,
            (255, 50, 50),
            2
        )

    return _array_to_base64(img, fmt="JPEG")


def generate_bioluminescence(rgb: np.ndarray) -> str:
    """
    Create a bioluminescence effect:
      - stronger blurred glow (Gaussian)
      - cyan/teal tint blended on top
    """
    if rgb is None:
        raise ValueError("rgb image is required")

    # use an explicit odd kernel for blur (clear and reliable)
    glow = cv2.GaussianBlur(rgb, (21, 21), 0)

    # build a cyan/teal tint - in RGB format (not BGR)
    tint = np.zeros_like(rgb, dtype=np.uint8)
    tint[:, :, 0] = 100  # Blue channel (in RGB)
    tint[:, :, 1] = 160  # Green channel (in RGB)
    tint[:, :, 2] = 40   # Red channel (keep low for cyan/teal)

    # operate in float to avoid early clipping, then clip at the end
    base_f = rgb.astype(np.float32)
    glow_f = glow.astype(np.float32)
    tint_f = tint.astype(np.float32)

    # mix base + glow (glow should be visible but not wash out)
    combined = cv2.addWeighted(base_f, 0.7, glow_f, 0.4, 0.0)

    # add tint softly
    final_f = cv2.addWeighted(combined, 1.0, tint_f, 0.25, 0.0)

    final = np.clip(final_f, 0, 255).astype(np.uint8)
    return _array_to_base64(final, fmt="JPEG")

    
def detections_to_sitrep_txt(detections: List[Dict[str, Any]]) -> str:
    if not detections:
        return ("SITUATION: Sensor sweep complete – no contacts.\n"
                "ASSESSMENT: Area clear.\n"
                "RECOMMENDATION: Continue routine patrol.")
    labels = ", ".join({d["mapped_label"] for d in detections})
    count = len(detections)
    return (f"SITUATION: {count} contact(s) detected – {labels}.\n"
            "ASSESSMENT: Requires manual review (forensic confidence noted).\n"
            "RECOMMENDATION: Dispatch response team and maintain sensor lock.")


__all__ = [
    "enhance_image",
    "run_detection",
    "build_heatmap",
    "fuse_sonar_overlay",
    "generate_vector_sketch",
    "detections_to_sitrep_txt",
    "draw_detection_boxes",
    "generate_bioluminescence",
]