Spaces:

mlbench123
/

inspecTech_CV

Sleeping

App Files Files Community

mlbench123 commited on Apr 21

Commit

2a47873

verified ·

1 Parent(s): 19f9b44

Create app.py

Browse files

Files changed (1) hide show

app.py +922 -0

app.py ADDED Viewed

	@@ -0,0 +1,922 @@

+"""
+Amazon Trailer Inspector — app.py
+HuggingFace Spaces · FastAPI · Free vision LLMs
+REST API that accepts 6 labeled images and runs all 6 aspect inspections
+in parallel, returning a structured JSON inspection report.
+Endpoint: POST /inspect
+"""
+import base64
+import concurrent.futures
+import io
+import json
+import os
+import re
+import traceback
+from typing import Optional
+import uvicorn
+from fastapi import FastAPI, HTTPException
+from fastapi.middleware.cors import CORSMiddleware
+from fastapi.responses import JSONResponse
+from PIL import Image
+from huggingface_hub import InferenceClient
+from pydantic import BaseModel, Field
+# ──────────────────────────────────────────────────────────────────────────────
+# MODELS  (tried in order — first success wins per image)
+# ──────────────────────────────────────────────────────────────────────────────
+MODELS = [
+    # ── Tier 1: best vision quality ──────────────────────────────────────────
+    "google/gemma-4-27b-it",             # Primary — Gemma 4 27B (stable HF serverless name)
+    "meta-llama/Llama-4-Scout-17B-16E-Instruct",  # Llama 4 Scout — excellent vision, free HF
+    # ── Tier 2: dedicated vision models ──────────────────────────────────────
+    "Qwen/Qwen2.5-VL-7B-Instruct",      # Qwen 2.5 VL — strong free-tier vision
+    "Qwen/Qwen2-VL-7B-Instruct",        # Qwen 2 VL — previous gen, very stable
+    # ── Tier 3: additional fallbacks ─────────────────────────────────────────
+    "meta-llama/Llama-3.2-11B-Vision-Instruct",   # Llama 3.2 11B Vision — reliable fallback
+    "microsoft/Phi-3.5-vision-instruct", # Phi-3.5 Vision — lightweight, good accuracy
+    "HuggingFaceM4/idefics3-8b-llama3",  # IDEFICS3 — HF native, always available
+    "mistralai/Pixtral-12B-2409",        # Pixtral 12B — Mistral's vision model, free tier
+]
+# ──────────────────────────────────────────────────────────────────────────────
+# ASPECT PROMPTS
+# ──────────────────────────────────────────────────────────────────────────────
+PROMPTS = {
+"front": """You are a precise visual inspector for Amazon trailer fleets.
+════════════════════════════════════════════════════════
+STEP 1 — IMAGE VALIDATION (do this BEFORE anything else)
+════════════════════════════════════════════════════════
+Determine whether this is a valid FRONT LEFT or FRONT RIGHT image of an Amazon trailer.
+A VALID front-aspect image shows the trailer from the FRONT or FRONT-CORNER area:
+- The main subject is the SIDE PANEL of the trailer — the large blue/white body with branding
+- The image is shot from the FRONT HALF looking toward the rear, OR from the front corner
+- The rear dual-axle truck tires are NOT visible (or are tiny/distant in the far background)
+- Components like sensors, GPS, Prime logo, and the green Trailer ID label are the focus
+An INVALID image is one where:
+- The trailer's REAR DUAL-AXLE TRUCK TIRES are LARGE, PROMINENT, and CLEARLY VISIBLE
+- These are specifically: large inflated rubber truck tires on the REAR BOGIE AXLES,
+  appearing as 4 large grouped tires (2 axles × 2 tires each = 4 tires together)
+  at the REAR UNDERCARRIAGE of the trailer body
+- They appear in the foreground or mid-frame, bottom-center of the image, large in size
+- The shot is clearly taken from behind or the rear half of the trailer
+⚠️ CRITICAL — DO NOT CONFUSE THESE WITH REAR TIRES:
+  ❌ LANDING GEAR / SUPPORT LEGS: The retractable metal support struts/legs under the
+     front of the trailer when it is parked (not attached to a truck). These are METAL
+     POLES/STRUTS, not rubber tires. They hold up the front of a parked trailer.
+     → DO NOT flag landing gear as rear tires.
+  ❌ SINGLE FRONT STEER AXLE: If a truck cab is attached, its single front steering wheel
+     (one tire on each side, much smaller than rear bogie) is NOT the rear dual axle.
+     → DO NOT flag single front steer wheels as rear dual-axle tires.
+  ❌ TRAILER DOLLIES / SMALL WHEELS: Any small wheels used for maneuvering a parked
+     trailer are not the rear axle tires.
+POSITIVE IDENTIFICATION — only flag as INVALID if you see ALL of these:
+  ✔ Large inflated RUBBER TRUCK TIRES (clearly rubber, round, with tread)
+  ✔ DUAL AXLE configuration — two sets of large tires grouped together (4 tires total)
+  ✔ Located at the REAR of the trailer body / rear undercarriage
+  ✔ LARGE in the frame — prominent, not a tiny distant element
+DECISION:
+→ If rear dual-axle RUBBER TRUCK TIRES (4 grouped) are LARGE AND PROMINENT in frame:
+   Set image_valid = "missing", Set ALL other components to "missing"
+→ In ALL other cases (no tires, landing gear visible, single wheels, distant tires, etc.):
+   Set image_valid = "detected"
+   Proceed to STEP 2 below.
+════════════════════════════════════════════════════════
+STEP 2 — COMPONENT DETECTION (only if image_valid = "detected")
+════════════════════════════════════════════════════════
+This image shows the FRONT-LEFT or FRONT-RIGHT corner of an Amazon trailer — the rear corner
+area is visible from the side/front angle showing the side panels and rear corner post.
+Carefully locate all 4 components described below.
+────────────────────────────────────────────────────────
+COMPONENT 1 — SENSORS
+────────────────────────────────────────────────────────
+WHERE: On the REAR DOOR FACE or the lower area of the trailer near the rear corner.
+Look at the lower-middle or lower-left area of the rear panel visible in this image.
+WHAT: Exactly TWO metal plates shaped like DIAMONDS (rotated squares / rhombuses).
+- Each plate has diagonal cross-bracing visible on its face (an X pattern of raised ridges)
+- They are mounted SIDE BY SIDE, touching or close together
+- Color: beige, gold, tan, or silver-gray metallic
+- Size: roughly the size of a dinner plate each
+- They appear as a PAIR — two identical diamond shapes next to each other
+- May be on the rear face of the trailer or on the lower panel near the door area
+────────────────────────────────────────────────────────
+COMPONENT 2 — GPS_DEVICE
+────────────────────────────────────────────────────────
+⚠️ THIS IS THE MOST COMMONLY MISSED COMPONENT — READ CAREFULLY ⚠️
+WHERE: At the VERY TOP of the REAR CORNER POST. The corner post is the narrow vertical
+aluminum pillar/column at the rear corner of the trailer — where the SIDE WALL meets
+the rear face. Look at the TOP of this post, right at or just below the ROOF LINE.
+CRITICAL SEARCH STRATEGY — do this before answering:
+  1. First locate the GREEN TRAILER ID STRIP (component 4 — the lime-green vertical label)
+  2. Look DIRECTLY ABOVE that green strip, on the SAME vertical corner post
+  3. Search for a small white or light-gray rectangular box mounted there
+  4. Also check the VERY TOP CORNER where the corner post meets the roof rail
+WHAT IT LOOKS LIKE:
+  - A small white, off-white, or light gray rectangular electronic housing/box
+  - Roughly the size of a large book or small tablet (wider than tall, or square)
+  - Has a visible FRONT FACE — may show a small digital display, sensor window, or LED
+  - Mounted FLUSH to or BRACKETED onto the corner post or roof/top rail junction
+CONFIDENCE GUIDANCE: If you see ANY small rectangular box or housing at the top of the
+corner post, even if partially visible or unclear, mark "detected". Only mark "missing"
+if you can clearly confirm there is NO box/device at the top of the corner post.
+────────────────────────────────────────────────────────
+COMPONENT 3 — PRIME_LOGO
+────────────────────────────────────────────────────────
+WHERE: On the main side panels of the trailer body — the large blue (or white) surface.
+WHAT: Any Amazon Prime branding — ANY of the following counts:
+- The word "prime" in white letters on the trailer body
+- The word "amazon" with or without the arrow/smile logo
+- The Amazon arrow/smile swoosh logo alone (curved arrow shape)
+- Any partial visibility of the above — even one letter or partial arrow
+─────────────────────────────────��──────────────────────
+COMPONENT 4 — TRAILER_ID
+────────────────────────────────────────────────────────
+WHERE: On the REAR VERTICAL CORNER POST — the narrow vertical aluminum pillar/column
+at the rear corner of the trailer, where the side panel meets the rear face.
+WHAT: A fluorescent GREEN or LIME-GREEN vertical label strip affixed to this corner post.
+- The strip runs VERTICALLY down a section of the corner post
+- Displays an alphanumeric code running vertically: e.g. "SV2602705", "AZNG..."
+- The green background color is very distinctive — bright lime-green
+- Located roughly at mid-height to upper-middle of the corner post
+IMPORTANT: Even if only PART of the green strip is visible → still mark "detected".
+Reply ONLY with a single flat JSON object — no extra text, no markdown fences, no nested objects:
+{
+  "image_valid": "detected",
+  "sensors":     "missing",
+  "gps_device":  "missing",
+  "prime_logo":  "detected",
+  "trailer_id":  "detected"
+}
+Each value must be exactly "detected" or "missing". Nothing else.""",
+"rear": """You are a precise visual inspector for Amazon trailer fleets.
+════════════════════════════════════════════════════════
+STEP 1 — IMAGE VALIDATION: IS THIS A VALID REAR-SIDE VIEW?
+════════════════════════════════════════════════════════
+Your FIRST task is to determine whether this image shows the REAR HALF / REAR SIDE of an Amazon
+trailer. This is critical — FRONT-SIDE views of the trailer must be rejected.
+THE SINGLE MOST RELIABLE RULE — TIRE PROXIMITY TEST:
+Look at the BOTTOM of the image, near the side of the trailer CLOSEST TO THE CAMERA:
+REAR-SIDE IMAGE (VALID):
+  → The trailer's REAR DUAL-AXLE TIRES are on the NEAR SIDE — CLOSE to the camera,
+    appearing LARGE and PROMINENT in the lower portion of the image.
+  → "Rear dual axle" = a GROUP of 4 large rubber truck tires (2 axles × 2 tires each),
+    all packed together at the rear undercarriage.
+  → The trailer's REAR DOORS / REAR FACE is also visible in this view.
+FRONT-SIDE IMAGE (INVALID — must reject):
+  → The area CLOSEST TO THE CAMERA shows NO LARGE TIRES — only:
+      • Metal support legs / landing gear struts
+      • Open undercarriage with no dominant tire group visible on the near side
+  → The rear dual-axle tires, IF visible at all, appear SMALL and FAR AWAY.
+VALIDATION DECISION:
+Q1: Are large rubber truck tires (dual-axle group) visible CLOSE TO THE CAMERA?
+  → YES → image_valid = "detected" → proceed to STEP 2
+  → NO → image_valid = "missing", set ALL other components to "missing", STOP.
+════════════════════════════════════════════════════════
+STEP 2 — COMPONENT DETECTION (only if image_valid = "detected")
+════════════════════════════════════════════════════════
+════════════════════════════════════════════════════════
+COMPONENT 1 — SIDE SKIRT / FIN
+════════════════════════════════════════════════════════
+WHERE: Directly below the trailer body floor, along the BOTTOM SIDE of the trailer.
+Just below the horizontal red-and-white reflective tape stripe at the trailer bottom.
+WHAT: A flat, solid rectangular panel hanging vertically below the trailer chassis.
+- Fills the gap between the trailer floor underside and the ground level, beside the axles
+- May be dark gray, charcoal, black, silver, or metallic in color
+- IN SHADOW: look for its RECTANGULAR OUTLINE and STRAIGHT EDGES instead of color
+- Look for a SOLID FLAT SURFACE blocking the view through to the undercarriage
+════════════════════════════════════════════════════════
+COMPONENT 2 — EDGE KIT
+════════════════════════════════════════════════════════
+WHERE: On the SIDE SURFACE of the trailer body, near the REAR END.
+Located at roughly mid-to-upper height on the side panel, just before the rear corner.
+WHAT:
+- A BODY-COLORED rectangular panel — the SAME COLOR as the trailer body
+- Has VISIBLE BOLT HOLES or screw holes (several dots/holes visible in the panel)
+- Taller than it is wide — roughly portrait-orientation rectangle
+- Mounted flush against the trailer side near the rear-door corner post area
+════════════════════════════════════════════════════════
+SIDE IDENTIFICATION RULES
+════════════════════════════════════════════════════════
+- First identify: which side of the trailer is facing the camera?
+- LEFT SIDE view: rear doors visible on the LEFT; side extends RIGHT
+- RIGHT SIDE view: rear doors visible on the RIGHT; side extends LEFT
+- Only mark a side as "detected" if that side is ACTUALLY VISIBLE in this image
+- "left" and "right" are from the TRAILER'S own perspective (driver's point of view)
+Reply ONLY with a single flat JSON object — no extra text, no markdown fences, no nested objects:
+{
+  "image_valid":       "detected",
+  "side_skirts_left":  "missing",
+  "side_skirts_right": "detected",
+  "edge_kit_left":     "missing",
+  "edge_kit_right":    "detected"
+}
+Each value must be exactly "detected" or "missing". Nothing else.""",
+"inside": """You are a precise visual inspector for Amazon trailer fleets.
+Examine this image of an Amazon trailer interior.
+════════════════════════════════════════════════════════
+STEP 1 — DOOR STATUS CHECK (do this FIRST)
+════════════════════════════════════════════════════════
+DOORS ARE OPEN if you can see INTO the trailer cargo area:
+- A long dark tunnel/corridor extending into the trailer depth
+- Corrugated ribbed metal side walls running into the distance
+- A wooden or composite floor surface at the entrance threshold
+DOORS ARE CLOSED if the image shows flat door panel surfaces as the main subject.
+If doors are CLOSED → set BOTH components to "missing"
+If doors are OPEN → proceed to STEP 2.
+════════════════════════════════════════════════════════
+STEP 2 — COMPONENT DETECTION (only if doors are OPEN)
+════════════════════════════════════════════════════════
+COMPONENT 1 — SIDE_GUARDS
+WHERE: Along the LEFT and RIGHT interior side walls of the trailer cargo area.
+WHAT: Corrugated or ribbed protective panels lining the inside walls — typically silver/gray
+metal with horizontal or diagonal ribbing/corrugation. They run from near the floor upward
+along both interior side walls. Mark "detected" if visible on at least one side wall.
+COMPONENT 2 — FLOORING
+WHERE: At the BOTTOM of the trailer interior opening — the floor surface at the entrance.
+WHAT: Wooden plank flooring — individual wooden planks running parallel lengthwise.
+- Color: brown, amber, tan, or light brown wood tone
+- The planks span the full width of the trailer floor
+- ONLY mark "detected" if you can clearly see the brown wooden plank surface INSIDE the trailer
+- Do NOT count asphalt/concrete ground outside the trailer
+Reply ONLY with a single flat JSON object — no extra text, no markdown fences, no nested objects:
+{
+  "side_guards": "detected",
+  "flooring":    "missing"
+}
+Each value must be exactly "detected" or "missing". Nothing else.""",
+"door": """You are a precise visual inspector for Amazon trailer fleets.
+════════════════════════════════════════════════════════
+STEP 1 — IMAGE VALIDATION (do this BEFORE anything else)
+════════════════════════════════════════════════════════
+A VALID door-details image has ALL of the following:
+  ✔ The REAR SWING DOORS of the trailer are the main subject — both door panels visible face-on
+  ✔ The doors are CLOSED (flat white/gray/metal door panels visible — NOT an open interior view)
+  ✔ The BOTTOM of the door frame is visible
+  ✔ The image is taken straight-on or slightly angled from the REAR of the trailer
+An INVALID image:
+  - A FRONT or SIDE view of the trailer
+  - Doors are OPEN
+  - Not showing the rear swing door panels as the main subject
+  - Bottom of door frame is cut off
+DECISION:
+→ If NOT a valid door-details image:
+   Set image_valid = "missing", Set BOTH other components to "missing"
+→ If IS a valid closed rear-door image:
+   Set image_valid = "detected", Proceed to STEP 2.
+════════════════════════════════════════════════════════
+STEP 2 — COMPONENT DETECTION (only if image_valid = "detected")
+════════════════════════════════════════════════════════
+COMPONENT 1 — LATCH_KIT_LASH_LINKS
+Door securing hardware — ANY of the following:
+  a) LATCH KIT: Metal door latching/locking mechanism — horizontal latch bars, vertical locking
+     rods, T-handles, cam locks, keeper plates, door handle assemblies, lock rod brackets,
+     or any hardware that keeps the door closed.
+  b) LASH LINKS: Metal chain links, D-rings, anchor hooks, or tie-down rings on door/inner frame.
+Mark "detected" if ANY latch hardware OR lash link hardware is visible.
+COMPONENT 2 — GROTE_LED_LIGHTS
+LED light fixtures at the bottom of the door frame:
+  - Look specifically at the BOTTOM CORNERS of the rear door frame / underside of the trailer
+  - Grote lights appear as rectangular or square metal housing boxes (silver, black, or chrome)
+    with LED lenses inside — typically red but may be white or amber
+  - They are mounted at the lower edge of the door frame, one on each bottom corner
+  - Even if only one side is visible, mark "detected"
+  - Do NOT count reflective tape or passive reflectors — only active LED light fixtures
+Reply ONLY with a single flat JSON object — no extra text, no markdown fences, no nested objects:
+{
+  "image_valid":          "detected",
+  "latch_kit_lash_links": "detected",
+  "grote_led_lights":     "missing"
+}
+Each value must be exactly "detected" or "missing". Nothing else."""
+}
+# ──────────────────────────────────────────────────────────────────────────────
+# ASPECT METADATA
+# ──────────────────────────────────────────────────────────────────────────────
+ASPECT_KEYS = {
+    "front":  ["image_valid", "sensors", "gps_device", "prime_logo", "trailer_id"],
+    "rear":   ["image_valid", "side_skirts_left", "side_skirts_right", "edge_kit_left", "edge_kit_right"],
+    "inside": ["side_guards", "flooring"],
+    "door":   ["image_valid", "latch_kit_lash_links", "grote_led_lights"],
+}
+CONF_RANK = {"high": 3, "medium": 2, "low": 1, "": 0}
+# Valid label names accepted by the API
+VALID_LABELS = {"front_right", "front_left", "rear_right", "rear_left", "inside", "door"}
+# Map each label to its inspection aspect
+LABEL_TO_ASPECT = {
+    "front_right": "front",
+    "front_left":  "front",
+    "rear_right":  "rear",
+    "rear_left":   "rear",
+    "inside":      "inside",
+    "door":        "door",
+}
+# ──────────────────────────────────────────────────────────────────────────────
+# HF CLIENT
+# ──────────────────────────────────────────────────────────────────────────────
+_hf_client: InferenceClient | None = None
+def _get_client(token: str) -> InferenceClient:
+    global _hf_client
+    if _hf_client is None:
+        _hf_client = InferenceClient(provider="auto", api_key=token)
+    return _hf_client
+# ──────────────────────────────────────────────────────────────────────────────
+# IMAGE HELPERS
+# ──────────────────────────────────────────────────────────────────────────────
+def pil_to_b64(img: Image.Image, max_side: int = 1024) -> str:
+    img = img.copy().convert("RGB")
+    if max(img.size) > max_side:
+        img.thumbnail((max_side, max_side), Image.LANCZOS)
+    buf = io.BytesIO()
+    img.save(buf, format="JPEG", quality=82)
+    return base64.b64encode(buf.getvalue()).decode("utf-8")
+def decode_b64_image(b64_str: str) -> Image.Image:
+    """Decode a base64 string (with or without data-URI prefix) to a PIL Image."""
+    if "," in b64_str:
+        b64_str = b64_str.split(",", 1)[1]
+    raw = base64.b64decode(b64_str)
+    return Image.open(io.BytesIO(raw)).convert("RGB")
+# ──────────────────────────────────────────────────────────────────────────────
+# JSON EXTRACTION
+# ───────────────────────────────────────────────��──────────────────────────────
+def extract_json(text: str, keys: list) -> dict | None:
+    if not text:
+        return None
+    text = re.sub(r"<think>[\s\S]*?</think>", "", text, flags=re.IGNORECASE)
+    text = re.sub(r"```(?:json)?", "", text, flags=re.IGNORECASE).replace("```", "")
+    brace = text.find("{")
+    if brace > 0:
+        text = text[brace:]
+    text = text.strip()
+    m = re.search(r"\{[\s\S]*\}", text)
+    if not m:
+        return None
+    raw = m.group()
+    try:
+        return json.loads(raw)
+    except json.JSONDecodeError:
+        pass
+    fixed = re.sub(r",\s*([}\]])", r"\1", raw)
+    try:
+        return json.loads(fixed)
+    except json.JSONDecodeError:
+        pass
+    try:
+        rebuilt = {}
+        for key in keys:
+            m_str = re.search(rf'"{key}"\s*:\s*"([^"]+)"', raw)
+            if m_str:
+                rebuilt[key] = m_str.group(1)
+                continue
+            m_obj = re.search(rf'"{key}"\s*:\s*(\{{[^}}]+\}})', raw, re.DOTALL)
+            if m_obj:
+                try:
+                    rebuilt[key] = json.loads(m_obj.group(1))
+                except Exception:
+                    pass
+        if rebuilt:
+            return rebuilt
+    except Exception:
+        pass
+    return None
+def validate_result(data: dict, keys: list) -> dict | None:
+    if not data:
+        return None
+    out = {}
+    for key in keys:
+        item = data.get(key)
+        if item is None:
+            return None
+        if isinstance(item, str):
+            found = item.strip().lower() == "detected"
+        elif isinstance(item, dict):
+            found = item.get("found", False)
+            if isinstance(found, str):
+                found = found.lower() in ("true", "yes", "1")
+            found = bool(found)
+        else:
+            return None
+        out[key] = {"found": found, "confidence": "high", "notes": ""}
+    return out
+# ──────────────────────────────────────────────────────────────────────────────
+# PER-IMAGE ANALYSIS
+# ──────────────────────────────────────────────────────────────────────────────
+def analyze_one(img: Image.Image, aspect: str, token: str) -> tuple:
+    """
+    Try MODELS in order for a single image.
+    Returns (result_dict, model_short_name) on success,
+            (None, joined_error_string)      on total failure.
+    """
+    b64    = pil_to_b64(img)
+    keys   = ASPECT_KEYS[aspect]
+    prompt = PROMPTS[aspect]
+    errors = []
+    for model in MODELS:
+        short = model.split("/")[-1]
+        try:
+            client = _get_client(token)
+            resp = client.chat_completion(
+                model=model,
+                messages=[
+                    {
+                        "role": "system",
+                        "content": (
+                            "You are a JSON-only API for trailer inspection. "
+                            "You MUST respond with a single valid flat JSON object and absolutely "
+                            "nothing else — no explanation, no preamble, no markdown fences, "
+                            "no reasoning text, no nested objects. "
+                            "Every value must be exactly the string \"detected\" or \"missing\". "
+                            "Start your response with '{' and end with '}'."
+                        ),
+                    },
+                    {
+                        "role": "user",
+                        "content": [
+                            {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{b64}"}},
+                            {"type": "text", "text": prompt},
+                        ],
+                    },
+                ],
+                max_tokens=120,
+                temperature=0.05,
+            )
+            raw_content = resp.choices[0].message.content
+            print(f"[{short}][{aspect}] raw: {raw_content[:300]}")
+            data   = extract_json(raw_content, keys)
+            result = validate_result(data, keys)
+            if result is not None:
+                return result, short
+            errors.append(f"{short}: JSON parse failed. Raw: {raw_content[:150]}")
+        except Exception as e:
+            err = str(e)
+            if "401" in err or "403" in err:
+                errors.append(f"{short}: auth error — check HF_TOKEN ({err[:100]})")
+            elif "404" in err:
+                errors.append(f"{short}: 404 — model unavailable ({err[:100]})")
+            elif "429" in err:
+                errors.append(f"{short}: rate limited — retrying next model")
+            elif "503" in err or "502" in err:
+                errors.append(f"{short}: model loading — retrying next model")
+            else:
+                errors.append(f"{short}: {err[:180]}")
+    return None, " | ".join(errors)
+def merge_results(results: list, aspect: str) -> dict:
+    """OR-merge multiple image results: if any image detected it, it's found."""
+    keys   = ASPECT_KEYS[aspect]
+    merged = {k: {"found": False, "confidence": "low", "notes": ""} for k in keys}
+    for res in results:
+        if not res:
+            continue
+        for k in keys:
+            src = res.get(k, {})
+            if src.get("found"):
+                merged[k]["found"] = True
+                if CONF_RANK.get(src.get("confidence", ""), 0) > CONF_RANK.get(merged[k]["confidence"], 0):
+                    merged[k]["confidence"] = src["confidence"]
+    return merged
+# ──────────────────────────────────────────────────────────────────────────────
+# REPORT BUILDERS
+# ──────────────────────────────────────────────────────────────────────────────
+def build_front_report(merged_left: dict | None, merged_right: dict | None) -> dict:
+    """
+    Combine front_left and front_right results.
+    For image_valid: if either side's image is invalid, note it.
+    For components: detected if found in EITHER side (OR logic).
+    """
+    components = {}
+    comp_keys = ["sensors", "gps_device", "prime_logo", "trailer_id"]
+    comp_names = {
+        "sensors":    "Sensors",
+        "gps_device": "GPS Device",
+        "prime_logo": "Prime Logo",
+        "trailer_id": "Trailer ID Label",
+    }
+    for key in comp_keys:
+        left_found  = merged_left.get(key, {}).get("found", False)  if merged_left  else False
+        right_found = merged_right.get(key, {}).get("found", False) if merged_right else False
+        detected    = left_found or right_found
+        components[comp_names[key]] = "detected" if detected else "missing"
+    # Image validity notes
+    notes = []
+    if merged_left is None:
+        notes.append("front_left: image missing from input")
+    elif not merged_left.get("image_valid", {}).get("found", True):
+        notes.append("front_left: invalid image (wrong angle)")
+    if merged_right is None:
+        notes.append("front_right: image missing from input")
+    elif not merged_right.get("image_valid", {}).get("found", True):
+        notes.append("front_right: invalid image (wrong angle)")
+    return {"components": components, "notes": notes}
+def build_rear_report(merged_left: dict | None, merged_right: dict | None) -> dict:
+    """
+    Combine rear_left and rear_right results.
+    Each component shows X/2 detection count.
+    Both sides MUST be independently detected for full confirmation.
+    """
+    components = {}
+    notes = []
+    # Check image validity
+    left_valid  = merged_left  is not None and merged_left.get("image_valid",  {}).get("found", True)
+    right_valid = merged_right is not None and merged_right.get("image_valid", {}).get("found", True)
+    if merged_left is None:
+        notes.append("rear_left: image missing from input")
+    elif not left_valid:
+        notes.append("rear_left: invalid image (wrong angle/side)")
+    if merged_right is None:
+        notes.append("rear_right: image missing from input")
+    elif not right_valid:
+        notes.append("rear_right: invalid image (wrong angle/side)")
+    comp_pairs = [
+        ("side_skirts_left", "side_skirts_right", "Side Skirts / Fins"),
+        ("edge_kit_left",    "edge_kit_right",    "Edge Kit"),
+    ]
+    for left_key, right_key, display_name in comp_pairs:
+        left_found  = merged_left.get(left_key,  {}).get("found", False) if merged_left  else False
+        right_found = merged_right.get(right_key, {}).get("found", False) if merged_right else False
+        count = int(left_found) + int(right_found)
+        status = f"{count}/2"
+        if count == 2:
+            result = "detected"
+        elif count == 1:
+            side   = "left side" if left_found else "right side"
+            result = f"partially detected ({side} only)"
+        else:
+            result = "missing"
+        components[display_name] = {
+            "status": result,
+            "count":  status,
+        }
+    return {"components": components, "notes": notes}
+def build_inside_report(merged: dict | None) -> dict:
+    if merged is None:
+        return {
+            "components": {
+                "Side Guards": "missing",
+                "Flooring":    "missing",
+            },
+            "notes": ["inside: image missing from input"],
+        }
+    return {
+        "components": {
+            "Side Guards": "detected" if merged.get("side_guards", {}).get("found") else "missing",
+            "Flooring":    "detected" if merged.get("flooring",    {}).get("found") else "missing",
+        },
+        "notes": [],
+    }
+def build_door_report(merged: dict | None) -> dict:
+    if merged is None:
+        return {
+            "components": {
+                "Latch Kit & Lash Links": "missing",
+                "Grote LED Lights":       "missing",
+            },
+            "notes": ["door: image missing from input"],
+        }
+    notes = []
+    if not merged.get("image_valid", {}).get("found", True):
+        notes.append("door: invalid image (not a valid rear door view)")
+    return {
+        "components": {
+            "Latch Kit & Lash Links": "detected" if merged.get("latch_kit_lash_links", {}).get("found") else "missing",
+            "Grote LED Lights":       "detected" if merged.get("grote_led_lights",     {}).get("found") else "missing",
+        },
+        "notes": notes,
+    }
+# ──────────────────────────────────────────────────────────────────────────────
+# FASTAPI APP
+# ──────────────────────────────────────────────────────────────────────────────
+app = FastAPI(
+    title="Amazon Trailer Inspector API",
+    description=(
+        "AI-powered trailer inspection API. "
+        "Submit up to 6 labeled images (front_right, front_left, rear_right, rear_left, inside, door) "
+        "and receive a structured component detection report."
+    ),
+    version="2.0.0",
+)
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# ── Pydantic models ─────────────────────────────────────────────────────────
+class ImageInput(BaseModel):
+    label: str = Field(
+        ...,
+        description="One of: front_right, front_left, rear_right, rear_left, inside, door",
+        example="front_left",
+    )
+    image_base64: str = Field(
+        ...,
+        description=(
+            "Base64-encoded image. Can be raw base64 or a data URI "
+            "(e.g. 'data:image/jpeg;base64,...'). "
+            "Supported formats: JPEG, PNG, WEBP."
+        ),
+    )
+class InspectRequest(BaseModel):
+    images: list[ImageInput] = Field(
+        ...,
+        min_length=1,
+        max_length=6,
+        description="List of labeled images. Each label may appear at most once.",
+        example=[
+            {"label": "front_left",  "image_base64": "<base64>"},
+            {"label": "front_right", "image_base64": "<base64>"},
+            {"label": "rear_left",   "image_base64": "<base64>"},
+            {"label": "rear_right",  "image_base64": "<base64>"},
+            {"label": "inside",      "image_base64": "<base64>"},
+            {"label": "door",        "image_base64": "<base64>"},
+        ],
+    )
+# ── Routes ──────────────────────────────────────────────────────────────────
+@app.get("/", tags=["Health"])
+def root():
+    return {
+        "status": "ok",
+        "service": "Amazon Trailer Inspector API",
+        "version": "2.0.0",
+        "endpoint": "POST /inspect",
+    }
+@app.get("/health", tags=["Health"])
+def health():
+    token = os.environ.get("HF_TOKEN", "").strip()
+    return {
+        "status": "ok",
+        "hf_token_set": bool(token),
+        "models": [m.split("/")[-1] for m in MODELS],
+    }
+@app.post("/inspect", tags=["Inspection"])
+def inspect(request: InspectRequest):
+    """
+    Run full trailer inspection on all submitted images in parallel.
+    **Input:** Up to 6 labeled base64 images.
+    **Output:** Per-label report with component detection results.
+    Labels accepted: `front_right`, `front_left`, `rear_right`, `rear_left`, `inside`, `door`
+    """
+    token = os.environ.get("HF_TOKEN", "").strip()
+    if not token:
+        raise HTTPException(
+            status_code=503,
+            detail=(
+                "HF_TOKEN not configured. "
+                "Set it in Space Settings → Repository Secrets."
+            ),
+        )
+    # Validate labels and deduplicate
+    seen_labels = {}
+    for item in request.images:
+        if item.label not in VALID_LABELS:
+            raise HTTPException(
+                status_code=422,
+                detail=f"Invalid label '{item.label}'. Must be one of: {sorted(VALID_LABELS)}",
+            )
+        if item.label in seen_labels:
+            raise HTTPException(
+                status_code=422,
+                detail=f"Duplicate label '{item.label}'. Each label may only appear once.",
+            )
+        seen_labels[item.label] = item.image_base64
+    # Decode all images
+    decoded: dict[str, Image.Image] = {}
+    for label, b64 in seen_labels.items():
+        try:
+            decoded[label] = decode_b64_image(b64)
+        except Exception as e:
+            raise HTTPException(
+                status_code=422,
+                detail=f"Could not decode image for label '{label}': {e}",
+            )
+    # ── Run all label analyses in parallel ──────────────────────────────────
+    # Each label → its aspect → analyze_one(img, aspect, token)
+    # front_left and front_right each run independently with the "front" prompt
+    # rear_left and rear_right each run independently with the "rear" prompt
+    # Results for front and rear are then merged across their respective sides
+    label_results: dict[str, dict | None] = {}
+    def run_label(label: str) -> tuple[str, dict | None]:
+        aspect = LABEL_TO_ASPECT[label]
+        img    = decoded[label]
+        # analyze_one returns (result_dict, model_name_or_error)
+        result, meta = analyze_one(img, aspect, token)
+        if result is not None:
+            print(f"[API] {label} → success via {meta}")
+            return label, result
+        else:
+            print(f"[API] {label} → all models failed: {meta}")
+            return label, None
+    with concurrent.futures.ThreadPoolExecutor(max_workers=6) as pool:
+        futures = {pool.submit(run_label, label): label for label in decoded}
+        for fut in concurrent.futures.as_completed(futures):
+            label, result = fut.result()
+            label_results[label] = result
+    # ── Build the final report ───────────────────────────────────────────────
+    # FRONT: merge left + right with OR logic
+    front_left_raw  = label_results.get("front_left")
+    front_right_raw = label_results.get("front_right")
+    front_report = None
+    if "front_left" in decoded or "front_right" in decoded:
+        front_report = build_front_report(front_left_raw, front_right_raw)
+    # REAR: left and right reported with X/2 count logic
+    rear_left_raw  = label_results.get("rear_left")
+    rear_right_raw = label_results.get("rear_right")
+    rear_report = None
+    if "rear_left" in decoded or "rear_right" in decoded:
+        rear_report = build_rear_report(rear_left_raw, rear_right_raw)
+    # INSIDE
+    inside_report = None
+    if "inside" in decoded:
+        inside_report = build_inside_report(label_results.get("inside"))
+    # DOOR
+    door_report = None
+    if "door" in decoded:
+        door_report = build_door_report(label_results.get("door"))
+    # ── Assemble response ────────────────────────────────────────────────────
+    report = {}
+    if front_report is not None:
+        report["front"] = {
+            "label":      "Front Left / Right",
+            "images_provided": [l for l in ("front_left", "front_right") if l in decoded],
+            "components": front_report["components"],
+            "notes":      front_report["notes"],
+        }
+    if rear_report is not None:
+        report["rear"] = {
+            "label":      "Rear Left / Right",
+            "images_provided": [l for l in ("rear_left", "rear_right") if l in decoded],
+            "components": rear_report["components"],
+            "notes":      rear_report["notes"],
+        }
+    if inside_report is not None:
+        report["inside"] = {
+            "label":      "Inside Trailer",
+            "images_provided": ["inside"],
+            "components": inside_report["components"],
+            "notes":      inside_report["notes"],
+        }
+    if door_report is not None:
+        report["door"] = {
+            "label":      "Door Details",
+            "images_provided": ["door"],
+            "components": door_report["components"],
+            "notes":      door_report["notes"],
+        }
+    # Note any labels that were not submitted
+    missing_labels = sorted(VALID_LABELS - set(decoded.keys()))
+    return JSONResponse(content={
+        "status":         "success",
+        "images_received": list(decoded.keys()),
+        "labels_missing":  missing_labels,
+        "report":          report,
+    })
+# ──────────────────────────────────────────────────────────────────────────────
+# STARTUP
+# ──────────────────────────────────────────────────────────────────────────────
+_tok = os.environ.get("HF_TOKEN", "")
+print("=" * 60)
+print("  Amazon Trailer Inspector — API mode")
+print(f"  HF_TOKEN : {'SET (' + str(len(_tok)) + ' chars)' if _tok else 'NOT SET ⚠️'}")
+print(f"  Models   : {[m.split('/')[-1] for m in MODELS]}")
+print("=" * 60)
+if __name__ == "__main__":
+    uvicorn.run("app:app", host="0.0.0.0", port=7860, reload=False)