Spaces:

lyimo
/

Car_Counting

Sleeping

App Files Community

lyimo committed on May 18

Commit

35e66da

verified ·

1 Parent(s): 7176850

Update app.py

Browse files

Files changed (1) hide show

app.py +777 -406

app.py CHANGED Viewed

@@ -1,13 +1,14 @@
 """
-Bridge Traffic & Load Demo App
-Fast RF-DETR + ByteTrack vehicle counting for bridge videos.
 """
 import os
 import time
 import tempfile
 from functools import lru_cache
-from typing import Dict, List, Tuple
 import cv2
 import gradio as gr
@@ -19,42 +20,65 @@ import pandas as pd
 import supervision as sv
 import torch
-from rfdetr import RFDETRNano, RFDETRMedium
 # ---------------------------------------------------------------------
-# Vehicle classes from COCO
 # ---------------------------------------------------------------------
-# COCO IDs used by RF-DETR:
-# 2 = car, 3 = motorcycle, 5 = bus, 7 = truck
-VEHICLE_CLASSES: Dict[int, str] = {
-    2: "car",
-    3: "motorcycle",
-    5: "bus",
-    7: "truck",
-}
-# Very rough demonstration weights in kg.
-# Adjust these for your local traffic profile.
-DEFAULT_WEIGHTS_KG: Dict[int, int] = {
-    2: 1500,    # car / small vehicle
-    3: 250,     # motorcycle
-    5: 12000,   # bus
-    7: 18000,   # truck / lorry
-}
-CLASS_COLORS_BGR: Dict[int, Tuple[int, int, int]] = {
-    2: (40, 190, 120),    # car
-    3: (255, 170, 70),    # motorcycle
-    5: (245, 120, 45),    # bus
-    7: (220, 70, 180),    # truck
-}
-MODEL_OPTIONS = {
-    "Nano - fastest": RFDETRNano,
-    "Medium - more accurate, slower": RFDETRMedium,
-}
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
 try:
@@ -63,91 +87,281 @@ except Exception:
     pass
 if DEVICE == "cuda":
-    torch.backends.cudnn.benchmark = True
 # ---------------------------------------------------------------------
 # Model loading
 # ---------------------------------------------------------------------
-@lru_cache(maxsize=2)
-def load_model(model_name: str):
-    """Load RF-DETR once and reuse it across runs."""
-    model_cls = MODEL_OPTIONS[model_name]
-    print(f"Loading {model_name} on {DEVICE}...")
     try:
-        model = model_cls(device=DEVICE)
     except TypeError:
-        # Fallback for older RF-DETR builds
-        model = model_cls()
-    if DEVICE == "cuda":
-        try:
-            model.optimize_for_inference()
-            print("RF-DETR optimized for inference.")
-        except Exception as exc:
-            print(f"optimize_for_inference skipped: {exc}")
-    print("Model ready.")
     return model
 # ---------------------------------------------------------------------
-# Detection helper
 # ---------------------------------------------------------------------
-def predict_vehicles(
     model,
     frame_bgr: np.ndarray,
     confidence: float,
     inference_width: int,
-) -> sv.Detections:
     """
-    Resize frame before inference for speed, then scale boxes back to
-    original video coordinates.
     """
     h, w = frame_bgr.shape[:2]
-    inference_width = int(inference_width)
     if inference_width > 0 and w > inference_width:
-        scale = inference_width / float(w)
-        resized_w = inference_width
-        resized_h = int(h * scale)
-        model_frame = cv2.resize(frame_bgr, (resized_w, resized_h), interpolation=cv2.INTER_AREA)
     else:
         scale = 1.0
-        model_frame = frame_bgr
-    frame_rgb = cv2.cvtColor(model_frame, cv2.COLOR_BGR2RGB)
     with torch.inference_mode():
-        detections = model.predict(frame_rgb, threshold=float(confidence))
     if len(detections) == 0:
-        return detections
-    # Keep only vehicle classes.
-    mask = np.isin(detections.class_id, list(VEHICLE_CLASSES.keys()))
-    detections = detections[mask]
-    if len(detections) == 0:
-        return detections
-    # Scale boxes back to original frame size.
-    if scale != 1.0:
         detections.xyxy = detections.xyxy / scale
-    return detections
 # ---------------------------------------------------------------------
-# Counting and load helpers
 # ---------------------------------------------------------------------
-def side_of_line(y: float, line_y: int, dead_zone_px: int = 4) -> int:
-    """
-    Returns -1 above the line, +1 below the line, 0 inside a small dead zone.
-    The dead zone prevents jitter around the line from causing false crossings.
-    """
     diff = y - line_y
     if abs(diff) <= dead_zone_px:
         return 0
@@ -158,47 +372,181 @@ def detection_centres(detections: sv.Detections) -> np.ndarray:
     if len(detections) == 0:
         return np.empty((0, 2), dtype=float)
     xyxy = detections.xyxy
-    cx = (xyxy[:, 0] + xyxy[:, 2]) / 2.0
-    cy = (xyxy[:, 1] + xyxy[:, 3]) / 2.0
-    return np.column_stack([cx, cy])
-def get_class_weight_kg(class_id: int, weights: Dict[int, int]) -> int:
-    return int(weights.get(int(class_id), 0))
-def draw_header_panel(
-    frame: np.ndarray,
     total_count: int,
     cumulative_kg: float,
     live_load_kg: float,
     load_index_percent: float,
-    fps_text: str,
-) -> np.ndarray:
-    """Draw a clean dashboard panel at the top-left of the frame."""
-    overlay = frame.copy()
-    x1, y1, x2, y2 = 18, 18, 520, 158
-    cv2.rectangle(overlay, (x1, y1), (x2, y2), (20, 24, 36), -1)
-    frame = cv2.addWeighted(overlay, 0.82, frame, 0.18, 0)
-    cv2.putText(frame, "BRIDGE TRAFFIC LOAD DEMO", (34, 46),
-                cv2.FONT_HERSHEY_SIMPLEX, 0.72, (255, 255, 255), 2, cv2.LINE_AA)
-    cv2.putText(frame, f"Vehicles crossed: {total_count}", (34, 78),
-                cv2.FONT_HERSHEY_SIMPLEX, 0.62, (230, 240, 255), 2, cv2.LINE_AA)
-    cv2.putText(frame, f"Cumulative estimated mass: {cumulative_kg / 1000.0:.1f} tonnes", (34, 106),
-                cv2.FONT_HERSHEY_SIMPLEX, 0.58, (220, 240, 230), 2, cv2.LINE_AA)
-    cv2.putText(frame, f"Live load: {live_load_kg / 1000.0:.1f} t | Load index: {load_index_percent:.1f}% | {fps_text}", (34, 134),
-                cv2.FONT_HERSHEY_SIMPLEX, 0.52, (230, 230, 255), 1, cv2.LINE_AA)
     return frame
 def annotate_frame(
     frame: np.ndarray,
     detections: sv.Detections,
     line_y: int,
     roi_top_y: int,
     roi_bottom_y: int,
@@ -207,22 +555,30 @@ def annotate_frame(
     cumulative_kg: float,
     live_load_kg: float,
     load_index_percent: float,
-    fps_text: str,
 ) -> np.ndarray:
-    """Draw ROI, counting line, boxes, labels and dashboard."""
     h, w = frame.shape[:2]
-    # Bridge deck ROI overlay
     overlay = frame.copy()
-    cv2.rectangle(overlay, (0, roi_top_y), (w, roi_bottom_y), (80, 80, 80), -1)
     frame = cv2.addWeighted(overlay, 0.08, frame, 0.92, 0)
-    # Counting line
     cv2.line(frame, (0, line_y), (w, line_y), (40, 230, 255), 3)
-    cv2.putText(frame, "COUNTING LINE", (24, max(28, line_y - 12)),
-                cv2.FONT_HERSHEY_SIMPLEX, 0.58, (40, 230, 255), 2, cv2.LINE_AA)
-    # ROI borders
     cv2.line(frame, (0, roi_top_y), (w, roi_top_y), (170, 170, 170), 1)
     cv2.line(frame, (0, roi_bottom_y), (w, roi_bottom_y), (170, 170, 170), 1)
@@ -235,180 +591,100 @@ def annotate_frame(
         if confidences is None:
             confidences = [0.0] * len(detections)
-        for xyxy, class_id, conf, track_id in zip(
-            detections.xyxy,
-            detections.class_id,
-            confidences,
-            tracker_ids,
-        ):
-            class_id = int(class_id)
             x1, y1, x2, y2 = map(int, xyxy)
-            name = VEHICLE_CLASSES.get(class_id, "vehicle")
-            color = CLASS_COLORS_BGR.get(class_id, (80, 220, 255))
-            weight_t = DEFAULT_WEIGHTS_KG.get(class_id, 0) / 1000.0
             cv2.rectangle(frame, (x1, y1), (x2, y2), color, 2)
-            id_text = f"#{int(track_id)} " if track_id is not None and int(track_id) >= 0 else ""
-            label = f"{id_text}{name} {float(conf):.2f} ~{weight_t:.1f}t"
             (tw, th), base = cv2.getTextSize(label, cv2.FONT_HERSHEY_SIMPLEX, 0.52, 1)
             label_y1 = max(0, y1 - th - base - 8)
             cv2.rectangle(frame, (x1, label_y1), (x1 + tw + 10, y1), color, -1)
-            cv2.putText(frame, label, (x1 + 5, y1 - 6),
-                        cv2.FONT_HERSHEY_SIMPLEX, 0.52, (255, 255, 255), 1, cv2.LINE_AA)
-    frame = draw_header_panel(
         frame=frame,
         total_count=total_count,
         cumulative_kg=cumulative_kg,
         live_load_kg=live_load_kg,
         load_index_percent=load_index_percent,
-        fps_text=fps_text,
     )
-    # Compact class counts at bottom
-    items = [f"{k}: {v}" for k, v in class_counts.items() if v > 0]
-    count_text = " | ".join(items) if items else "No crossings yet"
-    cv2.putText(frame, count_text, (22, h - 24),
-                cv2.FONT_HERSHEY_SIMPLEX, 0.62, (255, 255, 255), 2, cv2.LINE_AA)
-    return frame
-def build_metrics_html(
-    total_count: int,
-    class_counts: Dict[str, int],
-    cumulative_kg: float,
-    live_load_kg: float,
-    load_index_percent: float,
-    frame_idx: int,
-    total_frames: int,
-    elapsed: float,
-    device: str,
-) -> str:
-    pct = (frame_idx / total_frames * 100.0) if total_frames else 0.0
-    tonnes = cumulative_kg / 1000.0
-    live_tonnes = live_load_kg / 1000.0
-    car = class_counts.get("car", 0)
-    motorcycle = class_counts.get("motorcycle", 0)
-    bus = class_counts.get("bus", 0)
-    truck = class_counts.get("truck", 0)
-    return f"""
-    <div style="font-family:Inter,system-ui,Arial;">
-      <div style="display:grid;grid-template-columns:1fr 1fr;gap:10px;margin-bottom:12px;">
-        <div style="padding:16px;border-radius:16px;background:linear-gradient(135deg,#1d4ed8,#312e81);color:white;">
-          <div style="font-size:11px;letter-spacing:1px;opacity:.85;">VEHICLES CROSSED</div>
-          <div style="font-size:46px;font-weight:800;line-height:1;">{total_count}</div>
-        </div>
-        <div style="padding:16px;border-radius:16px;background:linear-gradient(135deg,#be185d,#7e22ce);color:white;">
-          <div style="font-size:11px;letter-spacing:1px;opacity:.85;">EST. CUMULATIVE MASS</div>
-          <div style="font-size:36px;font-weight:800;line-height:1;">{tonnes:.1f} t</div>
-        </div>
-      </div>
-      <div style="display:grid;grid-template-columns:1fr 1fr;gap:10px;margin-bottom:12px;">
-        <div style="padding:14px;border:1px solid #e5e7eb;border-radius:14px;background:white;">
-          <div style="font-size:12px;color:#6b7280;">Live bridge load</div>
-          <div style="font-size:28px;font-weight:750;color:#111827;">{live_tonnes:.1f} t</div>
-        </div>
-        <div style="padding:14px;border:1px solid #e5e7eb;border-radius:14px;background:white;">
-          <div style="font-size:12px;color:#6b7280;">Load index</div>
-          <div style="font-size:28px;font-weight:750;color:#111827;">{load_index_percent:.1f}%</div>
-        </div>
-      </div>
-      <div style="padding:14px;border:1px solid #e5e7eb;border-radius:14px;background:#ffffff;margin-bottom:12px;">
-        <div style="font-size:12px;color:#6b7280;margin-bottom:8px;">Crossings by class</div>
-        <div style="display:grid;grid-template-columns:1fr 1fr;gap:8px;font-size:14px;">
-          <div>🚗 Cars: <b>{car}</b></div>
-          <div>🏍️ Motorcycles: <b>{motorcycle}</b></div>
-          <div>🚌 Buses: <b>{bus}</b></div>
-          <div>🚛 Trucks: <b>{truck}</b></div>
-        </div>
-      </div>
-      <div style="font-size:12px;color:#6b7280;margin-bottom:4px;display:flex;justify-content:space-between;">
-        <span>Frame {frame_idx} / {total_frames}</span>
-        <span>{pct:.1f}% · {elapsed:.1f}s · {device}</span>
-      </div>
-      <div style="height:8px;background:#e5e7eb;border-radius:99px;overflow:hidden;">
-        <div style="height:100%;width:{pct:.2f}%;background:#4f46e5;"></div>
-      </div>
-    </div>
-    """
-def render_load_plot(history: List[Dict]) -> np.ndarray:
-    """Render load-index chart as an RGB image for Gradio."""
-    if not history:
-        img = np.ones((320, 600, 3), dtype=np.uint8) * 255
-        cv2.putText(img, "Load index chart will appear here", (60, 165),
-                    cv2.FONT_HERSHEY_SIMPLEX, 0.8, (80, 80, 80), 2, cv2.LINE_AA)
-        return img
-    df = pd.DataFrame(history)
-    # Plot only a manageable number of points for speed.
-    if len(df) > 500:
-        df = df.iloc[np.linspace(0, len(df) - 1, 500).astype(int)]
-    fig, ax = plt.subplots(figsize=(8.0, 3.8), dpi=100)
-    ax.plot(df["time_s"], df["load_index_percent"], linewidth=2)
-    ax.set_title("Estimated Bridge Load Index Over Time")
-    ax.set_xlabel("Video time (seconds)")
-    ax.set_ylabel("Load index (%)")
-    ax.grid(True, alpha=0.25)
-    ax.set_ylim(bottom=0)
-    fig.tight_layout()
-    fig.canvas.draw()
-    rgba = np.asarray(fig.canvas.buffer_rgba())
-    rgb = cv2.cvtColor(rgba, cv2.COLOR_RGBA2RGB)
-    plt.close(fig)
-    return rgb
-def build_final_summary(
     total_count: int,
     class_counts: Dict[str, int],
     cumulative_kg: float,
     peak_live_load_kg: float,
     peak_load_index: float,
-    csv_path: str,
 ) -> str:
-    tonnes = cumulative_kg / 1000.0
-    peak_tonnes = peak_live_load_kg / 1000.0
-    return f"""
-### Final bridge traffic summary
-**Vehicles crossed:** {total_count}
-| Vehicle class | Count |
-|---|---:|
-| Cars | {class_counts.get("car", 0)} |
-| Motorcycles | {class_counts.get("motorcycle", 0)} |
-| Buses | {class_counts.get("bus", 0)} |
-| Trucks | {class_counts.get("truck", 0)} |
-**Cumulative estimated mass:** {tonnes:.2f} tonnes
-**Peak estimated live load:** {peak_tonnes:.2f} tonnes
-**Peak load index:** {peak_load_index:.1f}%
-The CSV output contains the estimated load-index time series for later plotting or analysis.
-> Note: This is a demonstration traffic-load indicator, not a certified structural stress calculation.
 """
 # ---------------------------------------------------------------------
-# Main processing generator
 # ---------------------------------------------------------------------
 def process_video(
     video_path,
-    model_name,
     confidence,
     frame_stride,
     inference_width,
@@ -416,38 +692,64 @@ def process_video(
     roi_top_percent,
     roi_bottom_percent,
     reference_capacity_tonnes,
     car_weight_t,
-    motorcycle_weight_t,
     bus_weight_t,
     truck_weight_t,
 ):
     if video_path is None:
         yield (
             None,
-            build_metrics_html(0, {"car": 0, "motorcycle": 0, "bus": 0, "truck": 0}, 0, 0, 0, 0, 0, 0, DEVICE),
-            render_load_plot([]),
-            "Upload a video to start analysis.",
             None,
             None,
         )
         return
-    # Update demo weights from UI.
-    weights_kg = {
-        2: int(float(car_weight_t) * 1000),
-        3: int(float(motorcycle_weight_t) * 1000),
-        5: int(float(bus_weight_t) * 1000),
-        7: int(float(truck_weight_t) * 1000),
-    }
-    # Keep global-like drawing labels consistent for this run.
-    DEFAULT_WEIGHTS_KG.update(weights_kg)
     cap = cv2.VideoCapture(video_path)
     if not cap.isOpened():
         raise RuntimeError(f"Could not open video: {video_path}")
-    fps = cap.get(cv2.CAP_PROP_FPS)
-    if fps is None or fps <= 1:
         fps = 25.0
     total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT) or 0)
@@ -463,119 +765,134 @@ def process_video(
     roi_bottom_y = int(height * float(roi_bottom_percent) / 100.0)
     if roi_bottom_y <= roi_top_y:
-        roi_top_y = int(height * 0.25)
         roi_bottom_y = int(height * 0.90)
     reference_capacity_kg = max(1.0, float(reference_capacity_tonnes) * 1000.0)
     yield (
         None,
-        build_metrics_html(0, {"car": 0, "motorcycle": 0, "bus": 0, "truck": 0}, 0, 0, 0, 0, total_frames, 0, DEVICE),
-        render_load_plot([]),
-        "### Loading RF-DETR model and starting analysis...",
         None,
         None,
     )
-    model = load_model(str(model_name))
     tracker = sv.ByteTrack(frame_rate=int(round(fps)))
-    # Output files
     out_video_path = tempfile.NamedTemporaryFile(suffix=".mp4", delete=False).name
     out_csv_path = tempfile.NamedTemporaryFile(suffix=".csv", delete=False).name
-    fourcc = cv2.VideoWriter_fourcc(*"mp4v")
-    writer = cv2.VideoWriter(out_video_path, fourcc, fps, (width, height))
-    # State
     last_detections = sv.Detections.empty()
     last_side_by_id: Dict[int, int] = {}
     counted_ids = set()
-    track_class: Dict[int, int] = {}
-    class_counts = {"car": 0, "motorcycle": 0, "bus": 0, "truck": 0}
     total_count = 0
     cumulative_kg = 0.0
     history: List[Dict] = []
-    event_rows: List[Dict] = []
-    start_wall = time.time()
-    last_yield_wall = 0.0
-    last_plot = render_load_plot([])
-    processed_frames = 0
     peak_live_load_kg = 0.0
     peak_load_index = 0.0
     frame_idx = 0
     while True:
         ok, frame = cap.read()
         if not ok:
             break
-        detect_this_frame = (frame_idx % int(frame_stride) == 0)
-        if detect_this_frame:
-            detections = predict_vehicles(
-                model=model,
                 frame_bgr=frame,
                 confidence=float(confidence),
                 inference_width=int(inference_width),
             )
             detections = tracker.update_with_detections(detections)
             last_detections = detections
         else:
             detections = last_detections
-        # Update per-track class and line crossing only when we have tracked detections.
         centres = detection_centres(detections)
         live_load_kg = 0.0
-        active_track_ids = set()
         if len(detections) > 0 and detections.tracker_id is not None:
-            for det_i, (centre, class_id, track_id) in enumerate(
-                zip(centres, detections.class_id, detections.tracker_id)
-            ):
-                if track_id is None or int(track_id) < 0:
                     continue
-                tid = int(track_id)
-                cid = int(class_id)
-                cy = float(centre[1])
-                track_class[tid] = cid
-                active_track_ids.add(tid)
-                # Live bridge-deck load, only if the object is inside the deck ROI.
                 if roi_top_y <= cy <= roi_bottom_y:
-                    live_load_kg += get_class_weight_kg(cid, weights_kg)
                 current_side = side_of_line(cy, line_y)
                 previous_side = last_side_by_id.get(tid)
                 if current_side != 0:
-                    if previous_side is not None and previous_side != 0:
-                        crossed = previous_side != current_side
-                        if crossed and tid not in counted_ids:
-                            vehicle_name = VEHICLE_CLASSES.get(cid, "vehicle")
-                            vehicle_weight = get_class_weight_kg(cid, weights_kg)
-                            direction = "down" if previous_side < current_side else "up"
                             counted_ids.add(tid)
                             total_count += 1
-                            class_counts[vehicle_name] = class_counts.get(vehicle_name, 0) + 1
-                            cumulative_kg += vehicle_weight
-                            event_rows.append({
                                 "video_time_s": frame_idx / fps,
                                 "frame": frame_idx,
                                 "tracker_id": tid,
-                                "vehicle_type": vehicle_name,
                                 "direction": direction,
-                                "estimated_vehicle_weight_kg": vehicle_weight,
                                 "cumulative_estimated_mass_kg": cumulative_kg,
                             })
@@ -585,15 +902,23 @@ def process_video(
         peak_live_load_kg = max(peak_live_load_kg, live_load_kg)
         peak_load_index = max(peak_load_index, load_index_percent)
         history.append({
-            "video_time_s": frame_idx / fps,
             "time_s": frame_idx / fps,
             "frame": frame_idx,
-            "vehicles_crossed_total": total_count,
             "cars_crossed": class_counts.get("car", 0),
             "motorcycles_crossed": class_counts.get("motorcycle", 0),
             "buses_crossed": class_counts.get("bus", 0),
             "trucks_crossed": class_counts.get("truck", 0),
             "live_load_kg": live_load_kg,
             "live_load_tonnes": live_load_kg / 1000.0,
             "load_index_percent": load_index_percent,
@@ -601,14 +926,10 @@ def process_video(
             "cumulative_estimated_mass_tonnes": cumulative_kg / 1000.0,
         })
-        elapsed_wall = time.time() - start_wall
-        processed_frames += 1
-        current_processing_fps = processed_frames / max(elapsed_wall, 1e-6)
-        fps_text = f"{current_processing_fps:.1f} proc FPS"
         annotated = annotate_frame(
             frame=frame,
             detections=detections,
             line_y=line_y,
             roi_top_y=roi_top_y,
             roi_bottom_y=roi_bottom_y,
@@ -617,18 +938,22 @@ def process_video(
             cumulative_kg=cumulative_kg,
             live_load_kg=live_load_kg,
             load_index_percent=load_index_percent,
-            fps_text=fps_text,
         )
         writer.write(annotated)
         now = time.time()
         if now - last_yield_wall >= 0.35:
             last_yield_wall = now
-            # Refresh the chart less often than the frame display.
-            last_plot = render_load_plot(history)
-            rgb_frame = cv2.cvtColor(annotated, cv2.COLOR_BGR2RGB)
             yield (
-                rgb_frame,
                 build_metrics_html(
                     total_count=total_count,
                     class_counts=class_counts,
@@ -637,10 +962,11 @@ def process_video(
                     load_index_percent=load_index_percent,
                     frame_idx=frame_idx + 1,
                     total_frames=total_frames,
-                    elapsed=elapsed_wall,
-                    device=DEVICE,
                 ),
-                last_plot,
                 "### Live analysis running...",
                 None,
                 None,
@@ -651,33 +977,26 @@ def process_video(
     cap.release()
     writer.release()
-    # Save CSV time series. Add event-level detail as separate columns where possible.
     history_df = pd.DataFrame(history)
-    history_df.to_csv(out_csv_path, index=False)
     final_plot = render_load_plot(history)
-    final_summary = build_final_summary(
-        total_count=total_count,
-        class_counts=class_counts,
-        cumulative_kg=cumulative_kg,
-        peak_live_load_kg=peak_live_load_kg,
-        peak_load_index=peak_load_index,
-        csv_path=out_csv_path,
-    )
-    final_frame = None
-    if history:
-        # Try to show the last annotated frame from the output video.
-        cap2 = cv2.VideoCapture(out_video_path)
-        if cap2.isOpened():
-            cap2.set(cv2.CAP_PROP_POS_FRAMES, max(0, frame_idx - 1))
-            ok, last = cap2.read()
-            if ok:
-                final_frame = cv2.cvtColor(last, cv2.COLOR_BGR2RGB)
-            cap2.release()
     yield (
-        final_frame,
         build_metrics_html(
             total_count=total_count,
             class_counts=class_counts,
@@ -686,31 +1005,39 @@ def process_video(
             load_index_percent=0,
             frame_idx=total_frames if total_frames else frame_idx,
             total_frames=total_frames if total_frames else frame_idx,
-            elapsed=time.time() - start_wall,
-            device=DEVICE,
         ),
         final_plot,
-        final_summary,
         out_video_path,
         out_csv_path,
     )
 # ---------------------------------------------------------------------
-# Gradio UI
 # ---------------------------------------------------------------------
 CUSTOM_CSS = """
 .gradio-container {
-    max-width: 1320px !important;
     margin: auto !important;
 }
 #hero {
     text-align: center;
-    padding: 18px 8px 8px 8px;
 }
 #hero h1 {
     font-weight: 850;
-    letter-spacing: -0.6px;
     margin-bottom: 2px;
 }
 #hero p {
@@ -723,7 +1050,7 @@ CUSTOM_CSS = """
     border-radius: 18px;
     padding: 16px;
     background: #ffffff;
-    box-shadow: 0 8px 24px rgba(15, 23, 42, 0.04);
 }
 #live-frame img, #load-plot img {
     border-radius: 14px;
@@ -734,7 +1061,7 @@ footer {
 """
 with gr.Blocks(
-    title="Bridge Traffic Load Demo",
     theme=gr.themes.Soft(primary_hue="indigo", secondary_hue="slate"),
     css=CUSTOM_CSS,
 ) as demo:
@@ -742,53 +1069,68 @@ with gr.Blocks(
     with gr.Row(elem_id="hero"):
         gr.Markdown(
             """
-            # 🌉 Bridge Traffic Load Demo
-            Fast RF-DETR vehicle detection, ByteTrack tracking, line-crossing counts,
-            estimated cumulative vehicle mass, and live bridge load-index over time.
             """
         )
     with gr.Row():
         with gr.Column(scale=1):
             with gr.Group(elem_classes="panel"):
-                gr.Markdown("### 1) Upload video")
                 video_input = gr.Video(
-                    label="Bridge traffic video",
                     sources=["upload"],
                     format="mp4",
                     height=260,
                 )
-                start_btn = gr.Button("▶ Start analysis", variant="primary", size="lg")
-                gr.Markdown("### 2) Speed settings")
-                model_name = gr.Radio(
-                    choices=list(MODEL_OPTIONS.keys()),
-                    value="Nano - fastest",
-                    label="RF-DETR model",
                 )
                 confidence = gr.Slider(
                     minimum=0.10,
                     maximum=0.90,
-                    value=0.40,
                     step=0.05,
                     label="Confidence threshold",
                 )
                 frame_stride = gr.Slider(
                     minimum=1,
-                    maximum=10,
                     value=3,
                     step=1,
                     label="Frame stride",
-                    info="Detect every Nth frame. 1 is most accurate. 3-5 is much faster.",
                 )
                 inference_width = gr.Slider(
                     minimum=384,
                     maximum=1280,
                     value=640,
                     step=64,
-                    label="Inference width",
-                    info="Lower is faster. Try 512 or 640 for CPU demos.",
                 )
                 with gr.Accordion("Bridge settings", open=False):
@@ -814,23 +1156,30 @@ with gr.Blocks(
                         label="Bridge deck ROI bottom (%)",
                     )
                     reference_capacity_tonnes = gr.Slider(
-                        minimum=5,
-                        maximum=200,
                         value=40,
-                        step=5,
                         label="Reference live-load capacity for demo index (tonnes)",
                     )
-                with gr.Accordion("Estimated class weights", open=False):
-                    car_weight_t = gr.Number(value=1.5, label="Car weight estimate (tonnes)")
-                    motorcycle_weight_t = gr.Number(value=0.25, label="Motorcycle weight estimate (tonnes)")
-                    bus_weight_t = gr.Number(value=12.0, label="Bus weight estimate (tonnes)")
-                    truck_weight_t = gr.Number(value=18.0, label="Truck weight estimate (tonnes)")
                 gr.Markdown(
                     """
-                    **For speed:** use **Nano**, inference width **512-640**, and frame stride **3-5**.
-                    Use **Medium** only when you need better detection and have a GPU.
                     """
                 )
@@ -840,7 +1189,7 @@ with gr.Blocks(
                 live_frame = gr.Image(
                     show_label=False,
                     elem_id="live-frame",
-                    height=470,
                 )
             with gr.Row():
@@ -850,14 +1199,15 @@ with gr.Blocks(
                         metrics_html = gr.HTML(
                             value=build_metrics_html(
                                 total_count=0,
-                                class_counts={"car": 0, "motorcycle": 0, "bus": 0, "truck": 0},
                                 cumulative_kg=0,
                                 live_load_kg=0,
                                 load_index_percent=0,
                                 frame_idx=0,
                                 total_frames=0,
                                 elapsed=0,
-                                device=DEVICE,
                             )
                         )
@@ -867,8 +1217,8 @@ with gr.Blocks(
                         load_plot = gr.Image(
                             show_label=False,
                             elem_id="load-plot",
-                            height=310,
-                            value=render_load_plot([]),
                         )
     with gr.Row():
@@ -876,39 +1226,60 @@ with gr.Blocks(
             with gr.Group(elem_classes="panel"):
                 gr.Markdown("### Final annotated video")
                 video_output = gr.Video(label="Replay / download annotated video", height=270)
         with gr.Column(scale=1):
             with gr.Group(elem_classes="panel"):
                 gr.Markdown("### Final summary")
-                summary_output = gr.Markdown("Run an analysis to see the final summary.")
-                csv_output = gr.File(label="Download load-index CSV")
     start_btn.click(
         fn=process_video,
-        inputs=[
-            video_input,
-            model_name,
-            confidence,
-            frame_stride,
-            inference_width,
-            line_position_percent,
-            roi_top_percent,
-            roi_bottom_percent,
-            reference_capacity_tonnes,
-            car_weight_t,
-            motorcycle_weight_t,
-            bus_weight_t,
-            truck_weight_t,
-        ],
-        outputs=[
-            live_frame,
-            metrics_html,
-            load_plot,
-            summary_output,
-            video_output,
-            csv_output,
-        ],
     )
 if __name__ == "__main__":
-    demo.queue(max_size=3).launch()

 """
+Fast Bridge Traffic + Livestock Load Demo
 """
 import os
 import time
 import tempfile
+import warnings
+from pathlib import Path
 from functools import lru_cache
+from typing import Dict, List, Tuple, Optional
 import cv2
 import gradio as gr
 import supervision as sv
 import torch
+# Optional engines
+try:
+    from ultralytics import YOLO
+except Exception:
+    YOLO = None
+try:
+    from rfdetr import RFDETRMedium
+except Exception:
+    RFDETRMedium = None
 # ---------------------------------------------------------------------
+# Quiet noisy dependency warning that is not controlled by this app.
+# The RF-DETR/transformers warning is internal to the dependency stack.
 # ---------------------------------------------------------------------
+warnings.filterwarnings("ignore", message=".*use_return_dict.*")
+warnings.filterwarnings("ignore", message=".*`use_return_dict` is deprecated.*")
+# ---------------------------------------------------------------------
+# App paths and default local video
+# ---------------------------------------------------------------------
+APP_DIR = Path(__file__).resolve().parent
+VIDEO_EXTENSIONS = [".mp4", ".mov", ".avi", ".mkv", ".webm"]
+PREFERRED_VIDEO_NAMES = [
+    "bridge.mp4",
+    "traffic.mp4",
+    "cars.mp4",
+    "video.mp4",
+    "input.mp4",
+    "example.mp4",
+    "sample.mp4",
+]
def find_default_video(
    search_dir: Optional[Path] = None,
    preferred_names: Optional[List[str]] = None,
    extensions: Optional[List[str]] = None,
) -> Optional[str]:
    """Find a video file sitting next to app.py.

    Preferred file names are tried first, in order. If none of them is a
    regular file, the first file (in sorted order) whose name ends with one
    of the known video extensions is used; extensions are tried in list
    order and compared case-insensitively.

    Args:
        search_dir: Directory to search. Defaults to ``APP_DIR``.
        preferred_names: File names to try first. Defaults to
            ``PREFERRED_VIDEO_NAMES``.
        extensions: Extensions (with leading dot) to fall back to. Defaults
            to ``VIDEO_EXTENSIONS``.

    Returns:
        The path of the selected video as a string, or ``None`` when no
        video file is found.
    """
    root = APP_DIR if search_dir is None else Path(search_dir)
    names = PREFERRED_VIDEO_NAMES if preferred_names is None else preferred_names
    exts = VIDEO_EXTENSIONS if extensions is None else extensions

    for name in names:
        candidate = root / name
        # is_file() rather than exists(): a directory that happens to carry
        # a preferred name must not be handed to the video reader.
        if candidate.is_file():
            return str(candidate)

    try:
        files = sorted(p for p in root.iterdir() if p.is_file())
    except OSError:
        # Unreadable or missing directory: behave as "no video found".
        return None

    for ext in exts:
        suffix = ext.lower()
        for path in files:
            # Case-insensitive so that e.g. "CLIP.MP4" is picked up too.
            if path.name.lower().endswith(suffix):
                return str(path)
    return None
+DEFAULT_VIDEO = find_default_video()
+# ---------------------------------------------------------------------
+# Device and speed setup
+# ---------------------------------------------------------------------
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
 try:
     pass
 if DEVICE == "cuda":
+    try:
+        torch.backends.cudnn.benchmark = True
+    except Exception:
+        pass
+# ---------------------------------------------------------------------
+# Target classes and estimated weights
+# ---------------------------------------------------------------------
+# For YOLO COCO:
+# person=0, bicycle=1, car=2, motorcycle=3, bus=5, truck=7,
+# horse=17, sheep=18, cow=19.
+#
+# COCO does not have goat or donkey. We map:
+# sheep -> sheep/goat
+# horse -> horse/donkey
+TARGET_CANONICAL_NAMES = {
+    "person",
+    "bicycle",
+    "car",
+    "motorcycle",
+    "bus",
+    "truck",
+    "cow",
+    "sheep",
+    "goat",
+    "horse",
+    "donkey",
+}
+DISPLAY_NAME = {
+    "person": "person",
+    "bicycle": "bicycle",
+    "car": "car",
+    "motorcycle": "motorcycle",
+    "bus": "bus",
+    "truck": "truck",
+    "cow": "cow",
+    "sheep": "sheep / goat",
+    "goat": "goat",
+    "horse": "horse / donkey",
+    "donkey": "donkey",
+}
+# COCO class names for RF-DETR outputs.
+COCO_NAMES = {
+    0: "person",
+    1: "bicycle",
+    2: "car",
+    3: "motorcycle",
+    5: "bus",
+    7: "truck",
+    17: "horse",
+    18: "sheep",
+    19: "cow",
+}
+# Approximate demo weights in kg.
+# Adjust in the UI for your bridge/traffic context.
+DEFAULT_WEIGHTS_KG = {
+    "person": 75,
+    "bicycle": 120,       # bicycle + rider approximation
+    "motorcycle": 250,
+    "car": 1500,
+    "bus": 12000,
+    "truck": 18000,
+    "cow": 450,
+    "sheep": 60,
+    "goat": 45,
+    "horse": 350,
+    "donkey": 180,
+}
+COLOR_BY_NAME_BGR = {
+    "person": (70, 160, 245),
+    "bicycle": (240, 190, 80),
+    "motorcycle": (255, 150, 80),
+    "car": (60, 210, 130),
+    "bus": (50, 130, 245),
+    "truck": (220, 70, 180),
+    "cow": (160, 120, 80),
+    "sheep": (220, 220, 220),
+    "goat": (210, 210, 230),
+    "horse": (130, 90, 60),
+    "donkey": (120, 110, 95),
+}
 # ---------------------------------------------------------------------
 # Model loading
 # ---------------------------------------------------------------------
@lru_cache(maxsize=4)
def load_yolo_model(model_file: str):
    """Load an Ultralytics YOLO model once and reuse it across runs.

    A weights file with this name next to app.py is preferred; otherwise
    ``model_file`` is passed to ``YOLO`` unchanged. Results are cached per
    ``model_file`` value.

    Args:
        model_file: Weights file name or model identifier.

    Returns:
        The constructed YOLO model.

    Raises:
        RuntimeError: If the ``ultralytics`` import failed at start-up.
    """
    if YOLO is None:
        raise RuntimeError(
            "Ultralytics is not installed. Run: pip install ultralytics"
        )
    local_candidate = APP_DIR / model_file
    model_path = str(local_candidate) if local_candidate.exists() else model_file
    print(f"Loading YOLO model: {model_path} on {DEVICE}")
    model = YOLO(model_path)
    try:
        model.to(DEVICE)
    except Exception as exc:
        # Best effort: the device is also passed on every predict() call, so
        # a failed move is not fatal, but it should not go unnoticed.
        print(f"YOLO model.to({DEVICE}) skipped: {exc}")
    return model
@lru_cache(maxsize=1)
def load_rfdetr_medium():
    """Build the RF-DETR Medium detector once and cache it.

    The constructor is first called with ``device=DEVICE``; if that keyword
    is rejected with ``TypeError`` it is retried without arguments. The
    model is then asked to optimize itself for inference, and a failure of
    that step is reported but not raised.

    Raises:
        RuntimeError: If the ``rfdetr`` import failed at start-up.
    """
    if RFDETRMedium is None:
        raise RuntimeError(
            "RF-DETR is not installed. Run: pip install rfdetr"
        )

    print(f"Loading RF-DETR Medium on {DEVICE}")
    try:
        detector = RFDETRMedium(device=DEVICE)
    except TypeError:
        detector = RFDETRMedium()

    # Addresses the dependency's runtime warning:
    # "Model is not optimized for inference. Latency may be higher..."
    try:
        detector.optimize_for_inference()
    except Exception as exc:
        print(f"RF-DETR optimize_for_inference skipped: {exc}")
    else:
        print("RF-DETR Medium optimized for inference.")
    return detector
 # ---------------------------------------------------------------------
+# Detection conversion
 # ---------------------------------------------------------------------
def yolo_predict_to_supervision(
    model,
    frame_bgr: np.ndarray,
    confidence: float,
    imgsz: int,
) -> Tuple[sv.Detections, List[str]]:
    """Run YOLO on one frame and keep only the target classes.

    Args:
        model: Loaded YOLO model exposing ``predict`` and ``names``.
        frame_bgr: Frame passed to ``model.predict`` as ``source``.
        confidence: Confidence threshold passed as ``conf``.
        imgsz: Inference image size passed as ``imgsz``.

    Returns:
        ``(detections, canonical_names)`` where ``canonical_names[i]`` is
        the canonical class name of ``detections[i]``. Both are empty when
        nothing relevant was detected.
    """
    results = model.predict(
        source=frame_bgr,
        conf=float(confidence),
        imgsz=int(imgsz),
        device=0 if DEVICE == "cuda" else "cpu",
        verbose=False,
    )[0]
    boxes = results.boxes
    if boxes is None or len(boxes) == 0:
        return sv.Detections.empty(), []

    xyxy = boxes.xyxy.detach().cpu().numpy()
    conf = boxes.conf.detach().cpu().numpy()
    cls = boxes.cls.detach().cpu().numpy().astype(int)

    # Accept both an id->name mapping and a plain sequence of names.
    raw_names = getattr(model, "names", None) or {}
    if not isinstance(raw_names, dict):
        raw_names = dict(enumerate(raw_names))

    # Label spellings some custom models use for classes we already track.
    aliases = {"automobile": "car", "lorry": "truck"}

    keep: List[int] = []
    canonical_names: List[str] = []
    for i, class_id in enumerate(cls):
        name = str(raw_names.get(int(class_id), class_id)).lower().strip()
        name = aliases.get(name, name)
        if name in TARGET_CANONICAL_NAMES:
            keep.append(i)
            canonical_names.append(name)

    if not keep:
        return sv.Detections.empty(), []

    keep_idx = np.array(keep, dtype=int)
    detections = sv.Detections(
        xyxy=xyxy[keep_idx],
        confidence=conf[keep_idx],
        class_id=cls[keep_idx],
    )
    return detections, canonical_names
def rfdetr_predict_to_supervision(
    model,
    frame_bgr: np.ndarray,
    confidence: float,
    inference_width: int,
) -> Tuple[sv.Detections, List[str]]:
    """Run RF-DETR Medium on one frame and keep only the target classes.

    Frames wider than ``inference_width`` are shrunk (aspect ratio kept)
    before inference for speed; the surviving boxes are scaled back to the
    original frame coordinates afterwards.

    NOTE(review): class ids are translated through ``COCO_NAMES``, which
    uses the same indices the file lists for YOLO COCO (person=0, car=2,
    ...). Confirm that RF-DETR's ``predict`` reports ids in that same
    convention; if it uses a different COCO id scheme the labels would be
    shifted.

    Returns:
        ``(detections, canonical_names)`` with one name per detection.
    """
    height, width = frame_bgr.shape[:2]

    scale = 1.0
    model_input = frame_bgr
    if inference_width > 0 and width > inference_width:
        scale = float(inference_width) / float(width)
        model_input = cv2.resize(
            frame_bgr,
            (int(width * scale), int(height * scale)),
            interpolation=cv2.INTER_AREA,
        )

    rgb = cv2.cvtColor(model_input, cv2.COLOR_BGR2RGB)
    with torch.inference_mode():
        detections = model.predict(rgb, threshold=float(confidence))

    if len(detections) == 0:
        return detections, []

    # Pair each detection index with its mapped name, then drop the ones
    # that are unmapped or not among the tracked classes.
    labelled = [
        (idx, COCO_NAMES.get(int(cid)))
        for idx, cid in enumerate(detections.class_id)
    ]
    labelled = [(idx, name) for idx, name in labelled if name in TARGET_CANONICAL_NAMES]
    if not labelled:
        return sv.Detections.empty(), []

    keep = np.array([idx for idx, _ in labelled], dtype=int)
    canonical_names = [name for _, name in labelled]

    detections = detections[keep]
    if scale != 1.0 and len(detections) > 0:
        # Undo the pre-inference resize.
        detections.xyxy = detections.xyxy / scale
    return detections, canonical_names
def predict_objects(
    engine: str,
    yolo_model_file: str,
    frame_bgr: np.ndarray,
    confidence: float,
    inference_width: int,
) -> Tuple[sv.Detections, List[str]]:
    """Detect objects in one frame with the selected engine.

    Any ``engine`` label starting with "YOLO" uses the YOLO model named by
    ``yolo_model_file``; every other label uses RF-DETR Medium. Models come
    from the cached loaders.
    """
    if not engine.startswith("YOLO"):
        return rfdetr_predict_to_supervision(
            model=load_rfdetr_medium(),
            frame_bgr=frame_bgr,
            confidence=confidence,
            inference_width=inference_width,
        )

    return yolo_predict_to_supervision(
        model=load_yolo_model(yolo_model_file),
        frame_bgr=frame_bgr,
        confidence=confidence,
        imgsz=inference_width,
    )
 # ---------------------------------------------------------------------
+# Helpers
 # ---------------------------------------------------------------------
+def side_of_line(y: float, line_y: int, dead_zone_px: int = 5) -> int:
     diff = y - line_y
     if abs(diff) <= dead_zone_px:
         return 0
     if len(detections) == 0:
         return np.empty((0, 2), dtype=float)
     xyxy = detections.xyxy
+    return np.column_stack([
+        (xyxy[:, 0] + xyxy[:, 2]) / 2.0,
+        (xyxy[:, 1] + xyxy[:, 3]) / 2.0,
+    ])
def make_empty_plot() -> np.ndarray:
    """Return a white 300x620 placeholder image with a grey hint caption."""
    canvas = np.full((300, 620, 3), 255, dtype=np.uint8)
    caption = "Bridge load index chart will appear here"
    cv2.putText(
        canvas,
        caption,
        (70, 155),
        cv2.FONT_HERSHEY_SIMPLEX,
        0.75,
        (90, 90, 90),
        2,
        cv2.LINE_AA,
    )
    return canvas
def render_load_plot(history: List[Dict]) -> np.ndarray:
    """Render the load-index-over-time chart as an RGB image array.

    Args:
        history: Per-frame records; each must provide ``"time_s"`` and
            ``"load_index_percent"``.

    Returns:
        The rendered chart as an RGB array, or the placeholder image when
        ``history`` is empty.
    """
    if not history:
        return make_empty_plot()

    # Plot at most 600 evenly spaced points. Sampling the list first avoids
    # building a table of every history column on each refresh.
    rows = history
    if len(rows) > 600:
        picks = np.linspace(0, len(rows) - 1, 600).astype(int)
        rows = [rows[i] for i in picks]
    times = [row["time_s"] for row in rows]
    loads = [row["load_index_percent"] for row in rows]

    fig, ax = plt.subplots(figsize=(8.0, 3.5), dpi=100)
    try:
        ax.plot(times, loads, linewidth=2)
        ax.set_title("Estimated Bridge Load Index Over Time")
        ax.set_xlabel("Video time (seconds)")
        ax.set_ylabel("Load index (%)")
        ax.grid(True, alpha=0.25)
        ax.set_ylim(bottom=0)
        fig.tight_layout()
        fig.canvas.draw()
        rgba = np.asarray(fig.canvas.buffer_rgba())
        return cv2.cvtColor(rgba, cv2.COLOR_RGBA2RGB)
    finally:
        # Always release the figure, even if drawing fails; this function is
        # called repeatedly while a video is processed.
        plt.close(fig)
def build_metrics_html(
    total_count: int,
    class_counts: Dict[str, int],
    cumulative_kg: float,
    live_load_kg: float,
    load_index_percent: float,
    frame_idx: int,
    total_frames: int,
    elapsed: float,
    proc_fps: float,
    engine: str,
) -> str:
    """Build the HTML metrics panel shown next to the live frame.

    Args:
        total_count: Number of objects that crossed the counting line.
        class_counts: Crossings keyed by canonical class name; missing
            classes count as zero.
        cumulative_kg: Summed estimated mass of all crossings, in kg.
        live_load_kg: Estimated mass currently on the deck, in kg.
        load_index_percent: Live load relative to the reference capacity.
        frame_idx: Number of frames processed so far.
        total_frames: Frame count reported for the video (0 if unknown).
        elapsed: Wall-clock seconds since processing started.
        proc_fps: Processing speed in frames per second.
        engine: Label of the detection engine in use.

    Returns:
        An HTML fragment as a string.
    """
    pct = (frame_idx / total_frames * 100.0) if total_frames else 0.0
    # Reported frame counts can be lower than the frames actually decoded;
    # keep the progress readout and bar within 0-100%.
    pct = min(100.0, max(0.0, pct))
    tonnes = cumulative_kg / 1000.0
    live_tonnes = live_load_kg / 1000.0

    def c(name: str) -> int:
        return int(class_counts.get(name, 0))

    return f"""
    <div style="font-family:Inter,system-ui,Arial;">
      <div style="display:grid;grid-template-columns:1fr 1fr;gap:10px;margin-bottom:12px;">
        <div style="padding:16px;border-radius:18px;background:linear-gradient(135deg,#1d4ed8,#312e81);color:white;">
          <div style="font-size:11px;letter-spacing:1px;opacity:.86;">OBJECTS CROSSED</div>
          <div style="font-size:46px;font-weight:850;line-height:1;">{total_count}</div>
        </div>
        <div style="padding:16px;border-radius:18px;background:linear-gradient(135deg,#be185d,#7e22ce);color:white;">
          <div style="font-size:11px;letter-spacing:1px;opacity:.86;">CUMULATIVE EST. MASS</div>
          <div style="font-size:36px;font-weight:850;line-height:1;">{tonnes:.1f} t</div>
        </div>
      </div>
      <div style="display:grid;grid-template-columns:1fr 1fr;gap:10px;margin-bottom:12px;">
        <div style="padding:14px;border:1px solid #e5e7eb;border-radius:14px;background:white;">
          <div style="font-size:12px;color:#6b7280;">Live bridge load</div>
          <div style="font-size:28px;font-weight:800;color:#111827;">{live_tonnes:.1f} t</div>
        </div>
        <div style="padding:14px;border:1px solid #e5e7eb;border-radius:14px;background:white;">
          <div style="font-size:12px;color:#6b7280;">Load index</div>
          <div style="font-size:28px;font-weight:800;color:#111827;">{load_index_percent:.1f}%</div>
        </div>
      </div>
      <div style="padding:14px;border:1px solid #e5e7eb;border-radius:14px;background:#ffffff;margin-bottom:12px;">
        <div style="font-size:12px;color:#6b7280;margin-bottom:8px;">Crossings by class</div>
        <div style="display:grid;grid-template-columns:1fr 1fr;gap:7px;font-size:13px;">
          <div>🚶 People: <b>{c("person")}</b></div>
          <div>🚗 Cars: <b>{c("car")}</b></div>
          <div>🏍️ Motorcycles: <b>{c("motorcycle")}</b></div>
          <div>🚲 Bicycles: <b>{c("bicycle")}</b></div>
          <div>🚌 Buses: <b>{c("bus")}</b></div>
          <div>🚛 Trucks: <b>{c("truck")}</b></div>
          <div>🐄 Cows: <b>{c("cow")}</b></div>
          <div>🐑 Sheep/goats: <b>{c("sheep") + c("goat")}</b></div>
          <div>🐴 Horse/donkey: <b>{c("horse") + c("donkey")}</b></div>
        </div>
      </div>
      <div style="font-size:12px;color:#6b7280;margin-bottom:4px;display:flex;justify-content:space-between;">
        <span>Frame {frame_idx} / {total_frames}</span>
        <span>{pct:.1f}% · {elapsed:.1f}s · {proc_fps:.1f} FPS · {DEVICE} · {engine}</span>
      </div>
      <div style="height:8px;background:#e5e7eb;border-radius:999px;overflow:hidden;">
        <div style="height:100%;width:{pct:.2f}%;background:#4f46e5;"></div>
      </div>
    </div>
    """
def draw_dashboard(
    frame: np.ndarray,
    total_count: int,
    cumulative_kg: float,
    live_load_kg: float,
    load_index_percent: float,
    proc_fps: float,
    engine: str,
) -> np.ndarray:
    """Overlay the semi-transparent stats panel in the top-left corner.

    Draws a dark panel blended over the frame, then four text rows: title,
    crossing count with cumulative mass, live load with load index, and
    processing speed with device and engine. Returns the composited frame.
    """
    panel = frame.copy()
    cv2.rectangle(panel, (18, 18), (600, 164), (18, 24, 38), -1)
    frame = cv2.addWeighted(panel, 0.82, frame, 0.18, 0)

    # (text, baseline y, font scale, BGR colour, thickness) for each row.
    text_rows = (
        (
            "BRIDGE TRAFFIC + LIVESTOCK DEMO",
            48, 0.72, (255, 255, 255), 2,
        ),
        (
            f"Crossed: {total_count} | Cumulative est. mass: {cumulative_kg/1000.0:.1f} t",
            82, 0.58, (230, 240, 255), 2,
        ),
        (
            f"Live load: {live_load_kg/1000.0:.1f} t | Load index: {load_index_percent:.1f}%",
            114, 0.58, (220, 245, 230), 2,
        ),
        (
            f"{proc_fps:.1f} processing FPS | {DEVICE} | {engine}",
            144, 0.52, (230, 230, 255), 1,
        ),
    )
    for text, baseline_y, font_scale, colour, thickness in text_rows:
        cv2.putText(
            frame,
            text,
            (34, baseline_y),
            cv2.FONT_HERSHEY_SIMPLEX,
            font_scale,
            colour,
            thickness,
            cv2.LINE_AA,
        )
    return frame
 def annotate_frame(
     frame: np.ndarray,
     detections: sv.Detections,
+    canonical_names: List[str],
     line_y: int,
     roi_top_y: int,
     roi_bottom_y: int,
     cumulative_kg: float,
     live_load_kg: float,
     load_index_percent: float,
+    proc_fps: float,
+    engine: str,
 ) -> np.ndarray:
     h, w = frame.shape[:2]
+    # Bridge deck ROI.
     overlay = frame.copy()
+    cv2.rectangle(overlay, (0, roi_top_y), (w, roi_bottom_y), (90, 90, 90), -1)
     frame = cv2.addWeighted(overlay, 0.08, frame, 0.92, 0)
+    # Counting line.
     cv2.line(frame, (0, line_y), (w, line_y), (40, 230, 255), 3)
+    cv2.putText(
+        frame,
+        "COUNTING LINE",
+        (24, max(28, line_y - 12)),
+        cv2.FONT_HERSHEY_SIMPLEX,
+        0.60,
+        (40, 230, 255),
+        2,
+        cv2.LINE_AA,
+    )
+    # ROI borders.
     cv2.line(frame, (0, roi_top_y), (w, roi_top_y), (170, 170, 170), 1)
     cv2.line(frame, (0, roi_bottom_y), (w, roi_bottom_y), (170, 170, 170), 1)
         if confidences is None:
             confidences = [0.0] * len(detections)
+        for i, (xyxy, conf, tid) in enumerate(zip(detections.xyxy, confidences, tracker_ids)):
+            if i >= len(canonical_names):
+                name = "object"
+            else:
+                name = canonical_names[i]
             x1, y1, x2, y2 = map(int, xyxy)
+            color = COLOR_BY_NAME_BGR.get(name, (80, 220, 255))
+            display = DISPLAY_NAME.get(name, name)
+            weight_t = DEFAULT_WEIGHTS_KG.get(name, 0) / 1000.0
             cv2.rectangle(frame, (x1, y1), (x2, y2), color, 2)
+            id_txt = f"#{int(tid)} " if tid is not None and int(tid) >= 0 else ""
+            label = f"{id_txt}{display} {float(conf):.2f} ~{weight_t:.2f}t"
             (tw, th), base = cv2.getTextSize(label, cv2.FONT_HERSHEY_SIMPLEX, 0.52, 1)
             label_y1 = max(0, y1 - th - base - 8)
             cv2.rectangle(frame, (x1, label_y1), (x1 + tw + 10, y1), color, -1)
+            cv2.putText(
+                frame,
+                label,
+                (x1 + 5, y1 - 6),
+                cv2.FONT_HERSHEY_SIMPLEX,
+                0.52,
+                (255, 255, 255),
+                1,
+                cv2.LINE_AA,
+            )
+    frame = draw_dashboard(
         frame=frame,
         total_count=total_count,
         cumulative_kg=cumulative_kg,
         live_load_kg=live_load_kg,
         load_index_percent=load_index_percent,
+        proc_fps=proc_fps,
+        engine=engine,
     )
+    compact_items = []
+    for k in ["person", "car", "motorcycle", "bicycle", "bus", "truck", "cow", "sheep", "goat", "horse", "donkey"]:
+        v = int(class_counts.get(k, 0))
+        if v > 0:
+            compact_items.append(f"{DISPLAY_NAME.get(k, k)}: {v}")
+    text = " | ".join(compact_items) if compact_items else "No crossings yet"
+    cv2.putText(frame, text[:140], (22, h - 24), cv2.FONT_HERSHEY_SIMPLEX, 0.58, (255, 255, 255), 2, cv2.LINE_AA)
+    return frame
def final_summary_md(
    total_count: int,
    class_counts: Dict[str, int],
    cumulative_kg: float,
    peak_live_load_kg: float,
    peak_load_index: float,
    auto_video_used: str,
) -> str:
    """Build the Markdown summary shown once a run has finished.

    Args:
        total_count: Total number of counted crossings.
        class_counts: Crossings keyed by canonical class name.
        cumulative_kg: Summed estimated mass of all crossings, in kg.
        peak_live_load_kg: Highest live load seen during the run, in kg.
        peak_load_index: Highest load index seen during the run, in percent.
        auto_video_used: Path of the auto-selected local video, or an empty
            string to omit that line.

    Returns:
        Markdown text with a per-class table (classes with zero crossings
        are omitted) followed by the mass and load figures.
    """
    ordered = [
        "person", "bicycle", "car", "motorcycle", "bus", "truck",
        "cow", "sheep", "goat", "horse", "donkey",
    ]
    rows = []
    for name in ordered:
        count = int(class_counts.get(name, 0))
        if count > 0:
            rows.append(f"| {DISPLAY_NAME.get(name, name)} | {count} |")
    if not rows:
        rows.append("| None | 0 |")

    sections = ["### Final summary"]
    if auto_video_used:
        sections.append(f"**Default video used:** `{auto_video_used}`")
    sections.append(f"**Total crossings:** {total_count}")
    sections.append("\n".join(["| Class | Count |", "|---|---:|", *rows]))
    sections.append(
        f"**Cumulative estimated mass:** {cumulative_kg/1000.0:.2f} tonnes"
    )
    sections.append(
        f"**Peak estimated live load:** {peak_live_load_kg/1000.0:.2f} tonnes"
    )
    sections.append(f"**Peak bridge load index:** {peak_load_index:.1f}%")
    sections.append(
        "This is a demonstration traffic-load indicator. Real bridge stress needs axle loads, bridge geometry, material properties, span length, lane position and engineering calibration."
    )

    # Blank lines between sections keep the stats out of the table and stop
    # consecutive lines from merging into a single paragraph.
    return "\n" + "\n\n".join(sections) + "\n"
 # ---------------------------------------------------------------------
+# Main video processing generator
 # ---------------------------------------------------------------------
 def process_video(
     video_path,
+    engine,
+    yolo_model_file,
     confidence,
     frame_stride,
     inference_width,
     roi_top_percent,
     roi_bottom_percent,
     reference_capacity_tonnes,
+    person_weight_kg,
+    bicycle_weight_kg,
+    motorcycle_weight_kg,
     car_weight_t,
     bus_weight_t,
     truck_weight_t,
+    cow_weight_kg,
+    sheep_weight_kg,
+    goat_weight_kg,
+    horse_weight_kg,
+    donkey_weight_kg,
 ):
     if video_path is None:
         yield (
             None,
+            build_metrics_html(0, {}, 0, 0, 0, 0, 0, 0, 0, str(engine)),
+            make_empty_plot(),
+            "No video found. Put an `.mp4` file in the same folder as `app.py`, or upload one.",
             None,
             None,
         )
         return
+    # Gradio can pass a dict in some versions.
+    if isinstance(video_path, dict):
+        video_path = video_path.get("path") or video_path.get("name")
+    if not video_path or not os.path.exists(video_path):
+        yield (
+            None,
+            build_metrics_html(0, {}, 0, 0, 0, 0, 0, 0, 0, str(engine)),
+            make_empty_plot(),
+            f"Video not found: {video_path}",
+            None,
+            None,
+        )
+        return
+    DEFAULT_WEIGHTS_KG.update({
+        "person": int(person_weight_kg),
+        "bicycle": int(bicycle_weight_kg),
+        "motorcycle": int(motorcycle_weight_kg),
+        "car": int(float(car_weight_t) * 1000),
+        "bus": int(float(bus_weight_t) * 1000),
+        "truck": int(float(truck_weight_t) * 1000),
+        "cow": int(cow_weight_kg),
+        "sheep": int(sheep_weight_kg),
+        "goat": int(goat_weight_kg),
+        "horse": int(horse_weight_kg),
+        "donkey": int(donkey_weight_kg),
+    })
     cap = cv2.VideoCapture(video_path)
     if not cap.isOpened():
         raise RuntimeError(f"Could not open video: {video_path}")
+    fps = float(cap.get(cv2.CAP_PROP_FPS) or 25.0)
+    if fps <= 1:
         fps = 25.0
     total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT) or 0)
     roi_bottom_y = int(height * float(roi_bottom_percent) / 100.0)
     if roi_bottom_y <= roi_top_y:
+        roi_top_y = int(height * 0.20)
         roi_bottom_y = int(height * 0.90)
     reference_capacity_kg = max(1.0, float(reference_capacity_tonnes) * 1000.0)
     yield (
         None,
+        build_metrics_html(0, {}, 0, 0, 0, 0, total_frames, 0, 0, str(engine)),
+        make_empty_plot(),
+        f"### Starting analysis on `{Path(video_path).name}`...",
         None,
         None,
     )
+    # Preload model before loop.
+    if str(engine).startswith("YOLO"):
+        _ = load_yolo_model(str(yolo_model_file))
+    else:
+        _ = load_rfdetr_medium()
     tracker = sv.ByteTrack(frame_rate=int(round(fps)))
     out_video_path = tempfile.NamedTemporaryFile(suffix=".mp4", delete=False).name
     out_csv_path = tempfile.NamedTemporaryFile(suffix=".csv", delete=False).name
+    writer = cv2.VideoWriter(
+        out_video_path,
+        cv2.VideoWriter_fourcc(*"mp4v"),
+        fps,
+        (width, height),
+    )
     last_detections = sv.Detections.empty()
+    last_names: List[str] = []
     last_side_by_id: Dict[int, int] = {}
     counted_ids = set()
+    track_name_by_id: Dict[int, str] = {}
+    class_counts = {name: 0 for name in TARGET_CANONICAL_NAMES}
     total_count = 0
     cumulative_kg = 0.0
     history: List[Dict] = []
+    events: List[Dict] = []
     peak_live_load_kg = 0.0
     peak_load_index = 0.0
+    start_wall = time.time()
+    last_yield_wall = 0.0
+    last_plot_wall = 0.0
+    latest_plot = make_empty_plot()
+    processed = 0
     frame_idx = 0
+    final_frame_rgb = None
     while True:
         ok, frame = cap.read()
         if not ok:
             break
+        if frame_idx % int(frame_stride) == 0:
+            detections, names = predict_objects(
+                engine=str(engine),
+                yolo_model_file=str(yolo_model_file),
                 frame_bgr=frame,
                 confidence=float(confidence),
                 inference_width=int(inference_width),
             )
             detections = tracker.update_with_detections(detections)
+            # Preserve name alignment after tracker update.
+            # ByteTrack keeps detections order, so this is usually aligned.
+            if len(names) != len(detections):
+                names = names[:len(detections)]
+                if len(names) < len(detections):
+                    names += ["object"] * (len(detections) - len(names))
             last_detections = detections
+            last_names = names
         else:
             detections = last_detections
+            names = last_names
         centres = detection_centres(detections)
         live_load_kg = 0.0
         if len(detections) > 0 and detections.tracker_id is not None:
+            for i, (centre, tid) in enumerate(zip(centres, detections.tracker_id)):
+                if tid is None or int(tid) < 0:
                     continue
+                tid = int(tid)
+                name = names[i] if i < len(names) else track_name_by_id.get(tid, "object")
+                if name == "object":
+                    continue
+                track_name_by_id[tid] = name
+                cy = float(centre[1])
+                # Live load only for objects currently inside bridge deck ROI.
                 if roi_top_y <= cy <= roi_bottom_y:
+                    live_load_kg += float(DEFAULT_WEIGHTS_KG.get(name, 0))
                 current_side = side_of_line(cy, line_y)
                 previous_side = last_side_by_id.get(tid)
                 if current_side != 0:
+                    if previous_side is not None and previous_side != 0 and previous_side != current_side:
+                        if tid not in counted_ids:
                             counted_ids.add(tid)
                             total_count += 1
+                            class_counts[name] = int(class_counts.get(name, 0)) + 1
+                            weight_kg = float(DEFAULT_WEIGHTS_KG.get(name, 0))
+                            cumulative_kg += weight_kg
+                            direction = "down" if previous_side < current_side else "up"
+                            events.append({
                                 "video_time_s": frame_idx / fps,
                                 "frame": frame_idx,
                                 "tracker_id": tid,
+                                "object_type": name,
+                                "display_type": DISPLAY_NAME.get(name, name),
                                 "direction": direction,
+                                "estimated_weight_kg": weight_kg,
                                 "cumulative_estimated_mass_kg": cumulative_kg,
                             })
         peak_live_load_kg = max(peak_live_load_kg, live_load_kg)
         peak_load_index = max(peak_load_index, load_index_percent)
+        elapsed = time.time() - start_wall
+        processed += 1
+        proc_fps = processed / max(elapsed, 1e-6)
         history.append({
             "time_s": frame_idx / fps,
             "frame": frame_idx,
+            "total_crossings": total_count,
+            "people_crossed": class_counts.get("person", 0),
+            "bicycles_crossed": class_counts.get("bicycle", 0),
             "cars_crossed": class_counts.get("car", 0),
             "motorcycles_crossed": class_counts.get("motorcycle", 0),
             "buses_crossed": class_counts.get("bus", 0),
             "trucks_crossed": class_counts.get("truck", 0),
+            "cows_crossed": class_counts.get("cow", 0),
+            "sheep_goats_crossed": class_counts.get("sheep", 0) + class_counts.get("goat", 0),
+            "horse_donkey_crossed": class_counts.get("horse", 0) + class_counts.get("donkey", 0),
             "live_load_kg": live_load_kg,
             "live_load_tonnes": live_load_kg / 1000.0,
             "load_index_percent": load_index_percent,
             "cumulative_estimated_mass_tonnes": cumulative_kg / 1000.0,
         })
         annotated = annotate_frame(
             frame=frame,
             detections=detections,
+            canonical_names=names,
             line_y=line_y,
             roi_top_y=roi_top_y,
             roi_bottom_y=roi_bottom_y,
             cumulative_kg=cumulative_kg,
             live_load_kg=live_load_kg,
             load_index_percent=load_index_percent,
+            proc_fps=proc_fps,
+            engine=str(engine),
         )
         writer.write(annotated)
+        final_frame_rgb = cv2.cvtColor(annotated, cv2.COLOR_BGR2RGB)
         now = time.time()
+        if now - last_plot_wall >= 1.0:
+            latest_plot = render_load_plot(history)
+            last_plot_wall = now
         if now - last_yield_wall >= 0.35:
             last_yield_wall = now
             yield (
+                final_frame_rgb,
                 build_metrics_html(
                     total_count=total_count,
                     class_counts=class_counts,
                     load_index_percent=load_index_percent,
                     frame_idx=frame_idx + 1,
                     total_frames=total_frames,
+                    elapsed=elapsed,
+                    proc_fps=proc_fps,
+                    engine=str(engine),
                 ),
+                latest_plot,
                 "### Live analysis running...",
                 None,
                 None,
     cap.release()
     writer.release()
     history_df = pd.DataFrame(history)
+    events_df = pd.DataFrame(events)
+    if not events_df.empty:
+        # Save both frame-level history and crossing events in one CSV-like file
+        # by writing two separate CSV sections.
+        with open(out_csv_path, "w", encoding="utf-8") as f:
+            f.write("# FRAME_LEVEL_LOAD_INDEX\n")
+            history_df.to_csv(f, index=False)
+            f.write("\n# CROSSING_EVENTS\n")
+            events_df.to_csv(f, index=False)
+    else:
+        history_df.to_csv(out_csv_path, index=False)
+    elapsed = time.time() - start_wall
+    proc_fps = processed / max(elapsed, 1e-6)
     final_plot = render_load_plot(history)
     yield (
+        final_frame_rgb,
         build_metrics_html(
             total_count=total_count,
             class_counts=class_counts,
             load_index_percent=0,
             frame_idx=total_frames if total_frames else frame_idx,
             total_frames=total_frames if total_frames else frame_idx,
+            elapsed=elapsed,
+            proc_fps=proc_fps,
+            engine=str(engine),
         ),
         final_plot,
+        final_summary_md(
+            total_count=total_count,
+            class_counts=class_counts,
+            cumulative_kg=cumulative_kg,
+            peak_live_load_kg=peak_live_load_kg,
+            peak_load_index=peak_load_index,
+            auto_video_used=video_path if str(video_path).startswith(str(APP_DIR)) else "",
+        ),
         out_video_path,
         out_csv_path,
     )
 # ---------------------------------------------------------------------
+# UI
 # ---------------------------------------------------------------------
 # Extra stylesheet handed to gr.Blocks(css=CUSTOM_CSS). The selectors target
 # the page container plus the "hero", "live-frame" and "load-plot" element ids
 # assigned to components in the layout.
 CUSTOM_CSS = """
 .gradio-container {
+    max-width: 1360px !important;
     margin: auto !important;
 }
 #hero {
     text-align: center;
+    padding: 16px 8px 6px 8px;
 }
 #hero h1 {
     font-weight: 850;
+    letter-spacing: -0.8px;
     margin-bottom: 2px;
 }
 #hero p {
     border-radius: 18px;
     padding: 16px;
     background: #ffffff;
+    box-shadow: 0 8px 24px rgba(15, 23, 42, 0.045);
 }
 #live-frame img, #load-plot img {
     border-radius: 14px;
 """
 # Gradio layout: video input and tuning controls, live outputs (frame,
 # metrics, load plot), final results (video, summary, CSV), and the event
 # wiring that routes all of them through process_video.
 with gr.Blocks(
+    title="Fast Bridge Traffic + Livestock Load Demo",
     theme=gr.themes.Soft(primary_hue="indigo", secondary_hue="slate"),
     css=CUSTOM_CSS,
 ) as demo:
     # Page banner; elem_id="hero" ties it to the #hero rules in CUSTOM_CSS.
     with gr.Row(elem_id="hero"):
         gr.Markdown(
             """
+            # 🌉 Fast Bridge Traffic + Livestock Load Demo
+            YOLO-small / RF-DETR Medium detection, ByteTrack tracking, line-crossing counts,
+            estimated object weights, and live bridge load-index over time.
             """
         )
     # Status note: shows the default video's file name when DEFAULT_VIDEO is
     # truthy, otherwise asks the user to upload or add one.
+    if DEFAULT_VIDEO:
+        gr.Markdown(f"✅ Found default video next to `app.py`: `{Path(DEFAULT_VIDEO).name}`. The app will auto-start inference when opened.")
+    else:
+        gr.Markdown("⚠️ No local video found next to `app.py`. Upload a video or place `bridge.mp4`, `traffic.mp4`, `input.mp4`, or any `.mp4` in the same folder.")
     with gr.Row():
         with gr.Column(scale=1):
             with gr.Group(elem_classes="panel"):
+                gr.Markdown("### 1) Video")
                 # Upload-only video widget, pre-filled with DEFAULT_VIDEO.
                 video_input = gr.Video(
+                    label="Video input",
                     sources=["upload"],
+                    value=DEFAULT_VIDEO,
                     format="mp4",
                     height=260,
                 )
+                start_btn = gr.Button("▶ Start / rerun analysis", variant="primary", size="lg")
+                gr.Markdown("### 2) Inference engine")
                 # Detector selection; the chosen label string is what gets
                 # passed to process_video as the `engine` input.
+                engine = gr.Radio(
+                    choices=[
+                        "YOLO small - fastest recommended",
+                        "RF-DETR Medium - slower but strong",
+                    ],
+                    value="YOLO small - fastest recommended",
+                    label="Engine",
                 )
                 # Free-text YOLO weights file/name (default "yolo11s.pt").
+                yolo_model_file = gr.Textbox(
+                    value="yolo11s.pt",
+                    label="YOLO model file/name",
+                    info="Use yolo11s.pt for small. Put your custom .pt in the same folder as app.py and type its filename here.",
+                )
                 # Detection tuning sliders: confidence threshold, frame
                 # stride, and inference image size.
                 confidence = gr.Slider(
                     minimum=0.10,
                     maximum=0.90,
+                    value=0.35,
                     step=0.05,
                     label="Confidence threshold",
                 )
                 frame_stride = gr.Slider(
                     minimum=1,
+                    maximum=12,
                     value=3,
                     step=1,
                     label="Frame stride",
+                    info="Detect every Nth frame. 3-5 is much faster than every frame.",
                 )
                 inference_width = gr.Slider(
                     minimum=384,
                     maximum=1280,
                     value=640,
                     step=64,
+                    label="Inference image size / width",
+                    info="Lower is faster. Try 512 or 640 for fast demos.",
                 )
                 with gr.Accordion("Bridge settings", open=False):
                         label="Bridge deck ROI bottom (%)",
                     )
                     # Capacity reference for the demo load index, in tonnes
                     # (1-250, default 40).
                     reference_capacity_tonnes = gr.Slider(
+                        minimum=1,
+                        maximum=250,
                         value=40,
+                        step=1,
                         label="Reference live-load capacity for demo index (tonnes)",
                     )
+                with gr.Accordion("Estimated weights", open=False):
                     # Per-class weight estimates. Units are mixed: car, bus and
                     # truck are entered in tonnes (the *_t fields); every other
                     # class is entered in kilograms (the *_kg fields).
+                    person_weight_kg = gr.Number(value=75, label="Person weight estimate (kg)")
+                    bicycle_weight_kg = gr.Number(value=120, label="Bicycle + rider estimate (kg)")
+                    motorcycle_weight_kg = gr.Number(value=250, label="Motorcycle estimate (kg)")
+                    car_weight_t = gr.Number(value=1.5, label="Car estimate (tonnes)")
+                    bus_weight_t = gr.Number(value=12.0, label="Bus estimate (tonnes)")
+                    truck_weight_t = gr.Number(value=18.0, label="Truck estimate (tonnes)")
+                    cow_weight_kg = gr.Number(value=450, label="Cow estimate (kg)")
+                    sheep_weight_kg = gr.Number(value=60, label="Sheep estimate (kg)")
+                    goat_weight_kg = gr.Number(value=45, label="Goat estimate (kg)")
+                    horse_weight_kg = gr.Number(value=350, label="Horse estimate (kg)")
+                    donkey_weight_kg = gr.Number(value=180, label="Donkey estimate (kg)")
                 gr.Markdown(
                     """
+                    **Fast demo settings:** YOLO small, confidence 0.30-0.40,
+                    frame stride 3-5, image size 512-640.
                     """
                 )
                 # Image slot for the annotated frame (first entry of `outputs`).
                 live_frame = gr.Image(
                     show_label=False,
                     elem_id="live-frame",
+                    height=500,
                 )
             with gr.Row():
                         # Placeholder metrics (all zero, engine "not started")
                         # displayed until a run produces real values.
                         metrics_html = gr.HTML(
                             value=build_metrics_html(
                                 total_count=0,
+                                class_counts={},
                                 cumulative_kg=0,
                                 live_load_kg=0,
                                 load_index_percent=0,
                                 frame_idx=0,
                                 total_frames=0,
                                 elapsed=0,
+                                proc_fps=0,
+                                engine="not started",
                             )
                         )
                         # Load plot image, initialised with make_empty_plot().
                         load_plot = gr.Image(
                             show_label=False,
                             elem_id="load-plot",
+                            height=300,
+                            value=make_empty_plot(),
                         )
     with gr.Row():
             with gr.Group(elem_classes="panel"):
                 gr.Markdown("### Final annotated video")
                 video_output = gr.Video(label="Replay / download annotated video", height=270)
         with gr.Column(scale=1):
             with gr.Group(elem_classes="panel"):
                 gr.Markdown("### Final summary")
+                summary_output = gr.Markdown("The summary will appear after analysis.")
+                csv_output = gr.File(label="Download CSV")
     # Components whose values are sent to process_video.
     # NOTE: Gradio passes these positionally, so keep the order in sync with
     # process_video's parameter order.
+    inputs = [
+        video_input,
+        engine,
+        yolo_model_file,
+        confidence,
+        frame_stride,
+        inference_width,
+        line_position_percent,
+        roi_top_percent,
+        roi_bottom_percent,
+        reference_capacity_tonnes,
+        person_weight_kg,
+        bicycle_weight_kg,
+        motorcycle_weight_kg,
+        car_weight_t,
+        bus_weight_t,
+        truck_weight_t,
+        cow_weight_kg,
+        sheep_weight_kg,
+        goat_weight_kg,
+        horse_weight_kg,
+        donkey_weight_kg,
+    ]
     # Components updated from each 6-tuple yielded by process_video, in order:
     # frame, metrics HTML, load plot, summary markdown, video file, CSV file.
+    outputs = [
+        live_frame,
+        metrics_html,
+        load_plot,
+        summary_output,
+        video_output,
+        csv_output,
+    ]
     # Manual trigger: the button runs process_video with the current settings.
     start_btn.click(
         fn=process_video,
+        inputs=inputs,
+        outputs=outputs,
     )
+    # Auto-start when a local video exists beside app.py.
+    if DEFAULT_VIDEO:
+        demo.load(
+            fn=process_video,
+            inputs=inputs,
+            outputs=outputs,
+        )
 # Script entry point: turn on Gradio's request queue with max_size=2, then
 # launch the app.
 if __name__ == "__main__":
+    demo.queue(max_size=2).launch()