mlbench123 commited on
Commit
309e137
·
verified ·
1 Parent(s): 538b7f4

Upload 4 files

Browse files
Files changed (4) hide show
  1. head_detection_single_video_best.pt +3 -0
  2. requirements.txt +21 -0
  3. run7.py +829 -0
  4. yolo11x.pt +3 -0
head_detection_single_video_best.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72a33be921c31b44083693db0d03025604fe60c94d4846a168fe7f93d158a15a
3
+ size 16737774
requirements.txt ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Core Dependencies
2
+ numpy==1.24.3
3
+ opencv-python==4.8.1.78
4
+ scipy==1.11.4
5
+
6
+ # Computer Vision & Object Detection (CPU-only for Mac)
7
+ torch==2.1.0
8
+ torchvision==0.16.0
9
+ ultralytics==8.1.3
10
+
11
+ # Data Processing
12
+ pandas==2.1.4
13
+ openpyxl==3.1.2
14
+
15
+ # Optional but recommended for better UX
16
+ tqdm==4.66.1 # Progress bars
17
+ PyYAML==6.0.1 # Configuration files
18
+
19
+ # Optional visualization (can be removed if client doesn't need)
20
+ matplotlib==3.8.0
21
+ seaborn==0.13.0
run7.py ADDED
@@ -0,0 +1,829 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # run7.py
2
+
3
+ # Updated to implement Option 1 directional crossing:
4
+ # - Detect directional crossing of L1 then L2 (L1 coords and L2 coords provided)
5
+ # - Maintain a global counter that increments only when an ID crosses L1 (outside->inside) then later crosses L2 (outside->inside)
6
+ # - Maintain a live "inside polygon" counter
7
+ # - Visualize both counters in Zone Summary panel
8
+ # - Keeps all previous features: homography patch, foot-point mapping, travel distance, avg time, occlusion tolerance and reappearance inheritance
9
+ # Paste and run. Output video and person_times.xlsx saved in working folder.
10
+
11
+ import cv2
12
+ import numpy as np
13
+ import time
14
+ import torch
15
+ import pandas as pd
16
+ from collections import defaultdict, deque
17
+ from scipy.ndimage import gaussian_filter1d
18
+ from ultralytics import YOLO
19
+ import os
20
+
21
# ---------------- Points in image (given) - adjust if needed
# Calibration corners of the monitored zone, in image pixel coordinates.
A = (440.0, 829.0)
B = (883.0, 928.0)
C = (1052.0, 325.0)
D = (739.0, 297.0)
E = (727.0, 688.0)  # lower end of the center divider (used in the schematic patch)
F = (893.0, 312.0)  # upper end of the center divider (used in the schematic patch)

# Quadrilateral zone used for the inside/outside test (order A->B->C->D).
POLYGON = np.array([A, B, C, D], dtype=np.float32)

# ---------------- Real-world segment lengths for path C -> B -> A -> D (meters)
SEG_REAL_M = [5.0, 2.5, 5.0] # C->B, B->A, A->D
# image path (order C,B,A,D)
PATH_IMAGE = np.array([C, B, A, D], dtype=np.float32)

# Patch base scaling (pixels per meter). Will adapt to fit.
BASE_SCALE_PX_PER_M = 80.0
# Width (pixels) of the summary panel appended to the right of each frame.
RIGHT_PANEL_W = 350

# Exponential-smoothing weight for patch dot positions (higher = follows detections faster).
SMOOTH_ALPHA = 0.65
# Seconds a tracked ID may go unseen before it is treated as having exited.
MISSING_TIMEOUT = 3.0

# ---------------- Lines (L1, L2) coordinates (image space) - use these for counting
L1_p1 = (898.0, 322.0)
L1_p2 = (1020.0, 453.0)
L2_p1 = (786.0, 576.0)
L2_p2 = (977.0, 607.0)
48
+
49
+ # ---------------- Utilities
50
def progress_bar(current, total, bar_length=30):
    """Print a single-line console progress bar for frame processing.

    Does nothing when *total* is not positive (e.g. frame count unknown).
    """
    if total <= 0:
        return
    fraction = current / total
    done = int(fraction * bar_length)
    meter = "█" * done + "-" * (bar_length - done)
    print(f"\r[{meter}] {int(fraction * 100)}% Frame {current}/{total}", end="")
57
+
58
def point_in_polygon(cx, cy, polygon):
    """Return True when (cx, cy) lies inside or on the boundary of *polygon*."""
    verdict = cv2.pointPolygonTest(polygon.astype(np.int32), (int(cx), int(cy)), False)
    return verdict >= 0
60
+
61
def euclid(a, b):
    """Euclidean distance between 2-D points *a* and *b*."""
    dx = a[0] - b[0]
    dy = a[1] - b[1]
    return float(np.hypot(dx, dy))
63
+
64
def fmt(t):
    """Format a duration of *t* seconds as an HH:MM:SS string (wraps at 24 h)."""
    parts = time.gmtime(t)
    return time.strftime('%H:%M:%S', parts)
66
+
67
def calculate_foot_from_head(head_box, head_center):
    """Estimate a foot position from a head detection.

    The body is assumed to extend straight down from the head center by
    ~5.5 head-heights, so the foot shares the head's x coordinate.
    """
    _, y_top, _, y_bottom = head_box
    cx, cy = head_center
    estimated_body_length = (y_bottom - y_top) * 5.5
    return cx, cy + estimated_body_length
76
+
77
def nms_obb(boxes, scores, threshold=0.4):
    """Non-Maximum Suppression for Oriented Bounding Boxes.

    Args:
        boxes: list of flattened 8-value polygons [x1, y1, ..., x4, y4].
        scores: confidence score per box, same length as *boxes*.
        threshold: IoU above which the lower-scored box is suppressed.

    Returns:
        list[int]: indices of the kept boxes, highest score first.

    The OBBs are approximated by their axis-aligned extents for the IoU
    computation — cheap and adequate for near-upright head detections.
    """
    if len(boxes) == 0:
        return []

    boxes_np = np.asarray(boxes, dtype=np.float64)
    scores_np = np.asarray(scores, dtype=np.float64)

    # Axis-aligned extents of each oriented polygon.
    x_coords = boxes_np[:, 0::2]
    y_coords = boxes_np[:, 1::2]

    x_min = x_coords.min(axis=1)
    y_min = y_coords.min(axis=1)
    x_max = x_coords.max(axis=1)
    y_max = y_coords.max(axis=1)

    areas = (x_max - x_min) * (y_max - y_min)
    order = scores_np.argsort()[::-1]  # highest score first

    keep = []
    while order.size > 0:
        i = order[0]
        keep.append(int(i))  # plain int, not numpy scalar

        # Intersection of the current best box with all remaining boxes.
        xx1 = np.maximum(x_min[i], x_min[order[1:]])
        yy1 = np.maximum(y_min[i], y_min[order[1:]])
        xx2 = np.minimum(x_max[i], x_max[order[1:]])
        yy2 = np.minimum(y_max[i], y_max[order[1:]])

        w = np.maximum(0.0, xx2 - xx1)
        h = np.maximum(0.0, yy2 - yy1)
        intersection = w * h

        union = areas[i] + areas[order[1:]] - intersection
        # Epsilon guards against 0/0 (NaN) for degenerate zero-area boxes.
        iou = intersection / (union + 1e-12)

        inds = np.where(iou <= threshold)[0]
        order = order[inds + 1]

    return keep
117
+
118
+ # ---------------- Project point onto polyline (returns along distance in px and proj point)
119
# ---------------- Project point onto polyline (returns along distance in px and proj point)
def project_point_to_polyline(pt, poly):
    """Project *pt* onto polyline *poly*.

    Returns (along_px, (px, py)): the cumulative pixel distance from the
    start of the polyline to the closest projection, and the projected
    point itself. Projections are clamped to each segment's endpoints.
    """
    p = np.array(pt, dtype=np.float32)
    best = None       # (perpendicular distance, along distance, projection)
    walked = 0.0      # pixel length of all segments already passed
    for start, end in zip(poly[:-1], poly[1:]):
        a = np.array(start, dtype=np.float32)
        b = np.array(end, dtype=np.float32)
        seg = b - a
        seg_len = float(np.hypot(seg[0], seg[1]))
        if seg_len == 0:
            t = 0.0
            proj = a.copy()
        else:
            t = float(np.dot(p - a, seg) / (seg_len * seg_len))
            t = min(1.0, max(0.0, t))
            proj = a + t * seg
        perp = float(np.hypot(proj[0] - p[0], proj[1] - p[1]))
        if best is None or perp < best[0]:
            best = (perp, walked + t * seg_len, proj)
        walked += seg_len
    return float(best[1]), (float(best[2][0]), float(best[2][1]))
145
+
146
def polyline_pixel_lengths(poly):
    """Pixel length of each consecutive segment of polyline *poly*."""
    return [float(np.hypot(q[0] - p[0], q[1] - p[1])) for p, q in zip(poly[:-1], poly[1:])]
148
+
149
+ # ---------------- Compute conversion per segment (image)
150
+ img_seg_px_lengths = polyline_pixel_lengths(PATH_IMAGE)
151
+ if len(img_seg_px_lengths) != len(SEG_REAL_M):
152
+ raise RuntimeError("PATH_IMAGE and SEG_REAL_M length mismatch")
153
+
154
+ seg_px_to_m = []
155
+ for px_len, m_len in zip(img_seg_px_lengths, SEG_REAL_M):
156
+ seg_px_to_m.append((m_len / px_len) if px_len > 1e-6 else 0.0)
157
+
158
+ # helper: compute along_m from an image point using image PATH_IMAGE
159
+ def image_point_to_along_m(pt):
160
+ along_px, _ = project_point_to_polyline(pt, PATH_IMAGE)
161
+ px_cum = 0.0
162
+ cum_m = 0.0
163
+ for i, seg_px in enumerate(img_seg_px_lengths):
164
+ next_px = px_cum + seg_px
165
+ if along_px <= next_px + 1e-9:
166
+ offset_px = along_px - px_cum
167
+ along_m = cum_m + offset_px * seg_px_to_m[i]
168
+ return float(max(0.0, min(sum(SEG_REAL_M), along_m)))
169
+ px_cum = next_px
170
+ cum_m += SEG_REAL_M[i]
171
+ return float(sum(SEG_REAL_M))
172
+
173
+ # ---------------- Build patch rectangle layout (pixel coordinates)
174
+ def build_patch_layout(scale_px_per_m):
175
+ margin = 18
176
+ rect_w_px = int(2.5 * scale_px_per_m)
177
+ rect_h_px = int(5.0 * scale_px_per_m)
178
+ patch_w = rect_w_px + 2*margin
179
+ patch_h = rect_h_px + 2*margin
180
+ left_x = margin
181
+ right_x = margin + rect_w_px
182
+ top_y = margin
183
+ bottom_y = margin + rect_h_px
184
+ # top row: D (left-top), F (mid-top), C (right-top)
185
+ D_p = (left_x, top_y)
186
+ F_p = ( (left_x + right_x)//2, top_y )
187
+ C_p = (right_x, top_y)
188
+ A_p = (left_x, bottom_y)
189
+ B_p = (right_x, bottom_y)
190
+ # E point down from F
191
+ E_p = (F_p[0], top_y + int(rect_h_px * 0.55))
192
+ path_patch = np.array([C_p, B_p, A_p, D_p], dtype=np.float32) # C->B->A->D
193
+ extras = {"patch_w": patch_w, "patch_h": patch_h, "D": D_p, "F": F_p, "C": C_p, "A": A_p, "B": B_p, "E": E_p, "scale": scale_px_per_m}
194
+ return path_patch, extras
195
+
196
# Default patch layout at module scale; process_video() shrinks a local copy
# if the patch does not fit under the frame height.
PATCH_PATH, PATCH_EXTRAS = build_patch_layout(BASE_SCALE_PX_PER_M)
PATCH_W = PATCH_EXTRAS["patch_w"]
PATCH_H = PATCH_EXTRAS["patch_h"]
199
+
200
# ---------------- Line helpers for crossing detection
def line_coeffs(p1, p2):
    """Coefficients (a, b, c) of the infinite line a*x + b*y + c = 0 through p1 and p2."""
    (x1, y1), (x2, y2) = p1, p2
    return (y1 - y2, x2 - x1, x1 * y2 - x2 * y1)
208
+
209
def signed_dist_to_line(p, line_coeff):
    """Signed perpendicular distance from point *p* to the line (a, b, c).

    The sign identifies which half-plane *p* lies in; a tiny epsilon in
    the denominator avoids division by zero for degenerate lines.
    """
    a, b, c = line_coeff
    numerator = a * p[0] + b * p[1] + c
    return numerator / (np.hypot(a, b) + 1e-12)
213
+
214
def segment_intersects(a1, a2, b1, b2):
    """Return True when segments a1-a2 and b1-b2 properly cross each other."""
    def orient(p, q, r):
        # True when the ordered triple (p, q, r) makes a counter-clockwise turn.
        return (r[1] - p[1]) * (q[0] - p[0]) > (q[1] - p[1]) * (r[0] - p[0])
    return (orient(a1, b1, b2) != orient(a2, b1, b2)) and \
           (orient(a1, a2, b1) != orient(a1, a2, b2))
220
+
221
# Implicit-line coefficients for the two counting lines.
L1_coeff = line_coeffs(L1_p1, L1_p2)
L2_coeff = line_coeffs(L2_p1, L2_p2)

# Determine inside side for each line using polygon centroid:
# the sign of the centroid's signed distance defines which half-plane counts
# as "inside"; a zero sign (centroid exactly on the line) defaults to +1.
poly_centroid = tuple(np.mean(POLYGON, axis=0).tolist())
L1_inside_sign = np.sign(signed_dist_to_line(poly_centroid, L1_coeff))
if L1_inside_sign == 0:
    L1_inside_sign = 1.0
L2_inside_sign = np.sign(signed_dist_to_line(poly_centroid, L2_coeff))
if L2_inside_sign == 0:
    L2_inside_sign = 1.0
232
+
233
# ---------------- BBox smoother
class BBoxSmoother:
    """Temporal smoother for per-track bounding boxes.

    Keeps a short history of boxes per track ID and returns a
    Gaussian-filtered box once at least three observations exist;
    otherwise the latest raw box is passed through unchanged.
    """

    def __init__(self, buffer_size=5):
        self.buf = buffer_size
        self.hist = defaultdict(lambda: deque(maxlen=buffer_size))

    def smooth(self, boxes, ids):
        """Smooth *boxes* (one per track in *ids*); returns an ndarray of boxes."""
        smoothed = []
        for raw_box, track_id in zip(boxes, ids):
            history = self.hist[track_id]
            history.append(raw_box)
            stacked = np.array(history)
            if stacked.shape[0] < 3:
                smoothed.append(stacked[-1])
            else:
                smoothed.append(gaussian_filter1d(stacked, sigma=1, axis=0)[-1])
        return np.array(smoothed)
249
+
250
# ---------------- Main processing function
def process_video(
    input_video_path="crop_video.mp4",
    output_video_path="people_polygon_tracking_corrected.avi",
    model_name="yolo11x.pt",
    head_model_name="head_detection_model.pt",
    conf_threshold=0.3,
    img_size=1280,
    use_gpu=True,
    enhance_frames=False,
    smooth_bbox_tracks=True,
    missing_timeout=MISSING_TIMEOUT
):
    """Track people in the queue zone and write an annotated video + Excel report.

    Per frame: runs YOLO person tracking (ByteTrack) plus an OBB head
    detector, fuses head/person detections into a foot point, tests that
    point against POLYGON, detects directional L1->L2 crossings for a
    global counter, maps the foot point through a homography into a
    schematic top-down patch, and composites frame + summary panel + patch
    into the output video. On completion, per-ID queue times are exported
    to person_times.xlsx.

    Args:
        input_video_path: source video file.
        output_video_path: annotated output video (MJPG .avi).
        model_name: YOLO weights for person detection/tracking.
        head_model_name: YOLO OBB weights for head detection.
        conf_threshold: detection confidence threshold for both models.
        img_size: inference image size.
        use_gpu: use CUDA when available (also enables half precision).
        enhance_frames: apply denoising to each frame (slow).
        smooth_bbox_tracks: temporally smooth boxes with BBoxSmoother.
        missing_timeout: seconds an ID may go unseen before it "exits".

    Raises:
        RuntimeError: when the input video or output writer cannot be opened.

    NOTE(review): all timing uses wall-clock time.time(), not frame
    timestamps — "time in queue" therefore reflects processing speed,
    not video time. Confirm this is intended before relying on the report.
    """
    device = "cuda" if torch.cuda.is_available() and use_gpu else "cpu"
    model = YOLO(model_name)
    PERSON_CLASS = 0  # COCO class id for "person"
    head_model = YOLO(head_model_name)  # Your OBB head detection model
    HEAD_CLASS = 0
    bbox_smoother = BBoxSmoother(5) if smooth_bbox_tracks else None

    # persistent state (all keyed by tracker ID)
    inside_state = {}                       # id -> currently inside polygon?
    entry_time = {}                         # id -> wall-clock time of current entry
    accumulated_time = defaultdict(float)   # id -> total seconds spent inside
    first_entry_vid = {}                    # id -> first entry (seconds since start)
    last_exit_vid = {}                      # id -> last exit (seconds since start)
    last_seen = {}                          # id -> wall-clock time last detected
    prev_along = {}                         # id -> last along-path position (m)
    prev_time = {}                          # id -> time of last along-path update
    entry_along = {}                        # id -> along-path position at entry (m)
    travel_distance = defaultdict(float)    # id -> forward-only distance walked (m)

    display_pos = {}                        # id -> smoothed patch coordinates
    head_foot_positions = {}  # Stores head detections with estimated foot positions
    person_only_ids = set()  # Track person-only detections
    head_only_ids = set()  # Track head-only detections

    # crossing trackers
    prev_foot = {}  # {id: (x,y)} previous foot coordinate (image space)
    crossed_l1_flag = {}  # {id: bool} whether this id has crossed L1 (in required direction) and not yet used to count
    crossed_l2_counted = {}  # {id: bool} whether this id has already triggered the global count by crossing L2 after L1

    global_counter = 0  # counts completed L1->L2 sequences
    completed_times = []  # for avg time taken

    cap = cv2.VideoCapture(input_video_path)
    if not cap.isOpened():
        raise RuntimeError("Cannot open input video: " + input_video_path)
    fps = int(cap.get(cv2.CAP_PROP_FPS)) or 25  # fall back to 25 when FPS unknown
    width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
    height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
    total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))

    # Output canvas: original frame plus the right-hand summary panel.
    out_w = width + RIGHT_PANEL_W
    out_h = height
    fourcc = cv2.VideoWriter_fourcc(*'MJPG')
    writer = cv2.VideoWriter(output_video_path, fourcc, fps, (out_w, out_h))
    if not writer.isOpened():
        raise RuntimeError("Failed to open VideoWriter. Try different codec or path.")

    # adjust patch scale if too tall for the frame
    PATCH_PATH_local = PATCH_PATH.copy()
    patch_w = PATCH_W
    patch_h = PATCH_H
    patch_scale = PATCH_EXTRAS["scale"]
    if patch_h > height - 40:
        factor = (height - 60) / patch_h
        PATCH_PATH_local = PATCH_PATH_local * factor
        patch_w = int(patch_w * factor)
        patch_h = int(patch_h * factor)
        patch_scale = patch_scale * factor

    # Create homography from POLYGON (image A,B,C,D) to rect corners in patch coordinates (A_p,B_p,C_p,D_p)
    A_p = PATCH_EXTRAS["A"]
    B_p = PATCH_EXTRAS["B"]
    C_p = PATCH_EXTRAS["C"]
    D_p = PATCH_EXTRAS["D"]
    dest_rect = np.array([A_p, B_p, C_p, D_p], dtype=np.float32)
    H_img2patch = cv2.getPerspectiveTransform(POLYGON.astype(np.float32), dest_rect.astype(np.float32))

    start_time = time.time()
    frame_idx = 0

    # precompute line endpoints & ints for visualization and intersection tests
    # NOTE(review): L1/L2 tuples are not referenced below — candidates for removal.
    L1 = (L1_p1, L1_p2)
    L2 = (L2_p1, L2_p2)

    while True:
        ret, frame = cap.read()
        if not ret:
            break
        frame_idx += 1
        progress_bar(frame_idx, total_frames)
        now = time.time()
        vid_seconds = now - start_time  # wall-clock seconds since processing began

        if enhance_frames:
            frame = cv2.fastNlMeansDenoisingColored(frame, None, 5,5,7,21)

        # Person detection + tracking (ByteTrack keeps IDs across frames).
        results = model.track(
            frame,
            persist=True,
            tracker="bytetrack.yaml",
            classes=[PERSON_CLASS],
            conf=conf_threshold,
            iou=0.5,
            imgsz=img_size,
            device=device,
            half=use_gpu,
            verbose=False
        )

        # Head detection (NEW - runs in parallel)
        head_results = head_model(frame, conf=conf_threshold, classes=[HEAD_CLASS], verbose=False)[0]

        # Process head detections
        obb_boxes = []
        obb_scores = []
        obb_data = []
        head_foot_positions = {}  # {estimated_foot_pos: (head_box, conf)}

        if head_results.obb is not None and len(head_results.obb) > 0:
            for obb in head_results.obb:
                xyxyxyxy = obb.xyxyxyxy[0].cpu().numpy()
                conf = float(obb.conf[0])

                if conf < conf_threshold:
                    continue

                obb_boxes.append(xyxyxyxy.flatten().tolist())
                obb_scores.append(conf)
                obb_data.append((xyxyxyxy, conf))

        # Apply NMS to head detections
        if len(obb_boxes) > 0:
            keep_indices = nms_obb(obb_boxes, obb_scores, 0.4)

            for idx in keep_indices:
                xyxyxyxy, conf = obb_data[idx]

                # Convert OBB to axis-aligned bbox
                x_min = int(xyxyxyxy[:, 0].min())
                y_min = int(xyxyxyxy[:, 1].min())
                x_max = int(xyxyxyxy[:, 0].max())
                y_max = int(xyxyxyxy[:, 1].max())

                head_cx = (x_min + x_max) / 2.0
                head_cy = float(y_min)

                # Calculate foot from head
                foot_x, foot_y = calculate_foot_from_head(
                    [x_min, y_min, x_max, y_max],
                    (head_cx, head_cy)
                )

                head_foot_positions[(foot_x, foot_y)] = ((x_min, y_min, x_max, y_max, xyxyxyxy), conf)

        # draw polygon on frame
        cv2.polylines(frame, [POLYGON.astype(np.int32)], True, (255,0,0), 3)

        # draw L1 and L2 on frame (blue)
        cv2.line(frame, tuple(map(int, L1_p1)), tuple(map(int, L1_p2)), (255,180,0), 3)
        cv2.line(frame, tuple(map(int, L2_p1)), tuple(map(int, L2_p2)), (255,180,0), 3)

        right_panel = np.ones((height, RIGHT_PANEL_W, 3), dtype=np.uint8) * 40
        patch = np.ones((patch_h, patch_w, 3), dtype=np.uint8) * 255

        # draw patch structure: rectangle and center divider
        A_px = (int(dest_rect[0][0]), int(dest_rect[0][1]))
        B_px = (int(dest_rect[1][0]), int(dest_rect[1][1]))
        C_px = (int(dest_rect[2][0]), int(dest_rect[2][1]))
        D_px = (int(dest_rect[3][0]), int(dest_rect[3][1]))
        # walls (thick black lines)
        cv2.line(patch, A_px, D_px, (0,0,0), 6) # left
        cv2.line(patch, A_px, B_px, (0,0,0), 6) # bottom
        cv2.line(patch, B_px, C_px, (0,0,0), 6) # right
        cv2.line(patch, D_px, C_px, (0,0,0), 6) # top
        # center divider F->E
        F_px = ( (D_px[0] + C_px[0])//2, D_px[1] )
        E_px = (F_px[0], D_px[1] + int((patch_h) * 0.5))
        cv2.line(patch, F_px, E_px, (0,0,0), 6)
        for p in [A_px, B_px, C_px, D_px, F_px, E_px]:
            cv2.circle(patch, p, 5, (0,0,0), -1)

        # Match person detections with head detections
        person_head_matches = {}  # {person_id: head_foot_pos}
        matched_heads = set()

        b = results[0].boxes
        detected_ids = set()
        current_inside = []
        current_projs = []

        if b is not None and b.id is not None:
            boxes = b.xyxy.cpu().numpy()
            ids = b.id.cpu().numpy().astype(int)
            if bbox_smoother is not None:
                boxes = bbox_smoother.smooth(boxes, ids)

            # First pass: match person detections with head detections
            for box, tid in zip(boxes, ids):
                x1, y1, x2, y2 = map(int, box)
                person_foot_x = float((x1 + x2) / 2.0)
                person_foot_y = float(y2)

                # Find closest head detection within reasonable distance
                best_head = None
                best_dist = 100 # pixels threshold

                for head_foot_pos, (head_box_data, head_conf) in head_foot_positions.items():
                    head_fx, head_fy = head_foot_pos
                    dist = np.sqrt((person_foot_x - head_fx)**2 + (person_foot_y - head_fy)**2)

                    # Check if head is roughly above person bbox (y_head < y_person_top)
                    head_box = head_box_data[:4]
                    if head_box[3] < y1 + 50: # head bottom should be near person top
                        if dist < best_dist and head_foot_pos not in matched_heads:
                            best_dist = dist
                            best_head = head_foot_pos

                if best_head:
                    person_head_matches[tid] = best_head
                    matched_heads.add(best_head)
                    person_only_ids.discard(tid)
                else:
                    person_only_ids.add(tid)


            # Second pass: per-ID zone logic, crossing detection and drawing.
            for box, tid in zip(boxes, ids):
                x1, y1, x2, y2 = map(int, box)

                # Use head-derived foot if available, otherwise use person bbox foot
                if tid in person_head_matches:
                    fx, fy = person_head_matches[tid]
                    head_box_data, head_conf = head_foot_positions[person_head_matches[tid]]
                    head_box = head_box_data[:4]
                    xyxyxyxy = head_box_data[4]
                    # Draw head OBB (cyan for matched detection)
                    points = xyxyxyxy.astype(np.int32)
                    cv2.polylines(frame, [points], True, (255, 255, 0), 2)
                else:
                    fx = float((x1 + x2) / 2.0)
                    fy = float(y2) # bottom center (foot)

                detected_ids.add(tid)
                last_seen[tid] = now

                inside = point_in_polygon(fx, fy, POLYGON)
                prev = inside_state.get(tid, False)

                # maintain prev_foot for intersection tests
                prev_pt = prev_foot.get(tid, None)
                current_pt = (fx, fy)

                # Crossing detection for L1
                if prev_pt is not None:
                    # check intersection with L1
                    inter_l1 = segment_intersects(prev_pt, current_pt, L1_p1, L1_p2)
                    if inter_l1:
                        # check direction: we want prev_sign != curr_sign and curr_sign == inside sign
                        prev_sign = np.sign(signed_dist_to_line(prev_pt, L1_coeff))
                        curr_sign = np.sign(signed_dist_to_line(current_pt, L1_coeff))
                        if prev_sign == 0:
                            prev_sign = -curr_sign if curr_sign != 0 else 1.0
                        if curr_sign == 0:
                            curr_sign = prev_sign
                        if prev_sign != curr_sign and curr_sign == L1_inside_sign:
                            # crossed L1 in correct direction (outside -> inside)
                            crossed_l1_flag[tid] = True

                    # check intersection with L2
                    inter_l2 = segment_intersects(prev_pt, current_pt, L2_p1, L2_p2)
                    if inter_l2:
                        prev_sign = np.sign(signed_dist_to_line(prev_pt, L2_coeff))
                        curr_sign = np.sign(signed_dist_to_line(current_pt, L2_coeff))
                        if prev_sign == 0:
                            prev_sign = -curr_sign if curr_sign != 0 else 1.0
                        if curr_sign == 0:
                            curr_sign = prev_sign
                        if prev_sign != curr_sign and curr_sign == L2_inside_sign:
                            # crossed L2 in correct direction; if previously crossed L1 and not yet counted => count
                            if crossed_l1_flag.get(tid, False) and not crossed_l2_counted.get(tid, False):
                                global_counter += 1
                                crossed_l2_counted[tid] = True
                                # once person completed crossing sequence, we keep their travel/time records intact
                # update prev_foot
                prev_foot[tid] = current_pt

                # Outside -> inside transition starts (or resumes) the timer.
                if inside and not prev:
                    inside_state[tid] = True
                    if tid not in entry_time:
                        entry_time[tid] = now
                    if tid not in first_entry_vid:
                        first_entry_vid[tid] = vid_seconds

                if tid not in accumulated_time:
                    accumulated_time[tid] = 0.0
                if tid not in travel_distance:
                    travel_distance[tid] = 0.0

                # draw bbox only for inside persons
                if inside:
                    # Green if matched with head, yellow if person-only
                    color = (0, 200, 0) if tid in person_head_matches else (0, 200, 200)
                    cv2.rectangle(frame, (x1,y1), (x2,y2), color, 2)
                    cv2.putText(frame, f"ID {tid}", (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.8, color, 2)

                    # map foot point through homography to patch coordinates (this is the key)
                    pt_img = np.array([[[fx, fy]]], dtype=np.float32)
                    mapped = cv2.perspectiveTransform(pt_img, H_img2patch)[0][0]
                    mx = float(np.clip(mapped[0], 0, patch_w - 1))
                    my = float(np.clip(mapped[1], 0, patch_h - 1))

                    # smooth display position (exponential moving average)
                    if tid in display_pos:
                        px_prev, py_prev = display_pos[tid]
                        sx = SMOOTH_ALPHA
                        dx = px_prev*(1 - sx) + mx*sx
                        dy = py_prev*(1 - sx) + my*sx
                    else:
                        dx, dy = mx, my
                    display_pos[tid] = (dx, dy)
                    current_inside.append(tid)

                    # compute along_m using image-based method for metric consistency
                    along_m = image_point_to_along_m((fx, fy))
                    current_projs.append((tid, along_m))

                    # initialize prev_along if first time
                    if tid not in prev_along:
                        prev_along[tid] = along_m
                        entry_along[tid] = along_m
                        prev_time[tid] = now

                    # compute forward-only travel distance (backward motion ignored)
                    delta = along_m - prev_along.get(tid, along_m)
                    if delta > 0:
                        travel_distance[tid] += delta
                    prev_along[tid] = along_m
                    prev_time[tid] = now

        # Head-only recovery: reattach unmatched heads to recently-lost IDs.
        for head_foot_pos, (head_box_data, head_conf) in head_foot_positions.items():
            if head_foot_pos in matched_heads:
                continue # Already matched with a person

            fx, fy = head_foot_pos

            # Only process if inside polygon
            if not point_in_polygon(fx, fy, POLYGON):
                continue

            # Try to match with existing tracked IDs by proximity
            matched_existing = False
            for tid in list(inside_state.keys()):
                if tid in detected_ids:
                    continue # Already detected this frame

                if tid in display_pos:
                    prev_x, prev_y = display_pos[tid]
                    # Check if head is near previous position
                    # NOTE(review): display_pos is in patch coordinates while
                    # (fx, fy) is in image coordinates — confirm this distance
                    # comparison is intended.
                    dist = np.sqrt((fx - prev_x)**2 + (fy - prev_y)**2)
                    if dist < 80: # pixels threshold
                        # Reactivate this ID using head detection
                        detected_ids.add(tid)
                        last_seen[tid] = now
                        prev_foot[tid] = (fx, fy)
                        matched_existing = True
                        head_only_ids.add(tid)

                        # Draw head detection (red for head-only recovery)
                        head_box = head_box_data[:4]
                        xyxyxyxy = head_box_data[4]
                        points = xyxyxyxy.astype(np.int32)
                        cv2.polylines(frame, [points], True, (0, 0, 255), 2)
                        cv2.putText(frame, f"ID {tid} (H)", (int(head_box[0]), int(head_box[1]) - 10),
                                    cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 255), 2)

                        # Continue tracking
                        inside_state[tid] = True
                        current_inside.append(tid)

                        # Map through homography
                        pt_img = np.array([[[fx, fy]]], dtype=np.float32)
                        mapped = cv2.perspectiveTransform(pt_img, H_img2patch)[0][0]
                        mx = float(np.clip(mapped[0], 0, patch_w - 1))
                        my = float(np.clip(mapped[1], 0, patch_h - 1))

                        # Smooth display position
                        if tid in display_pos:
                            px_prev, py_prev = display_pos[tid]
                            sx = SMOOTH_ALPHA
                            dx = px_prev*(1 - sx) + mx*sx
                            dy = py_prev*(1 - sx) + my*sx
                        else:
                            dx, dy = mx, my
                        display_pos[tid] = (dx, dy)

                        # Track travel distance
                        along_m = image_point_to_along_m((fx, fy))
                        current_projs.append((tid, along_m))

                        if tid not in prev_along:
                            prev_along[tid] = along_m
                            entry_along[tid] = along_m
                            prev_time[tid] = now

                        delta = along_m - prev_along.get(tid, along_m)
                        if delta > 0:
                            travel_distance[tid] += delta
                        prev_along[tid] = along_m
                        prev_time[tid] = now

                        break

        # finalize exits after missing timeout
        known_ids = set(list(inside_state.keys()) + list(last_seen.keys()))
        for tid in list(known_ids):
            if inside_state.get(tid, False) and tid not in detected_ids:
                ls = last_seen.get(tid, None)
                if ls is None:
                    continue
                missing = now - ls
                if missing > missing_timeout:
                    inside_state[tid] = False
                    if tid in entry_time:
                        accumulated_time[tid] += now - entry_time[tid]
                        # record last exit time in video seconds (use last seen time)
                        last_exit_vid[tid] = ls - start_time
                        completed_times.append(accumulated_time[tid])
                        entry_time.pop(tid, None)
                else:
                    # within occlusion grace window -> keep inside state
                    pass

        # Reappearance inheritance logic (same as prior): copy neighbor state if ID lost & reappears
        current_projs_map = {tid: a for tid, a in current_projs}
        for tid, along in current_projs:
            if tid in prev_along:
                continue
            candidates = []
            for other_tid, other_al in current_projs_map.items():
                if other_tid == tid:
                    continue
                candidates.append((other_tid, other_al))
            if not candidates and prev_along:
                candidates = [(other_tid, prev_along_val) for other_tid, prev_along_val in prev_along.items() if other_tid != tid]
            if not candidates:
                prev_along[tid] = along
                entry_along.setdefault(tid, along)
                prev_time[tid] = now
                continue
            neighbor_tid, neighbor_al = min(candidates, key=lambda x: abs(x[1] - along))
            if abs(neighbor_al - along) < max(0.5, sum(SEG_REAL_M)*0.5):
                # Inherit the nearest neighbor's along-path state and timers.
                prev_along[tid] = prev_along.get(neighbor_tid, neighbor_al)
                entry_along[tid] = entry_along.get(neighbor_tid, neighbor_al)
                prev_time[tid] = now
                accumulated_time[tid] = accumulated_time.get(neighbor_tid, 0.0)
                if neighbor_tid in entry_time:
                    entry_time[tid] = entry_time[neighbor_tid]
                else:
                    entry_time[tid] = now - accumulated_time[tid]
                # also inherit crossed L1/L2 flags if neighbor had them (helps maintain global count consistency)
                if crossed_l1_flag.get(neighbor_tid, False) and not crossed_l1_flag.get(tid, False):
                    crossed_l1_flag[tid] = True
                if crossed_l2_counted.get(neighbor_tid, False) and not crossed_l2_counted.get(tid, False):
                    crossed_l2_counted[tid] = True
            else:
                prev_along[tid] = along
                entry_along.setdefault(tid, along)
                prev_time[tid] = now

        # build display list sorted by along for consistent ordering
        disp = []
        for tid in current_inside:
            if tid not in display_pos:
                continue
            dx, dy = display_pos[tid]
            cur_al = prev_along.get(tid, entry_along.get(tid, 0.0))
            t_inside = int(now - entry_time[tid]) if tid in entry_time else int(accumulated_time.get(tid, 0.0))
            trav = travel_distance.get(tid, 0.0)
            disp.append((tid, int(round(dx)), int(round(dy)), t_inside, trav, cur_al))
        disp.sort(key=lambda x: x[5]) # by along

        # draw patch dots and labels (no velocity)
        for tid, xi, yi, t_inside, trav, _ in disp:
            cv2.circle(patch, (xi, yi), 6, (0,0,255), -1)
            cv2.putText(patch, f"ID {tid}", (xi+8, yi-8), cv2.FONT_HERSHEY_SIMPLEX, 0.45, (0,0,0), 1)
            cv2.putText(patch, f"{t_inside}s {trav:.2f}m", (xi+8, yi+8), cv2.FONT_HERSHEY_SIMPLEX, 0.4, (0,0,0), 1)

        # compute avg time taken from completed_times
        avg_time_taken = float(np.mean(completed_times)) if len(completed_times) > 0 else 0.0

        # top-right summary: show both counters
        panel_h, panel_w = 220, 350
        panel = np.ones((panel_h, panel_w, 3), dtype=np.uint8) * 255
        cv2.putText(panel, "Zone Summary", (12, 24), cv2.FONT_HERSHEY_SIMPLEX, 0.8, (0,0,0), 2)
        cv2.putText(panel, f"Inside count: {len(disp)}", (12, 58), cv2.FONT_HERSHEY_SIMPLEX, 0.9, (0,120,0), 2)
        cv2.putText(panel, f"Global count: {global_counter}", (12, 92), cv2.FONT_HERSHEY_SIMPLEX, 0.8, (0,0,128), 2)
        cv2.putText(panel, f"Avg time taken: {int(avg_time_taken)}s", (12, 126), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0,0,0), 2)

        yv = 150
        for tid, _, _, t_inside, trav, _ in disp[:8]:
            cv2.putText(panel, f"ID {tid}: {t_inside}s, {trav:.2f}m", (12, yv), cv2.FONT_HERSHEY_SIMPLEX, 0.55, (50,50,50), 1)
            yv += 18

        final = np.hstack((frame, right_panel))
        # place panel top-right inside right panel
        panel_x = width + (RIGHT_PANEL_W - panel_w)//2
        panel_y = 10
        final[panel_y:panel_y+panel_h, panel_x:panel_x+panel_w] = panel

        # place patch below panel
        patch_x = width + (RIGHT_PANEL_W - patch_w)//2
        patch_y = panel_y + panel_h + 10
        if patch_y + patch_h > height:
            patch_y = height - patch_h - 10
        final[patch_y:patch_y+patch_h, patch_x:patch_x+patch_w] = patch

        writer.write(np.ascontiguousarray(final))

    # finalize: close out timers for everyone still "inside" at end of video
    end_t = time.time()
    for tid in list(entry_time.keys()):
        accumulated_time[tid] += end_t - entry_time[tid]
        last_exit_vid[tid] = last_seen.get(tid, end_t) - start_time
        completed_times.append(accumulated_time[tid])
        entry_time.pop(tid, None)
        inside_state[tid] = False

    cap.release()
    writer.release()

    # export excel (only >0)
    rows = []
    for tid, tot in accumulated_time.items():
        if tot <= 0:
            continue
        tin = first_entry_vid.get(tid, 0.0)
        tout = last_exit_vid.get(tid, tin)
        rows.append({
            "Passenger": int(tid),
            "Time in": fmt(tin),
            "Time out": fmt(tout),
            "Time in queue (seconds)": round(float(tot), 2)
        })
    df = pd.DataFrame(rows, columns=["Passenger","Time in","Time out","Time in queue (seconds)"])
    if len(df) > 0:
        df.to_excel("person_times.xlsx", index=False)
    else:
        pd.DataFrame(columns=["Passenger","Time in","Time out","Time in queue (seconds)"]).to_excel("person_times.xlsx", index=False)

    print("\nFinished. Output:", os.path.abspath(output_video_path))
    print("Saved times:", os.path.abspath("person_times.xlsx"))
803
+
804
# ---------------- Runner
if __name__ == "__main__":
    # All tunables in one place; keys mirror process_video() parameter names
    # exactly, so the dict can be unpacked straight into the call.
    CONFIG = {
        'input_video_path': "sample_vid.mp4",
        'output_video_path': "output22.avi",
        'model_name': "yolo11x.pt",
        'head_model_name': "head_detection_single_video_best.pt",
        'conf_threshold': 0.3,
        'img_size': 1280,
        'use_gpu': True,
        'enhance_frames': False,
        'smooth_bbox_tracks': True,
        'missing_timeout': 3.0
    }
    process_video(**CONFIG)
yolo11x.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bc158aa95c0ebfdd87f70f01653c1131b93e92522dbe15c228bcd742e773a24
3
+ size 114636239