Spaces:

chanelcolgate
/

demo-counting

Runtime error

App Files Files Community

chanelcolgate committed on May 23, 2024

Commit

55f0564

1 Parent(s): a458541

init

Browse files

Files changed (13) hide show

.gitignore +4 -0
app.py +291 -0
images/62167111_jpg.rf.a28be3ccf9faa13da52aa007a7f7ed7a.jpg +0 -0
images/A1A37A49_jpg.rf.43566e5df62b02365ced4a5bd5e21f47.jpg +0 -0
images/A2A2E11D_jpg.rf.b366674522f576b023f5fbe116993eb7.jpg +0 -0
images/A3EEA8A1_jpg.rf.f66d063ebbf0fe0ccc969198c6eaab63.jpg +0 -0
images/A48928D0_jpg.rf.7926dbc20dfd480327a6ff81cfc69961.jpg +0 -0
images/A49FFA35_jpg.rf.44ef65e540674b2bfc40361ec77569ea.jpg +0 -0
images/A6EE237B_jpg.rf.92877f1bc68547a947773e58d62dd59d.jpg +0 -0
images/A6F01C78_jpg.rf.3f74c020ece68222d8221abcda7b6461.jpg +0 -0
images/A8658634_jpg.rf.52fc338e7cb1c1ba92322299ae32ce2b.jpg +0 -0
images/ABB2195A_jpg.rf.4f96f89ee3348fb7ee8cdf77e026998a.jpg +0 -0
requirements.txt +6 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,4 @@

+.git/
+flagged/
+gradio_cached_examples/
+yolov8n.pt

app.py ADDED Viewed

	@@ -0,0 +1,291 @@

+import os
+import glob
+import uuid
+import gradio as gr
+from PIL import Image
+import cv2
+import numpy as np
+import supervision as sv
+from ultralyticsplus import YOLO, download_from_hub
# Hugging Face Hub model ids offered in every model dropdown.
hf_model_ids = ["chanelcolgate/rods-count-v1", "chanelcolgate/cab-v1"]

# Example rows for the image tab: [image, model id, image size, conf, iou].
# The model id is taken from ``hf_model_ids`` so it can never drift from the
# dropdown choices (the previous literal was misspelled "rods-cout-v1", which
# is not a selectable model and cannot be downloaded when examples are cached).
# ``sorted`` keeps the example order stable, since glob order is arbitrary.
image_paths = [
    [image_path, hf_model_ids[0], 640, 0.6, 0.45]
    for image_path in sorted(glob.glob("./images/*.jpg"))
]

# Example rows for the video tabs: [video, model id].
video_paths = [
    [video_path, hf_model_ids[1]]
    for video_path in sorted(glob.glob("./videos/*.mp4"))
]
def get_center_of_bbox(bbox):
    """Return the integer ``(x, y)`` midpoint of an ``(x1, y1, x2, y2)`` box.

    Each coordinate is the mean of the two opposite edges, truncated toward
    zero by ``int``.
    """
    left, top, right, bottom = bbox
    center_x = int((left + right) / 2)
    center_y = int((top + bottom) / 2)
    return center_x, center_y
def get_bbox_width(bbox):
    """Return the horizontal extent of a box as an int (``bbox[2] - bbox[0]``)."""
    right_edge = bbox[2]
    left_edge = bbox[0]
    return int(right_edge - left_edge)
def draw_circle(pil_image, bbox, color, id):
    """Draw a numbered circle marker for one bounding box on a PIL image.

    The image is copied into a NumPy array, so the input image itself is not
    modified; a new PIL image is returned.

    Args:
        pil_image: Source PIL image (converted with ``COLOR_RGB2BGR``, so it
            is treated as RGB).
        bbox: Box as ``(x1, y1, x2, y2)``.
        color: Circle colour. It is applied to the BGR working buffer, so the
            tuple is interpreted in BGR channel order.
        id: Value rendered as the text label near the box centre.

    Returns:
        A new PIL image with the circle and label drawn.
    """
    # OpenCV draws on BGR arrays, so swap channels for the working buffer.
    canvas = cv2.cvtColor(np.array(pil_image), cv2.COLOR_RGB2BGR)

    center_x, center_y = get_center_of_bbox(bbox)
    # Circle radius is 60% of half the box width.
    radius = int(get_bbox_width(bbox) * 0.5 * 0.6)

    cv2.circle(
        canvas,
        center=(center_x, center_y),
        radius=radius,
        color=color,
        thickness=1,
    )

    # Small fixed offset so the label sits roughly on the centre point.
    label_origin = (center_x - 6, center_y + 6)
    cv2.putText(
        canvas,
        f"{id}",
        label_origin,
        cv2.FONT_HERSHEY_SIMPLEX,
        0.5,
        (255, 249, 208),
        2,
    )

    # Swap channels back before handing the result to PIL.
    return Image.fromarray(cv2.cvtColor(canvas, cv2.COLOR_BGR2RGB))
def count_predictions(
    image=None,
    hf_model_id="chanelcolgate/rods-count-v1",
    image_size=640,
    conf_threshold=0.25,
    iou_threshold=0.45,
):
    """Detect objects in an image, number each detection, and count them.

    Args:
        image: PIL image to run detection on.
        hf_model_id: Hugging Face Hub id of the model to download and load.
            A falsy value (e.g. an unselected dropdown) falls back to the
            default model.
        image_size: Inference size, forwarded to the model as ``imgsz``.
        conf_threshold: Confidence threshold, forwarded as ``conf``.
        iou_threshold: IoU threshold, forwarded as ``iou``.

    Returns:
        A tuple ``(annotated_image, count)`` where ``annotated_image`` is the
        image with one numbered circle per detection and ``count`` is the
        number of detections. With zero detections the input image is
        returned unchanged.

    Raises:
        gr.Error: If no image was provided.
    """
    if image is None:
        raise gr.Error("Please provide an image.")
    # The dropdown passes None when nothing is selected.
    hf_model_id = hf_model_id or "chanelcolgate/rods-count-v1"

    model = YOLO(download_from_hub(hf_model_id))
    results = model(
        image,
        imgsz=int(image_size),  # sliders may deliver a float
        conf=conf_threshold,
        iou=iou_threshold,
    )
    detections = sv.Detections.from_ultralytics(results[0])

    # draw_circle returns a new image each time, so no defensive copy of the
    # input is needed per detection.
    annotated = image
    for number, bbox in enumerate(detections.xyxy.tolist(), start=1):
        annotated = draw_circle(annotated, bbox, (90, 178, 255), number)
    return annotated, len(detections)
def count_across_line(
    source_video_path=None,
    hf_model_id="chanelcolgate/cab-v1",
):
    """Track objects through a video and count crossings of a fixed line.

    Every frame is run through the detector and a ByteTrack tracker, then
    annotated with traces, boxes and the counting line, and written to a new
    uniquely named ``.mp4`` in the current working directory.

    Args:
        source_video_path: Path of the input video.
        hf_model_id: Hugging Face Hub id of the model to download and load.
            A falsy value (e.g. an unselected dropdown) falls back to the
            default model.

    Returns:
        A tuple ``(target_video_path, out_count)`` with the path of the
        annotated video and the line zone's ``out_count`` after the last
        frame.

    Raises:
        gr.Error: If no video was provided.
    """
    if not source_video_path:
        raise gr.Error("Please provide a video.")
    # The dropdown passes None when nothing is selected.
    hf_model_id = hf_model_id or "chanelcolgate/cab-v1"

    target_video_path = os.path.join("./", f"{uuid.uuid4()}.mp4")
    # Vertical counting line in pixel coordinates.
    # NOTE(review): hard-coded, so presumably tuned for one camera resolution.
    line_start = sv.Point(976, 212)
    line_end = sv.Point(976, 1276)

    model = YOLO(download_from_hub(hf_model_id))
    byte_tracker = sv.ByteTrack(
        track_thresh=0.25, track_buffer=30, match_thresh=0.8, frame_rate=30
    )
    line_zone = sv.LineZone(start=line_start, end=line_end)
    box_annotator = sv.BoxAnnotator(thickness=4, text_thickness=4, text_scale=2)
    trace_annotator = sv.TraceAnnotator(thickness=4, trace_length=50)
    line_zone_annotator = sv.LineZoneAnnotator(
        thickness=4, text_thickness=4, text_scale=2
    )

    def callback(frame: np.ndarray, index: int) -> np.ndarray:
        """Detect, track and annotate a single frame; update the line count."""
        results = model.predict(frame)
        detections = sv.Detections.from_ultralytics(results[0])
        tracked = byte_tracker.update_with_detections(detections)

        # Draw on a copy so the source frame is left untouched.
        annotated_frame = trace_annotator.annotate(
            scene=frame.copy(), detections=tracked
        )
        annotated_frame = box_annotator.annotate(
            scene=annotated_frame,
            detections=tracked,
            skip_label=True,
        )
        # Update the crossing counters before drawing them.
        line_zone.trigger(tracked)
        return line_zone_annotator.annotate(
            annotated_frame, line_counter=line_zone
        )

    # Process the whole video frame by frame.
    sv.process_video(
        source_path=source_video_path,
        target_path=target_video_path,
        callback=callback,
    )
    return target_video_path, line_zone.out_count
def count_in_zone(
    source_video_path=None,
    hf_model_id="chanelcolgate/cab-v1",
):
    """Track objects through a video and count those inside fixed zones.

    Every frame is run through the detector and a ByteTrack tracker. For each
    polygon zone, the detections inside that zone are boxed in the zone's
    colour and the zone itself is drawn. The result is written to a new
    uniquely named ``.mp4`` in the current working directory.

    Args:
        source_video_path: Path of the input video.
        hf_model_id: Hugging Face Hub id of the model to download and load.
            A falsy value (e.g. an unselected dropdown) falls back to the
            default model.

    Returns:
        A tuple ``(target_video_path, counts)`` where ``counts`` lists each
        zone's ``current_count`` after the last processed frame.

    Raises:
        gr.Error: If no video was provided.
    """
    if not source_video_path:
        raise gr.Error("Please provide a video.")
    # The dropdown passes None when nothing is selected.
    hf_model_id = hf_model_id or "chanelcolgate/cab-v1"

    target_video_path = os.path.join("./", f"{uuid.uuid4()}.mp4")
    colors = sv.ColorPalette.default()
    # Zone outlines in pixel coordinates.
    # NOTE(review): hard-coded, so presumably tuned for one camera resolution.
    polygons = [
        np.array([[88, 292], [748, 284], [736, 1160], [96, 1148]]),
        np.array([[844, 240], [844, 1132], [1580, 1124], [1584, 264]]),
    ]

    model = YOLO(download_from_hub(hf_model_id))
    byte_tracker = sv.ByteTrack(
        track_thresh=0.25, track_buffer=30, match_thresh=0.8, frame_rate=30
    )
    video_info = sv.VideoInfo.from_video_path(source_video_path)

    zones = [
        sv.PolygonZone(
            polygon=polygon, frame_resolution_wh=video_info.resolution_wh
        )
        for polygon in polygons
    ]
    zone_annotators = [
        sv.PolygonZoneAnnotator(
            zone=zone,
            color=colors.by_idx(index),
            thickness=4,
            text_thickness=4,
            text_scale=2,
        )
        for index, zone in enumerate(zones)
    ]
    box_annotators = [
        sv.BoxAnnotator(
            thickness=4,
            text_thickness=4,
            text_scale=2,
            color=colors.by_idx(index),
        )
        for index in range(len(polygons))
    ]

    def callback(frame: np.ndarray, index: int) -> np.ndarray:
        """Detect, track and annotate a single frame, zone by zone."""
        results = model.predict(frame)
        detections = sv.Detections.from_ultralytics(results[0])
        tracked = byte_tracker.update_with_detections(detections)

        for zone, zone_annotator, box_annotator in zip(
            zones, zone_annotators, box_annotators
        ):
            # trigger() updates the zone count and returns a mask of the
            # detections inside the zone; box only those so each object is
            # drawn in the colour of the zone it is in.
            in_zone_mask = zone.trigger(detections=tracked)
            frame = box_annotator.annotate(
                scene=frame,
                detections=tracked[in_zone_mask],
                skip_label=True,
            )
            frame = zone_annotator.annotate(scene=frame)
        return frame

    sv.process_video(
        source_path=source_video_path,
        target_path=target_video_path,
        callback=callback,
    )
    return target_video_path, [zone.current_count for zone in zones]
# Title shown above the tabbed application.
title = "Demo Counting"

# Tab 1: count detections in a single image.
interface_count_predictions = gr.Interface(
    fn=count_predictions,
    inputs=[
        gr.Image(type="pil"),
        # Preselect a model so the callback never receives None.
        gr.Dropdown(
            hf_model_ids, value="chanelcolgate/rods-count-v1", label="Model"
        ),
        gr.Slider(
            minimum=320, maximum=1280, value=640, step=32, label="Image Size"
        ),
        gr.Slider(
            minimum=0.0,
            maximum=1.0,
            value=0.25,
            step=0.05,
            label="Confidence Threshold",
        ),
        gr.Slider(
            minimum=0.0,
            maximum=1.0,
            value=0.45,
            step=0.05,
            label="IOU Threshold",
        ),
    ],
    outputs=[gr.Image(type="pil"), gr.Textbox(show_label=False)],
    title="Count Predictions",
    examples=image_paths,
    # Only cache when there is at least one example to run.
    cache_examples=bool(image_paths),
)

# Tab 2: count tracked objects crossing a line in a video.
interface_count_across_line = gr.Interface(
    fn=count_across_line,
    inputs=[
        gr.Video(label="Input Video"),
        gr.Dropdown(hf_model_ids, value="chanelcolgate/cab-v1", label="Model"),
    ],
    outputs=[gr.Video(label="Output Video"), gr.Textbox(show_label=False)],
    title="Count Across Line",
    examples=video_paths,
    cache_examples=bool(video_paths),
)

# Tab 3: count tracked objects inside polygon zones in a video.
interface_count_in_zone = gr.Interface(
    fn=count_in_zone,
    inputs=[
        gr.Video(label="Input Video"),
        gr.Dropdown(hf_model_ids, value="chanelcolgate/cab-v1", label="Model"),
    ],
    outputs=[gr.Video(label="Output Video"), gr.Textbox(show_label=False)],
    title="Count in Zone",
    examples=video_paths,
    cache_examples=bool(video_paths),
)

# Combine the three interfaces into one app, enable queuing, and start it.
gr.TabbedInterface(
    [
        interface_count_predictions,
        interface_count_across_line,
        interface_count_in_zone,
    ],
    tab_names=["Count Predictions", "Count Across Line", "Count in Zone"],
    title=title,
).queue().launch()