Spaces:

CuriousDolphin
/

YoloGP

Sleeping

+from pytube import YouTube
+import gradio as gr
+from pathlib import Path
+import os
+from supervision import (
+    ImageSink,
+    get_video_frames_generator,
+    list_files_with_extensions,
+)
+from tqdm import tqdm
+from helpers import zoom_center
+import shutil
+# Root folder for downloaded videos, extracted frame folders and zip archives:
+# the "data" directory located one level above the folder containing this file.
+data_path = Path(__file__).parent.parent / "data"
+# Logged once at import time so the resolved location shows up in the app logs.
+print("DATA PATH: ", data_path)
+def download_youtube_url(url, out_dir) -> str:
+    yt = YouTube(url=url)
+    files = yt.streams.filter(file_extension="mp4", only_video=True)
+    itag = files[0].itag
+    video = yt.streams.get_by_itag(int(itag))
+    path = video.download(output_path=out_dir)
+    return path
+def extract_frames(
+    url,
+    video_path,
+    stride,
+    start,
+    end,
+    resize_w,
+    zoom,
+    progress=gr.Progress(track_tqdm=True),
+):
+    if video_path is not None:
+        v_path = Path(video_path.name)
+    elif len(url) > 0:
+        progress(0.1, "Downloading..")
+        d_path = download_youtube_url(url, data_path)
+        v_path = Path(d_path)
+    print("video path:", v_path)
+    video_name = str(v_path.stem).replace(" ", "")
+    target_dir = Path(f"{data_path}/{video_name}_frames")
+    cont = 0
+    with ImageSink(
+        target_dir_path=target_dir,
+        image_name_pattern="image_{:05d}.jpg",
+        overwrite=True,
+    ) as sink:
+        for image in tqdm(
+            get_video_frames_generator(
+                source_path=str(v_path), stride=stride, start=start
+            )
+        ):
+            if zoom > 1:
+                image = zoom_center(img=image.copy(), zoom_factor=zoom)
+            sink.save_image(image=image.copy())
+            cont += 1
+    progress(0.8, "Zipping..")
+    print("Target_dir", target_dir)
+    frames = list_files_with_extensions(directory=target_dir, extensions=["jpg", "png"])
+    print(len(frames))
+    archive_ = shutil.make_archive(
+        target_dir,
+        "zip",
+        target_dir,
+    )
+    print(archive_)
+    v_path.unlink()
+    return frames[0:10], [archive_]
+inputs = [
+    gr.Textbox(label="Youtube_url"),
+    gr.File(label="mp4 or mov", file_types=["video"]),
+    gr.Slider(label="Stride", value=60, maximum=1200),
+    gr.Number(label="Start Frame", value=0),
+    gr.Number(label="End Frame", value=-1),
+    gr.Number(label="Resize Width (px)", value=-1),
+    gr.Slider(label="Image Zoom", minimum=1.0, maximum=2.99, value=1.4),
+]
+outputs = [gr.Gallery(label="preview"), gr.File()]
+interface = gr.Interface(
+    fn=extract_frames,
+    inputs=inputs,
+    outputs=outputs,
+    examples=[["https://www.youtube.com/watch?v=XDhjS_fzhsQ"]],
+    allow_flagging=False,
+)
+if __name__ == "__main__":
+    interface.queue(max_size=10).launch(server_name="0.0.0.0")

yologp/inference_gradio_app.py CHANGED Viewed

@@ -24,9 +24,9 @@ classes = ["curb", "curb", "helmet", "wheel", "moto", "moto", "rider", "road"]
 selected_classes = [0, 2, 3, 5, 6]
-def inference(image, progress=gr.Progress()):
     frame = cv2.resize(image, (960, 640))
-    res = model(frame, imgsz=(960, 640), conf=0.3, iou=0.4)[0]
     detections = sv.Detections.from_ultralytics(res)
     detections = detections[np.isin(detections.class_id, selected_classes)]
     if len(detections) > 0:
@@ -45,7 +45,11 @@ with gr.Blocks() as inference_app:
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            button = gr.Button(variant="primary")
             examples = gr.Examples(
                 examples=[
                     ["./assets/Rossi_Lorenzo_Catalunya2009.png"],
@@ -56,8 +60,7 @@ with gr.Blocks() as inference_app:
         with gr.Column():
             output_im = gr.Image()
-    button.click(fn=inference, inputs=[image], outputs=output_im)
 if __name__ == "__main__":
     inference_app.queue(max_size=10).launch(server_name="0.0.0.0")

 selected_classes = [0, 2, 3, 5, 6]
+def inference(image, conf: float, iou: float, progress=gr.Progress()):
     frame = cv2.resize(image, (960, 640))
+    res = model(frame, imgsz=(960, 640), conf=conf, iou=iou)[0]
     detections = sv.Detections.from_ultralytics(res)
     detections = detections[np.isin(detections.class_id, selected_classes)]
     if len(detections) > 0:
     with gr.Row():
         with gr.Column():
             image = gr.Image()
+            conf = gr.Slider(label="Confidence", minimum=0, maximum=0.99, value=0.3)
+            iou = gr.Slider(label="IoU", minimum=0, maximum=0.99, value=0.45)
+            with gr.Row():
+                button = gr.Button(variant="primary")
             examples = gr.Examples(
                 examples=[
                     ["./assets/Rossi_Lorenzo_Catalunya2009.png"],
         with gr.Column():
             output_im = gr.Image()
+    button.click(fn=inference, inputs=[image, conf, iou], outputs=output_im)
 if __name__ == "__main__":
     inference_app.queue(max_size=10).launch(server_name="0.0.0.0")

yologp/live_inference.py CHANGED Viewed

@@ -39,7 +39,7 @@ while True:
         frame = cv2.resize(frame, (960, 640))
         res = model(frame, imgsz=(960, 640), conf=0.25, iou=0.45)[0]
         if len(res) > 0:
-            detections = sv.Detections.from_yolov8(res)
             detections = detections[np.isin(detections.class_id, selected_classes)]
             helmets_wheel = detections[np.isin(detections.class_id, [2, 3, 4])]
             curbs = detections[np.isin(detections.class_id, [0, 1, 7])]

         frame = cv2.resize(frame, (960, 640))
         res = model(frame, imgsz=(960, 640), conf=0.25, iou=0.45)[0]
         if len(res) > 0:
+            detections = sv.Detections.from_ultralytics(res)
             detections = detections[np.isin(detections.class_id, selected_classes)]
             helmets_wheel = detections[np.isin(detections.class_id, [2, 3, 4])]
             curbs = detections[np.isin(detections.class_id, [0, 1, 7])]