Spaces:

damndeepesh
/

QuickTrack

Sleeping

App Files Files Community

damndeepesh committed on Mar 18, 2025

Commit

9de653a

verified ·

1 Parent(s): 2b91ee4

Uploaded Project Files

Browse files

Files changed (8) hide show

.gitattributes +2 -0
LICENSE +201 -0
README copy.md +165 -0
app.py +313 -0
asset/ezgif-5-12682faad5.gif +3 -0
asset/ezgif-5-28a1705b9b.gif +3 -0
detection_utils.py +245 -0
requirements.txt +7 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+asset/ezgif-5-12682faad5.gif filter=lfs diff=lfs merge=lfs -text
+asset/ezgif-5-28a1705b9b.gif filter=lfs diff=lfs merge=lfs -text

LICENSE ADDED Viewed

	@@ -0,0 +1,201 @@

+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+   1. Definitions.
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+   END OF TERMS AND CONDITIONS
+   APPENDIX: How to apply the Apache License to your work.
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+   Copyright [yyyy] [name of copyright owner]
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+       http://www.apache.org/licenses/LICENSE-2.0
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.

README copy.md ADDED Viewed

	@@ -0,0 +1,165 @@

+# Real-Time Object Detection with YOLOv8
+A Streamlit-based web application for real-time object detection in videos using YOLOv8. This application supports multiple YOLO models, real-time detection, object tracking, and video processing with annotated output.
+## Demo
+![me](https://github.com/damndeepesh/QuickTrack/blob/main/asset/ezgif-5-12682faad5.gif)
+![me](https://github.com/damndeepesh/QuickTrack/blob/main/asset/ezgif-5-28a1705b9b.gif)
+## Features
+- Multiple YOLOv8 model support (Nano to XLarge)
+- Real-time object detection and tracking
+- Support for video files and live streams
+- Unique ID tracking for detected objects
+- Customizable detection confidence
+- Color-coded object categories
+- Downloadable processed videos
+- Interactive web interface
+## Installation
+### Prerequisites
+- Python 3.8 or higher
+- CUDA-compatible GPU (optional, but recommended for better performance)
+### Step 1: Clone the Repository
+- `git clone <repository-url>`
+- `cd <repository-name>`
+### Step 2: Create a Virtual Environment (Recommended)
+#### Windows
+- `python -m venv venv`
+- `venv\Scripts\activate`
+#### Linux/Mac
+- `python3 -m venv venv`
+- `source venv/bin/activate`
+### Step 3: Install Dependencies
+- `pip install -r requirements.txt`
+## Usage
+### Starting the Application
+- `streamlit run app.py`
+### Step-by-Step Guide
+1. **Select a Model**:
+   - Choose from available YOLOv8 models in the sidebar
+   - Models range from Nano (fastest) to XLarge (most accurate)
+   - Review model details in the expandable section
+   - Click "Load Selected Model" to download and initialize
+2. **Configure Settings**:
+   - Adjust detection confidence using the slider
+   - Lower values detect more objects but may increase false positives
+   - Higher values are more selective but might miss some objects
+3. **Input Selection**:
+   - Choose between "Video File" or "Live Stream URL"
+   - For video files: Upload MP4 or AVI format
+   - For streams: Enter a valid stream URL
+4. **Start Detection**:
+   - Click "Start Detection" in the sidebar
+   - Watch real-time detection with bounding boxes
+   - Each object gets a unique tracking ID
+5. **Download Results**:
+   - Stop detection when finished
+   - Download button appears automatically
+   - Processed video includes all annotations
+## About YOLO Models
+### Available Models
+1. **YOLOv8n (Nano)**:
+   - Size: 6.7 MB
+   - Best for: Real-time applications on CPU
+   - Speed: ⚡⚡⚡⚡⚡
+   - Accuracy: ⭐⭐
+2. **YOLOv8s (Small)**:
+   - Size: 22.4 MB
+   - Best for: Balanced performance
+   - Speed: ⚡⚡⚡⚡
+   - Accuracy: ⭐⭐⭐
+3. **YOLOv8m (Medium)**:
+   - Size: 52.2 MB
+   - Best for: Standard detection tasks
+   - Speed: ⚡⚡⚡
+   - Accuracy: ⭐⭐⭐⭐
+4. **YOLOv8l (Large)**:
+   - Size: 87.7 MB
+   - Best for: High accuracy needs
+   - Speed: ⚡⚡
+   - Accuracy: ⭐⭐⭐⭐⭐
+5. **YOLOv8x (XLarge)**:
+   - Size: 131.7 MB
+   - Best for: Maximum accuracy
+   - Speed: ⚡
+   - Accuracy: ⭐⭐⭐⭐⭐⭐
+### Model Selection Guide
+- **CPU Only**: Use Nano or Small models
+- **GPU Available**: Medium to XLarge models recommended
+- **Real-time Needs**: Nano or Small models
+- **Accuracy Priority**: Large or XLarge models
+- **Balanced**: Medium model
+## Technical Details
+- Built with Streamlit and OpenCV
+- Uses Ultralytics YOLOv8 implementation
+- Supports multiple video codecs
+- Real-time frame processing and buffering
+- Unique object tracking with IoU
+- Color-coded object categories
+- Frame buffer for smooth video writing
+## Troubleshooting
+1. **Video Not Loading**:
+   - Check file format (MP4/AVI supported)
+   - Ensure file isn't corrupted
+   - Try a different video codec
+2. **Slow Performance**:
+   - Use a smaller YOLO model
+   - Reduce input video resolution
+   - Check GPU availability
+3. **Detection Issues**:
+   - Adjust confidence threshold
+   - Try a larger YOLO model
+   - Ensure good lighting in video
+4. **Download Issues**:
+   - Wait for processing to complete
+   - Check available disk space
+   - Try a different browser
+## Requirements
+- streamlit>=1.24.0
+- opencv-python-headless>=4.7.0
+- torch>=2.0.0
+- torchvision>=0.15.0
+- numpy>=1.24.0
+- ultralytics>=8.0.0
+- python-dateutil>=2.8.2
+## Acknowledgments
+- YOLOv8 by Ultralytics - https://docs.ultralytics.com/models/yolov8/
+- Streamlit Framework - https://streamlit.io
+- OpenCV Project - https://docs.opencv.org/4.x/index.html

app.py ADDED Viewed

	@@ -0,0 +1,313 @@

+import streamlit as st
+import cv2
+import torch
+import numpy as np
+import time
+import tempfile
+from pathlib import Path
+# Import detection utilities
+from detection_utils import load_model, detect_objects, draw_boxes, ObjectTracker
+def initialize_video_capture(input_source, video_file=None, url=None):
+    """Initialize video capture and writer"""
+    cap = None
+    out = None
+    output_path = None
+    if input_source == "Video File" and video_file is not None:
+        # Save uploaded file to temp location
+        tfile = tempfile.NamedTemporaryFile(delete=False, suffix='.mp4')
+        tfile.write(video_file.read())
+        tfile.flush()
+        video_path = tfile.name
+        # Open video capture
+        cap = cv2.VideoCapture(video_path)
+        if cap.isOpened():
+            # Get video properties
+            width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+            height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+            fps = int(cap.get(cv2.CAP_PROP_FPS))
+            # Ensure valid FPS
+            if fps <= 0:
+                fps = 30
+            # Create output path in a temporary directory
+            temp_dir = tempfile.gettempdir()
+            output_path = str(Path(temp_dir) / 'detected_output.mp4')
+            # Try different codecs in order of preference
+            codecs = [
+                ('avc1', '.mp4'),
+                ('mp4v', '.mp4'),
+                ('XVID', '.avi')
+            ]
+            for codec, ext in codecs:
+                try:
+                    output_path = str(Path(temp_dir) / f'detected_output{ext}')
+                    fourcc = cv2.VideoWriter_fourcc(*codec)
+                    out = cv2.VideoWriter(
+                        output_path,
+                        fourcc,
+                        fps,
+                        (width, height),
+                        isColor=True
+                    )
+                    # Test if writer is working
+                    if out.isOpened():
+                        break
+                except Exception:
+                    continue
+            if out is None or not out.isOpened():
+                st.error("Failed to create video writer")
+                return None, None, None
+    elif input_source == "Live Stream URL" and url:
+        cap = cv2.VideoCapture(url)
+    return cap, out, output_path
+def get_model_info():
+    """Return information about available YOLO models"""
+    return {
+        'yolov8n.pt': {
+            'name': 'YOLOv8 Nano',
+            'description': 'Smallest and fastest model. Best for CPU or low-power devices.',
+            'speed': '⚡⚡⚡⚡⚡',
+            'accuracy': '⭐⭐',
+            'size': '6.7 MB',
+            'details': 'Ideal for real-time applications with limited computing power.'
+        },
+        'yolov8s.pt': {
+            'name': 'YOLOv8 Small',
+            'description': 'Small model balancing speed and accuracy.',
+            'speed': '⚡⚡⚡⚡',
+            'accuracy': '⭐⭐⭐',
+            'size': '22.4 MB',
+            'details': 'Good for general purpose detection with decent performance.'
+        },
+        'yolov8m.pt': {
+            'name': 'YOLOv8 Medium',
+            'description': 'Medium-sized model with good balance.',
+            'speed': '⚡⚡⚡',
+            'accuracy': '⭐⭐⭐⭐',
+            'size': '52.2 MB',
+            'details': 'Recommended for standard detection tasks with good GPU.'
+        },
+        'yolov8l.pt': {
+            'name': 'YOLOv8 Large',
+            'description': 'Large model with high accuracy.',
+            'speed': '⚡⚡',
+            'accuracy': '⭐⭐⭐⭐⭐',
+            'size': '87.7 MB',
+            'details': 'Best for high-accuracy requirements with good computing power.'
+        },
+        'yolov8x.pt': {
+            'name': 'YOLOv8 XLarge',
+            'description': 'Extra large model with highest accuracy.',
+            'speed': '⚡',
+            'accuracy': '⭐⭐⭐⭐⭐⭐',
+            'size': '131.7 MB',
+            'details': 'Best for tasks requiring maximum accuracy, requires powerful GPU.'
+        }
+    }
+def main():
+    st.title("Real-Time Object Detection")
+    # Initialize session state
+    if 'tracker' not in st.session_state:
+        st.session_state.tracker = ObjectTracker()
+    if 'cap' not in st.session_state:
+        st.session_state.cap = None
+    if 'out' not in st.session_state:
+        st.session_state.out = None
+    if 'output_path' not in st.session_state:
+        st.session_state.output_path = None
+    if 'processed_frames' not in st.session_state:
+        st.session_state.processed_frames = 0
+    if 'selected_model' not in st.session_state:
+        st.session_state.selected_model = 'yolov8x.pt'
+    if 'model' not in st.session_state:
+        st.session_state.model = None
+    # Sidebar settings
+    st.sidebar.title("Settings")
+    # Model selection
+    st.sidebar.subheader("Model Selection")
+    model_info = get_model_info()
+    selected_model = st.sidebar.selectbox(
+        "Choose YOLO Model",
+        options=list(model_info.keys()),
+        format_func=lambda x: model_info[x]['name'],
+        index=list(model_info.keys()).index(st.session_state.selected_model)
+    )
+    # Display model information
+    with st.sidebar.expander("Model Details", expanded=True):
+        st.markdown(f"**{model_info[selected_model]['name']}**")
+        st.write(model_info[selected_model]['description'])
+        st.write(f"Speed: {model_info[selected_model]['speed']}")
+        st.write(f"Accuracy: {model_info[selected_model]['accuracy']}")
+        st.write(f"Size: {model_info[selected_model]['size']}")
+        st.write(f"Details: {model_info[selected_model]['details']}")
+    # Add Load Model button
+    if st.sidebar.button("Load Selected Model"):
+        with st.spinner(f"Loading {model_info[selected_model]['name']}..."):
+            st.session_state.model = load_model(selected_model)
+            st.session_state.selected_model = selected_model
+            st.sidebar.success("Model loaded successfully!")
+    # Detection confidence
+    detection_confidence = st.sidebar.slider("Detection Confidence", 0.0, 1.0, 0.5)
+    # Input selection
+    input_source = st.radio("Select Input Source", ["Video File", "Live Stream URL"])
+    try:
+        # Handle video input
+        if input_source == "Video File":
+            video_file = st.file_uploader("Upload Video", type=['mp4', 'avi'])
+            if video_file is not None:
+                st.session_state.cap, st.session_state.out, st.session_state.output_path = initialize_video_capture(input_source, video_file=video_file)
+        else:
+            url = st.text_input("Enter Stream URL")
+            if url:
+                st.session_state.cap, st.session_state.out, st.session_state.output_path = initialize_video_capture(input_source, url=url)
+        if st.session_state.cap is not None and not st.session_state.cap.isOpened():
+            st.error("Error: Could not open video source")
+            st.stop()
+        # Create placeholder for video display
+        video_placeholder = st.empty()
+        # Initialize frame buffer in session state
+        if 'frame_buffer' not in st.session_state:
+            st.session_state.frame_buffer = []
+        # Control buttons - Move them to sidebar to avoid duplication
+        st.sidebar.markdown("---")
+        st.sidebar.subheader("Controls")
+        start_button = st.sidebar.button("Start Detection")
+        stop_button = st.sidebar.button("Stop Detection")
+        if start_button:
+            if st.session_state.model is None:
+                st.error("Please load a model first using the 'Load Selected Model' button")
+                st.stop()
+            if st.session_state.cap is None:
+                st.error("Please upload a video or provide a stream URL first")
+                st.stop()
+            st.session_state.run_detection = True
+            st.session_state.processed_frames = 0
+            st.session_state.frame_buffer = []  # Clear buffer on start
+        if stop_button:
+            st.session_state.run_detection = False
+        # Detection loop
+        while (hasattr(st.session_state, 'run_detection') and
+               st.session_state.run_detection and
+               st.session_state.cap is not None):
+            ret, frame = st.session_state.cap.read()
+            if not ret:
+                break
+            # Perform detection
+            detections = detect_objects(st.session_state.model, frame, detection_confidence)
+            # Draw boxes on frame
+            annotated_frame = draw_boxes(frame, detections, st.session_state.tracker)
+            # Add frame to buffer
+            st.session_state.frame_buffer.append(annotated_frame)
+            # Write frames to video periodically
+            if len(st.session_state.frame_buffer) >= 30:  # Write every 30 frames
+                for buffered_frame in st.session_state.frame_buffer:
+                    if st.session_state.out is not None:
+                        st.session_state.out.write(buffered_frame)
+                        st.session_state.processed_frames += 1
+                st.session_state.frame_buffer.clear()
+            # Update display every 3rd frame
+            if st.session_state.processed_frames % 3 == 0:
+                video_placeholder.image(annotated_frame, channels="BGR")
+            # Minimal sleep to prevent UI freezing
+            time.sleep(0.001)
+        # Write remaining frames in buffer
+        if st.session_state.frame_buffer and st.session_state.out is not None:
+            for buffered_frame in st.session_state.frame_buffer:
+                st.session_state.out.write(buffered_frame)
+                st.session_state.processed_frames += 1
+            st.session_state.frame_buffer.clear()
+    except Exception as e:
+        st.error(f"An error occurred: {str(e)}")
+        raise e
+    finally:
+        # Ensure proper cleanup and save remaining frames
+        if hasattr(st.session_state, 'frame_buffer') and st.session_state.frame_buffer and hasattr(st.session_state, 'out') and st.session_state.out is not None:
+            for buffered_frame in st.session_state.frame_buffer:
+                st.session_state.out.write(buffered_frame)
+                st.session_state.processed_frames += 1
+            st.session_state.frame_buffer.clear()
+        # Release resources
+        if hasattr(st.session_state, 'cap') and st.session_state.cap is not None:
+            st.session_state.cap.release()
+        if hasattr(st.session_state, 'out') and st.session_state.out is not None:
+            st.session_state.out.release()
+            cv2.destroyAllWindows()
+        # Add a separator
+        st.markdown("---")
+        # Download section
+        if st.session_state.processed_frames > 0:
+            st.subheader("Download Processed Video")
+            # Force flush and wait
+            time.sleep(3)  # Increased wait time
+            if (st.session_state.output_path and
+                Path(st.session_state.output_path).exists()):
+                try:
+                    with open(st.session_state.output_path, 'rb') as f:
+                        video_data = f.read()
+                        if len(video_data) > 1000:
+                            st.success(f"Successfully processed {st.session_state.processed_frames} frames")
+                            # Make download button more prominent
+                            st.download_button(
+                                label="📥 Download Processed Video",
+                                data=video_data,
+                                file_name=f"detected_video_{time.strftime('%Y%m%d_%H%M%S')}.mp4",
+                                mime="video/mp4",
+                                key="download_button"
+                            )
+                        else:
+                            st.error("Error: Video file is empty or corrupted")
+                            st.info("Try processing the video again with different settings")
+                except Exception as e:
+                    st.error(f"Error preparing download: {str(e)}")
+                    st.info("Please try processing the video again")
+            else:
+                st.error("Output video file not found")
+                st.info("Make sure to complete the video processing before downloading")
+if __name__ == "__main__":
+    main()

asset/ezgif-5-12682faad5.gif ADDED Viewed

Git LFS Details

SHA256: c2ff2214f48cc1728de93b9b204fef93e3c29f0054867ac4baf4e32b2087100d
Pointer size: 132 Bytes
Size of remote file: 1.24 MB

asset/ezgif-5-28a1705b9b.gif ADDED Viewed

Git LFS Details

SHA256: 952bf5acd331642dea3f8806f592ff6a8d03fe705473afb3dc7b65a397a2d853
Pointer size: 131 Bytes
Size of remote file: 976 kB

detection_utils.py ADDED Viewed

	@@ -0,0 +1,245 @@

+import torch
+import cv2
+import numpy as np
+from collections import defaultdict
+import streamlit as st
+# Per-class box colours, keyed by class label string.
+# Each value is a 3-tuple of 0-255 channel intensities.
+# NOTE(review): the colour names in the trailing comments are not consistent
+# about channel order - e.g. 'person' (0, 0, 255) "Red" and 'car' (255, 0, 0)
+# "Blue" only hold when read as BGR, while 'bus' (255, 255, 0) "Yellow" and
+# 'dog' (0, 255, 255) "Cyan" only hold when read as RGB. Presumably the
+# tuples are passed to OpenCV drawing calls (BGR) - confirm against the code
+# that consumes this map and correct the names accordingly.
+# NOTE(review): some classes share a colour (cow/sink, pizza/baseball bat,
+# book/tennis racket, surfboard/microwave).
+color_map = {
+    # People and animals
+    'person': (0, 0, 255),      # Red
+    'dog': (0, 255, 255),       # Cyan
+    'cat': (255, 0, 255),       # Magenta
+    'bird': (165, 42, 42),      # Brown
+    'horse': (128, 0, 0),       # Maroon
+    'sheep': (230, 216, 173),   # Beige
+    'cow': (112, 128, 144),     # Slate
+    # Vehicles
+    'car': (255, 0, 0),         # Blue
+    'truck': (255, 165, 0),     # Orange
+    'bicycle': (128, 0, 128),   # Purple
+    'motorcycle': (255, 192, 203), # Pink
+    'bus': (255, 255, 0),       # Yellow
+    'train': (0, 128, 0),       # Dark Green
+    'airplane': (70, 130, 180),  # Steel Blue
+    'boat': (0, 165, 255),      # Orange-Red
+    # Objects
+    'traffic light': (0, 255, 127),  # Spring Green
+    'fire hydrant': (255, 69, 0),    # Red-Orange
+    'stop sign': (220, 20, 60),      # Crimson
+    'bench': (107, 142, 35),         # Olive
+    'chair': (0, 128, 128),          # Teal
+    'dining table': (255, 215, 0),   # Gold
+    'cell phone': (138, 43, 226),    # Blue Violet
+    'laptop': (0, 191, 255),         # Deep Sky Blue
+    'keyboard': (255, 127, 80),      # Coral
+    'book': (218, 112, 214),         # Orchid
+    'clock': (240, 230, 140),        # Khaki
+    # Sports
+    'sports ball': (0, 250, 154),    # Medium Spring Green
+    'kite': (255, 240, 245),         # Lavender
+    'baseball bat': (188, 143, 143), # Rosy Brown
+    'baseball glove': (46, 139, 87), # Sea Green
+    # Food
+    'bottle': (0, 206, 209),         # Turquoise
+    'wine glass': (255, 248, 220),   # Cornsilk
+    'cup': (147, 112, 219),          # Medium Purple
+    'fork': (218, 165, 32),          # Goldenrod
+    'sandwich': (210, 105, 30),      # Chocolate
+    'pizza': (188, 143, 143),        # Rosy Brown
+    # Additional objects
+    'backpack': (0, 100, 0),         # Dark Green
+    'umbrella': (255, 182, 193),     # Light Pink
+    'handbag': (219, 112, 147),      # Pale Violet Red
+    'tie': (106, 90, 205),           # Slate Blue
+    'suitcase': (72, 61, 139),       # Dark Slate Blue
+    'frisbee': (32, 178, 170),       # Light Sea Green
+    'skis': (135, 206, 250),         # Light Sky Blue
+    'snowboard': (176, 224, 230),    # Powder Blue
+    'tennis racket': (218, 112, 214),# Orchid
+    'surfboard': (0, 139, 139),      # Dark Cyan
+    'remote': (143, 188, 143),       # Dark Sea Green
+    'mouse': (216, 191, 216),        # Thistle
+    'toaster': (255, 222, 173),      # Navajo White
+    'sink': (112, 128, 144),         # Slate Gray
+    'refrigerator': (47, 79, 79),    # Dark Slate Gray
+    'tv': (25, 25, 112),             # Midnight Blue
+    'microwave': (0, 139, 139),      # Dark Cyan
+    'oven': (160, 82, 45),           # Sienna
+    'toothbrush': (199, 21, 133),    # Medium Violet Red
+    'scissors': (176, 196, 222),     # Light Steel Blue
+}
+def load_model(model_path='yolov8x.pt'):
+    """Load YOLOv8 model"""
+    try:
+        from ultralytics import YOLO
+        import os
+        os.environ['NNPACK_FAST_MATH'] = 'OFF'
+        # Load the selected model
+        model = YOLO(model_path)
+        # Warmup the model
+        model.predict(np.zeros((640, 640, 3)), verbose=False)
+        return model
+    except Exception as e:
+        st.error(f"Error loading model: {str(e)}")
+        st.stop()
+def detect_objects(model, frame, conf_threshold=0.5):
+    """
+    Detect objects in a frame using YOLO with optimized processing
+    """
+    # Convert frame to RGB
+    frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+    # Perform detection with optimized settings
+    results = model.predict(
+        frame_rgb,
+        conf=conf_threshold,
+        verbose=False,
+        device='0' if torch.cuda.is_available() else 'cpu',
+        imgsz=1280,  # Increased size for better detection
+        iou=0.4,    # Adjusted IOU threshold
+        max_det=300,  # Increase maximum detections
+        agnostic_nms=True,  # Better handling of objects of different sizes
+    )
+    result = results[0]
+    detections = []
+    if hasattr(result, 'boxes'):
+        boxes = result.boxes.cpu().numpy()
+        for box in boxes:
+            try:
+                x1, y1, x2, y2 = map(int, box.xyxy[0])
+                class_id = int(box.cls[0])
+                confidence = float(box.conf[0])
+                class_name = result.names[class_id]
+                detection = {
+                    'bbox': [x1, y1, x2, y2],
+                    'class': class_name,
+                    'confidence': confidence
+                }
+                detections.append(detection)
+            except Exception as e:
+                continue
+    return detections
+class ObjectTracker:
+    def __init__(self):
+        self.next_id = 1
+        self.object_ids = {}
+        self.id_timeout = 30
+        self.last_positions = {}
+    def get_object_id(self, bbox, class_name):
+        """Assign or retrieve ID for detected object based on position and IoU"""
+        center = ((bbox[0] + bbox[2]) // 2, (bbox[1] + bbox[3]) // 2)
+        # Calculate box area
+        box_area = (bbox[2] - bbox[0]) * (bbox[3] - bbox[1])
+        best_iou = 0
+        best_id = None
+        # Check existing objects
+        for obj_id, (old_bbox, old_class, last_seen) in list(self.last_positions.items()):
+            if last_seen > self.id_timeout:
+                del self.last_positions[obj_id]
+                continue
+            # Calculate IoU
+            x1 = max(bbox[0], old_bbox[0])
+            y1 = max(bbox[1], old_bbox[1])
+            x2 = min(bbox[2], old_bbox[2])
+            y2 = min(bbox[3], old_bbox[3])
+            if x2 > x1 and y2 > y1:
+                intersection = (x2 - x1) * (y2 - y1)
+                old_area = (old_bbox[2] - old_bbox[0]) * (old_bbox[3] - old_bbox[1])
+                union = box_area + old_area - intersection
+                iou = intersection / union
+                if iou > best_iou and iou > 0.3 and class_name == old_class:
+                    best_iou = iou
+                    best_id = obj_id
+        if best_id is not None:
+            self.last_positions[best_id] = (bbox, class_name, 0)
+            return best_id
+        # If no match found, assign new ID
+        new_id = self.next_id
+        self.next_id += 1
+        self.last_positions[new_id] = (bbox, class_name, 0)
+        return new_id
+    def update_timeouts(self):
+        """Update timeout counters for all tracked objects"""
+        for obj_id in self.last_positions:
+            bbox, class_name, timeout = self.last_positions[obj_id]
+            self.last_positions[obj_id] = (bbox, class_name, timeout + 1)
+def draw_boxes(frame, detections, tracker):
+    """
+    Optimized version of drawing bounding boxes and labels with improved visibility
+    """
+    annotated_frame = frame.copy()
+    tracker.update_timeouts()
+    # Thicker lines and larger text for better visibility
+    box_thickness = 3
+    text_scale = 0.7
+    text_thickness = 2
+    for det in detections:
+        x1, y1, x2, y2 = det['bbox']
+        obj_id = tracker.get_object_id(det['bbox'], det['class'])
+        # Get color with default
+        color = color_map.get(det['class'].lower(), (0, 255, 0))
+        # Create label with better formatting
+        label = f"#{obj_id} {det['class']} {det['confidence']:.2f}"
+        # Draw box with thicker lines
+        cv2.rectangle(annotated_frame, (x1, y1), (x2, y2), color, box_thickness)
+        # Improve text background
+        (text_width, text_height), baseline = cv2.getTextSize(
+            label, cv2.FONT_HERSHEY_SIMPLEX, text_scale, text_thickness)
+        # Make background rectangle slightly larger
+        padding = 5
+        cv2.rectangle(annotated_frame,
+                     (x1, y1 - text_height - baseline - padding * 2),
+                     (x1 + text_width + padding * 2, y1),
+                     color, -1)
+        # Add white border around the text for better visibility
+        for dx, dy in [(-1,-1), (-1,1), (1,-1), (1,1)]:
+            cv2.putText(annotated_frame, label,
+                       (x1 + padding + dx, y1 - padding + dy),
+                       cv2.FONT_HERSHEY_SIMPLEX, text_scale,
+                       (0, 0, 0), text_thickness + 1)
+        # Draw main text
+        cv2.putText(annotated_frame, label,
+                    (x1 + padding, y1 - padding),
+                    cv2.FONT_HERSHEY_SIMPLEX, text_scale,
+                    (255, 255, 255), text_thickness)
+        det['id'] = obj_id
+    return annotated_frame

requirements.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+opencv-python-headless>=4.7.0
+torch>=2.0.0
+torchvision>=0.15.0
+numpy>=1.24.0
+streamlit>=1.24.0
+ultralytics>=8.0.0
+python-dateutil>=2.8.2