Spaces:

damndeepesh
/

QuickTrack

Sleeping

App Files Files Community

QuickTrack / app.py

damndeepesh

Uploaded Project Files

9de653a verified 12 months ago

raw

history blame contribute delete

12.8 kB

	import streamlit as st
	import cv2
	import torch
	import numpy as np
	import time
	import tempfile
	from pathlib import Path

	# Import detection utilities
	from detection_utils import load_model, detect_objects, draw_boxes, ObjectTracker

	def initialize_video_capture(input_source, video_file=None, url=None):
	    """Open the requested video source and, for uploads, an output writer.

	    Args:
	        input_source: "Video File" or "Live Stream URL". Any other value
	            opens nothing.
	        video_file: Binary file-like object holding the uploaded video.
	            Only used when ``input_source`` is "Video File".
	        url: Address passed to ``cv2.VideoCapture``. Only used when
	            ``input_source`` is "Live Stream URL".

	    Returns:
	        A ``(cap, out, output_path)`` tuple. ``out`` and ``output_path`` are
	        only set for an uploaded file whose capture opened; a stream URL
	        yields a capture but no writer. ``(None, None, None)`` is returned
	        when no source was selected, or when no codec could create the
	        writer (an error is shown via ``st.error`` in that case).
	    """
	    cap = None
	    out = None
	    output_path = None

	    if input_source == "Video File" and video_file is not None:
	        # The same upload object may already have been read once; rewind so
	        # the copy below is never empty.
	        if hasattr(video_file, 'seek'):
	            video_file.seek(0)

	        # OpenCV needs a path on disk. The ``with`` block closes (and thereby
	        # flushes) the handle before OpenCV opens the file; delete=False
	        # keeps the file around for the lifetime of the capture.
	        with tempfile.NamedTemporaryFile(delete=False, suffix='.mp4') as tfile:
	            tfile.write(video_file.read())
	            video_path = tfile.name

	        cap = cv2.VideoCapture(video_path)

	        if cap.isOpened():
	            width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
	            height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))

	            # Keep the fractional rate (e.g. 29.97): truncating it to an int
	            # makes the output play at a different speed than the input.
	            # ``not fps > 0`` also rejects NaN.
	            fps = cap.get(cv2.CAP_PROP_FPS)
	            if not fps > 0:
	                fps = 30.0

	            temp_dir = Path(tempfile.gettempdir())

	            # Codec / container pairs in order of preference.
	            codecs = [
	                ('avc1', '.mp4'),
	                ('mp4v', '.mp4'),
	                ('XVID', '.avi'),
	            ]

	            for codec, ext in codecs:
	                candidate_path = str(temp_dir / f'detected_output{ext}')
	                writer = None
	                try:
	                    writer = cv2.VideoWriter(
	                        candidate_path,
	                        cv2.VideoWriter_fourcc(*codec),
	                        fps,
	                        (width, height),
	                        isColor=True
	                    )
	                    if writer.isOpened():
	                        out = writer
	                        output_path = candidate_path
	                        break
	                except Exception:
	                    # Best effort: an unusable codec just means "try the next".
	                    pass

	                # This codec did not work; free the writer before moving on.
	                if writer is not None:
	                    writer.release()

	            if out is None:
	                # Do not leak the capture when the writer cannot be created.
	                cap.release()
	                st.error("Failed to create video writer")
	                return None, None, None

	    elif input_source == "Live Stream URL" and url:
	        cap = cv2.VideoCapture(url)

	    return cap, out, output_path

	def get_model_info():
	    """Describe the selectable YOLOv8 checkpoints.

	    Returns:
	        A newly built dict keyed by weights filename. Each value is a dict
	        with the keys 'name', 'description', 'speed', 'accuracy', 'size'
	        and 'details', in that order.
	    """
	    fields = ('name', 'description', 'speed', 'accuracy', 'size', 'details')

	    # One row per checkpoint; values line up with ``fields``.
	    catalog = (
	        ('yolov8n.pt', (
	            'YOLOv8 Nano',
	            'Smallest and fastest model. Best for CPU or low-power devices.',
	            '⚡⚡⚡⚡⚡',
	            '⭐⭐',
	            '6.7 MB',
	            'Ideal for real-time applications with limited computing power.',
	        )),
	        ('yolov8s.pt', (
	            'YOLOv8 Small',
	            'Small model balancing speed and accuracy.',
	            '⚡⚡⚡⚡',
	            '⭐⭐⭐',
	            '22.4 MB',
	            'Good for general purpose detection with decent performance.',
	        )),
	        ('yolov8m.pt', (
	            'YOLOv8 Medium',
	            'Medium-sized model with good balance.',
	            '⚡⚡⚡',
	            '⭐⭐⭐⭐',
	            '52.2 MB',
	            'Recommended for standard detection tasks with good GPU.',
	        )),
	        ('yolov8l.pt', (
	            'YOLOv8 Large',
	            'Large model with high accuracy.',
	            '⚡⚡',
	            '⭐⭐⭐⭐⭐',
	            '87.7 MB',
	            'Best for high-accuracy requirements with good computing power.',
	        )),
	        ('yolov8x.pt', (
	            'YOLOv8 XLarge',
	            'Extra large model with highest accuracy.',
	            '⚡',
	            '⭐⭐⭐⭐⭐⭐',
	            '131.7 MB',
	            'Best for tasks requiring maximum accuracy, requires powerful GPU.',
	        )),
	    )

	    return {weights: dict(zip(fields, values)) for weights, values in catalog}

	def _flush_frame_buffer():
	    """Write buffered frames to the session's writer, then empty the buffer.

	    ``processed_frames`` is increased only when a writer exists, so the
	    counter reflects frames that actually reached the output file. The
	    buffer is emptied either way so it cannot grow without bound when there
	    is no writer.
	    """
	    state = st.session_state
	    buffered = state.get('frame_buffer')
	    if not buffered:
	        return

	    writer = state.get('out')
	    if writer is not None:
	        for frame in buffered:
	            writer.write(frame)
	        state.processed_frames = state.get('processed_frames', 0) + len(buffered)
	    buffered.clear()


	def _release_video_resources():
	    """Release the session's capture and writer and drop the stale handles."""
	    state = st.session_state
	    for key in ('cap', 'out'):
	        handle = state.get(key)
	        if handle is not None:
	            handle.release()
	        # A released handle is useless; storing None keeps later runs from
	        # mistaking it for a live source.
	        state[key] = None


	def _render_download_section():
	    """Offer the finished output file for download, or explain why it is missing."""
	    st.subheader("Download Processed Video")

	    output_path = st.session_state.get('output_path')
	    if not output_path or not Path(output_path).exists():
	        st.error("Output video file not found")
	        st.info("Make sure to complete the video processing before downloading")
	        return

	    try:
	        video_data = Path(output_path).read_bytes()
	    except OSError as e:
	        st.error(f"Error preparing download: {str(e)}")
	        st.info("Please try processing the video again")
	        return

	    # Treat a near-empty file (<= 1000 bytes) as a failed encode.
	    if len(video_data) <= 1000:
	        st.error("Error: Video file is empty or corrupted")
	        st.info("Try processing the video again with different settings")
	        return

	    # The writer may have fallen back to an .avi container; name and label
	    # the download after what was really written.
	    suffix = Path(output_path).suffix.lower() or '.mp4'
	    mime_type = 'video/x-msvideo' if suffix == '.avi' else 'video/mp4'

	    st.success(f"Successfully processed {st.session_state.processed_frames} frames")
	    st.download_button(
	        label="📥 Download Processed Video",
	        data=video_data,
	        file_name=f"detected_video_{time.strftime('%Y%m%d_%H%M%S')}{suffix}",
	        mime=mime_type,
	        key="download_button"
	    )


	def main():
	    """Render the page and run one detection pass when "Start Detection" is clicked.

	    Streamlit re-executes this function on every widget interaction, so the
	    capture and writer are opened only in the run where Start was clicked.
	    Re-opening them on every run would copy the upload to a new temp file
	    each time and would re-create the writer on the same output path,
	    wiping the finished video before it could be downloaded.

	    Whatever ends the run (end of stream, an error, or Streamlit interrupting
	    the script because the user clicked something), the ``finally`` block
	    flushes pending frames, releases the capture and writer, and clears
	    ``run_detection`` so a later run does not process the video again.
	    """
	    st.title("Real-Time Object Detection")

	    state = st.session_state

	    # Initialize session state. The tracker is handled separately so that it
	    # is only constructed when missing.
	    if 'tracker' not in state:
	        state.tracker = ObjectTracker()
	    if 'frame_buffer' not in state:
	        state.frame_buffer = []
	    for key, default in (
	        ('cap', None),
	        ('out', None),
	        ('output_path', None),
	        ('processed_frames', 0),
	        ('selected_model', 'yolov8x.pt'),
	        ('model', None),
	        ('run_detection', False),
	    ):
	        if key not in state:
	            state[key] = default

	    # Sidebar settings
	    st.sidebar.title("Settings")

	    # Model selection
	    st.sidebar.subheader("Model Selection")
	    model_info = get_model_info()
	    model_names = list(model_info)
	    selected_model = st.sidebar.selectbox(
	        "Choose YOLO Model",
	        options=model_names,
	        format_func=lambda x: model_info[x]['name'],
	        index=model_names.index(state.selected_model)
	    )

	    # Display model information
	    details = model_info[selected_model]
	    with st.sidebar.expander("Model Details", expanded=True):
	        st.markdown(f"{details['name']}")
	        st.write(details['description'])
	        st.write(f"Speed: {details['speed']}")
	        st.write(f"Accuracy: {details['accuracy']}")
	        st.write(f"Size: {details['size']}")
	        st.write(f"Details: {details['details']}")

	    # Loading is explicit (button) because it is the expensive step.
	    if st.sidebar.button("Load Selected Model"):
	        with st.spinner(f"Loading {details['name']}..."):
	            state.model = load_model(selected_model)
	            state.selected_model = selected_model
	        st.sidebar.success("Model loaded successfully!")

	    # Detection confidence
	    detection_confidence = st.sidebar.slider("Detection Confidence", 0.0, 1.0, 0.5)

	    # Input selection: only collect the source here, it is opened on Start.
	    input_source = st.radio("Select Input Source", ["Video File", "Live Stream URL"])
	    video_file = None
	    url = None
	    if input_source == "Video File":
	        video_file = st.file_uploader("Upload Video", type=['mp4', 'avi'])
	    else:
	        url = st.text_input("Enter Stream URL")

	    # Placeholder that the detection loop redraws in place.
	    video_placeholder = st.empty()

	    # Control buttons live in the sidebar to avoid duplication.
	    st.sidebar.markdown("---")
	    st.sidebar.subheader("Controls")
	    start_button = st.sidebar.button("Start Detection")
	    stop_button = st.sidebar.button("Stop Detection")

	    if stop_button:
	        state.run_detection = False

	    flush_every = 30   # frames buffered before they are written out
	    display_every = 3  # show every Nth frame to keep the UI responsive

	    try:
	        if start_button:
	            if state.model is None:
	                st.error("Please load a model first using the 'Load Selected Model' button")
	                st.stop()
	            if video_file is None and not url:
	                st.error("Please upload a video or provide a stream URL first")
	                st.stop()

	            state.processed_frames = 0
	            state.frame_buffer = []  # Clear buffer on start
	            state.cap, state.out, state.output_path = initialize_video_capture(
	                input_source, video_file=video_file, url=url
	            )
	            if state.cap is None:
	                # With a source supplied, no capture means the writer could
	                # not be created; initialize_video_capture reports that itself.
	                st.stop()
	            if not state.cap.isOpened():
	                st.error("Error: Could not open video source")
	                st.stop()
	            state.run_detection = True

	        # Detection loop
	        frame_index = 0
	        while state.run_detection and state.cap is not None:
	            ret, frame = state.cap.read()
	            if not ret:
	                break

	            detections = detect_objects(state.model, frame, detection_confidence)
	            annotated_frame = draw_boxes(frame, detections, state.tracker)

	            state.frame_buffer.append(annotated_frame)
	            if len(state.frame_buffer) >= flush_every:
	                _flush_frame_buffer()

	            # Throttle on a per-frame counter. processed_frames only moves in
	            # steps of flush_every, so it cannot be used for this.
	            if frame_index % display_every == 0:
	                video_placeholder.image(annotated_frame, channels="BGR")
	            frame_index += 1

	            # Minimal sleep to prevent UI freezing
	            time.sleep(0.001)

	    except Exception as e:
	        st.error(f"An error occurred: {str(e)}")
	        raise

	    finally:
	        # Save what is still buffered, then always release the handles.
	        # cv2.destroyAllWindows() is intentionally not called: this file
	        # opens no OpenCV windows, and the call can fail on OpenCV builds
	        # without GUI support.
	        try:
	            _flush_frame_buffer()
	        finally:
	            _release_video_resources()
	            state.run_detection = False

	    # Add a separator
	    st.markdown("---")

	    # Download section. The writer was released above, so the file is
	    # complete by now and no extra wait is needed.
	    if state.processed_frames > 0:
	        _render_download_section()

	# Start the app only when this file is executed as the main script,
	# not when it is imported as a module.
	if __name__ == "__main__":
	    main()