# DroneCrashClassification / model / video_classifier.py
# Author: EthanStanks
# Commit f7306b6: reducing frame size for hopefully faster CPU processing
import os
import cv2
from ultralytics import YOLO
import gradio as gr
def get_model(path):
    """Load and return a YOLO model from the given weights path."""
    model = YOLO(path)
    return model
def format_time(seconds):
    """Format a duration in seconds as an "M:SS.ss" string."""
    minutes, remainder = divmod(seconds, 60)
    return f"{int(minutes)}:{remainder:05.2f}"
def merge_crash_events(crash_events, merge_gap=5.0):
    """Merge crash events that occur close together in time.

    Many crash events share (nearly) the same start time; any event whose
    start falls within ``merge_gap`` seconds of the previous event's end is
    folded into it.

    Args:
        crash_events: list of (start_sec, end_sec) tuples, in chronological order.
        merge_gap: maximum gap in seconds between two events for them to be
            merged into one (default 5.0, the original hard-coded threshold).

    Returns:
        A new list of merged (start_sec, end_sec) tuples; [] for empty input.
    """
    if not crash_events:
        return []
    merged = [crash_events[0]]  # seed with the first event
    for start, end in crash_events[1:]:
        last_start, last_end = merged[-1]
        if start - last_end <= merge_gap:
            # Extend the previous event; keep the later of the two end times.
            merged[-1] = (last_start, max(last_end, end))
        else:
            merged.append((start, end))  # gap too large — keep as a separate event
    return merged
def video_classification(video_path, label_vid_output, crash_vid_output, model, min_crash_duration=2.0):
    """Classify a drone video frame by frame, yielding progress and final results.

    Writes two output videos: one with every frame annotated with its predicted
    label, and one containing only the frames classified as "Crash". Tracks
    contiguous crash events and merges near-duplicates at the end.

    Args:
        video_path: path to the input video file.
        label_vid_output: output path for the fully-labeled video.
        crash_vid_output: output path for the crash-frames-only video.
        model: loaded YOLO classification model (see ``get_model``).
        min_crash_duration: minimum crash length in seconds to keep an event;
            weeds out false flags (default 2.0).

    Yields:
        Per frame: {'type': 'frame', 'frame': <RGB ndarray>, 'progress_text': str}
        Once at the end: {'type': 'results', 'label_counts': dict,
                          'crash_events': list of (start_sec, end_sec)}
    """
    # Index -> label name; must match the model's class ordering.
    # TODO(review): confirm this ordering against the model's training config.
    class_labels = ("Crash", "Flight", "No drone", "No signal",
                    "No started", "Started", "Unstable", "Landing")
    # start video process
    cap = cv2.VideoCapture(video_path)
    total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
    fps = cap.get(cv2.CAP_PROP_FPS)
    width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
    height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
    count = 0
    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
    labeled_out = cv2.VideoWriter(label_vid_output, fourcc, fps, (width, height))
    crash_out = cv2.VideoWriter(crash_vid_output, fourcc, fps, (width, height))
    # per-label frame counts (same key order as before: known labels, then Unknown)
    label_counts = {name: 0 for name in class_labels}
    label_counts["Unknown"] = 0
    is_crash = False  # is current frame inside a crash event
    crash_events = []  # store crash event tuples (start, end)
    crash_start_time = None  # start time of the open crash event, if any
    non_crash_frame_threshold = int(fps * 1.0)  # non-crash frames needed to close an event
    non_crash_frame_count = 0  # consecutive non-crash frames seen so far
    while True:
        ret, og_frame = cap.read()  # read current frame
        if not ret:
            break
        print(f"\rProcessing frame {count + 1}/{total_frames}", end='', flush=True)
        # preprocess frame for prediction
        frame = cv2.resize(og_frame, (320, 320))  # reducing to help processing time on cpu
        # get timestamp of the frame
        current_time_ms = cap.get(cv2.CAP_PROP_POS_MSEC)
        current_time_sec = current_time_ms / 1000.0
        # make prediction
        results = model.predict(source=frame, imgsz=640, verbose=False)
        current_label = "Unknown"
        if results and hasattr(results[0], 'probs') and results[0].probs is not None:
            top1_index = results[0].probs.top1
            if 0 <= top1_index < len(class_labels):
                current_label = class_labels[top1_index]
        # Count every frame exactly once (previously a frame with no probs was
        # labeled "Unknown" but not counted, unlike an out-of-range index).
        label_counts[current_label] += 1
        if current_label == "Crash":
            crash_out.write(og_frame)
            if not is_crash:
                # start a new crash event
                crash_start_time = current_time_sec
                is_crash = True
            non_crash_frame_count = 0
        else:
            if is_crash:
                # currently inside a crash event; count non-crash frames
                non_crash_frame_count += 1
                if non_crash_frame_count >= non_crash_frame_threshold:
                    # enough non-crash frames: close the event
                    crash_end_time = current_time_sec
                    crash_duration = crash_end_time - crash_start_time
                    if crash_duration >= min_crash_duration:
                        crash_events.append((crash_start_time, crash_end_time))
                    is_crash = False
                    crash_start_time = None
                    non_crash_frame_count = 0
            else:
                # not in a crash event
                non_crash_frame_count = 0
        # write label overlay onto the full-resolution frame
        font = cv2.FONT_HERSHEY_SIMPLEX
        font_scale = 0.6
        font_color = (255, 255, 255)
        thickness = 2
        position = (10, 30)
        text_size = cv2.getTextSize(current_label, font, font_scale, thickness)[0]
        text_x, text_y = position
        # black background box so the label stays readable on any frame
        cv2.rectangle(og_frame, (text_x - 5, text_y - text_size[1] - 5), (text_x + text_size[0] + 5, text_y + 5), (0, 0, 0), -1)
        cv2.putText(og_frame, current_label, position, font, font_scale, font_color, thickness)
        labeled_out.write(og_frame)
        frame_out = cv2.cvtColor(og_frame, cv2.COLOR_BGR2RGB)  # Gradio expects RGB
        progress_text = f"Processing frame {count + 1}/{total_frames}"
        yield {'type': 'frame', 'frame': frame_out, 'progress_text': progress_text}
        count += 1  # frame is over
    # video is over
    if is_crash:
        # ended on a crash frame: close the open event at the video's end
        crash_end_time = total_frames / fps
        crash_duration = crash_end_time - crash_start_time
        if crash_duration >= min_crash_duration:
            crash_events.append((crash_start_time, crash_end_time))
    cap.release()
    labeled_out.release()
    crash_out.release()
    cv2.destroyAllWindows()
    # merge events to only have unique crashes
    merged_crash_events = merge_crash_events(crash_events)
    yield {'type': 'results', 'label_counts': label_counts, 'crash_events': merged_crash_events}