Spaces:
No application file
No application file
| import onnxruntime | |
| import scipy.special | |
| from enum import Enum | |
| import cv2 | |
| import time | |
| import numpy as np | |
# BGR colors used to draw each of the (up to) four detected lanes.
lane_colors = [(0, 0, 255), (0, 255, 0), (255, 0, 0), (0, 255, 255)]

# Vertical row anchors (pixel rows in the 288-px-high model input) at which
# the model classifies lane positions.
# TuSimple: 56 evenly spaced anchors, rows 64..284 step 4.
tusimple_row_anchor = list(range(64, 288, 4))

# CULane: 18 irregularly spaced anchors.
culane_row_anchor = [
    121, 131, 141, 150, 160, 170, 180, 189, 199,
    209, 219, 228, 238, 248, 258, 267, 277, 287,
]
class ModelType(Enum):
    """Which dataset the lane-detection model was trained on."""

    TUSIMPLE = 0
    CULANE = 1
class ModelConfig:
    """Per-dataset model configuration.

    Exposes: img_w / img_h (source frame size), row_anchor (model row
    anchors), griding_num (horizontal grid cells) and cls_num_per_lane
    (number of row anchors per lane).
    """

    def __init__(self, model_type):
        # TuSimple is the explicit case; every other type falls back to CULane.
        if model_type == ModelType.TUSIMPLE:
            self.init_tusimple_config()
        else:
            self.init_culane_config()

    def init_tusimple_config(self):
        # TuSimple frames are 1280x720; 100 grid cells over 56 row anchors.
        self.img_w, self.img_h = 1280, 720
        self.row_anchor = tusimple_row_anchor
        self.griding_num, self.cls_num_per_lane = 100, 56

    def init_culane_config(self):
        # CULane frames are 1640x590; 200 grid cells over 18 row anchors.
        self.img_w, self.img_h = 1640, 590
        self.row_anchor = culane_row_anchor
        self.griding_num, self.cls_num_per_lane = 200, 18
| class UltrafastLaneDetector: | |
| def __init__(self, model_path, model_type=ModelType.TUSIMPLE): | |
| self.fps = 0 | |
| self.timeLastPrediction = time.time() | |
| self.frameCounter = 0 | |
| # Load model configuration based on the model type | |
| self.cfg = ModelConfig(model_type) | |
| # Initialize model | |
| self.initialize_model(model_path) | |
| def initialize_model(self, model_path): | |
| available_providers = onnxruntime.get_available_providers() | |
| if 'CUDAExecutionProvider' in available_providers: | |
| # "TensorrtExecutionProvider" | |
| # "CUDAExecutionProvider" | |
| providers = ['CUDAExecutionProvider', 'CPUExecutionProvider'] | |
| print("Using CUDA provider") | |
| else: | |
| providers = ['CPUExecutionProvider'] | |
| print("Using CPU provider") | |
| self.session = onnxruntime.InferenceSession(model_path, providers=providers) | |
| # Get model info | |
| self.getModel_input_details() | |
| self.getModel_output_details() | |
| def detect_lanes(self, image, draw_points=True): | |
| input_tensor = self.prepare_input(image) | |
| # Perform inference on the image | |
| output = self.inference(input_tensor) | |
| # Process output data | |
| self.lanes_points, self.lanes_detected = self.process_output(output, self.cfg) | |
| return self.lanes_points, self.lanes_detected | |
| def prepare_input(self, image): | |
| img = cv2.cvtColor(image, cv2.COLOR_BGR2RGB) | |
| self.img_height, self.img_width, self.img_channels = img.shape | |
| # Input values should be from -1 to 1 with a size of 288 x 800 pixels | |
| img_input = cv2.resize(img, (self.input_width, self.input_height)).astype( | |
| np.float32 | |
| ) | |
| # Scale input pixel values to -1 to 1 | |
| mean = [0.485, 0.456, 0.406] | |
| std = [0.229, 0.224, 0.225] | |
| img_input = (img_input / 255.0 - mean) / std | |
| img_input = img_input.transpose(2, 0, 1) | |
| img_input = img_input[np.newaxis, :, :, :] | |
| # Convert to float16 | |
| return img_input.astype(np.float16) | |
| def inference(self, input_tensor): | |
| input_name = self.session.get_inputs()[0].name | |
| output_name = self.session.get_outputs()[0].name | |
| output = self.session.run([output_name], {input_name: input_tensor}) | |
| return output | |
| def getModel_input_details(self): | |
| self.input_shape = self.session.get_inputs()[0].shape | |
| self.channes = self.input_shape[2] | |
| self.input_height = self.input_shape[2] | |
| self.input_width = self.input_shape[3] | |
| def getModel_output_details(self): | |
| self.output_shape = self.session.get_outputs()[0].shape | |
| self.num_points = self.output_shape[1] | |
| self.num_anchors = self.output_shape[2] | |
| self.num_lanes = self.output_shape[3] | |
| def process_output(output, cfg): | |
| # Parse the output of the model | |
| processed_output = np.squeeze(output[0]) | |
| processed_output = processed_output[:, ::-1, :] | |
| prob = scipy.special.softmax(processed_output[:-1, :, :], axis=0) | |
| idx = np.arange(cfg.griding_num) + 1 | |
| idx = idx.reshape(-1, 1, 1) | |
| loc = np.sum(prob * idx, axis=0) | |
| processed_output = np.argmax(processed_output, axis=0) | |
| loc[processed_output == cfg.griding_num] = 0 | |
| processed_output = loc | |
| col_sample = np.linspace(0, 800 - 1, cfg.griding_num) | |
| col_sample_w = col_sample[1] - col_sample[0] | |
| lanes_points = [] | |
| lanes_detected = [] | |
| max_lanes = processed_output.shape[1] | |
| for lane_num in range(max_lanes): | |
| lane_points = [] | |
| # Check if there are any points detected in the lane | |
| if np.sum(processed_output[:, lane_num] != 0) > 2: | |
| lanes_detected.append(True) | |
| # Process each of the points for each lane | |
| for point_num in range(processed_output.shape[0]): | |
| if processed_output[point_num, lane_num] > 0: | |
| lane_point = [ | |
| int( | |
| processed_output[point_num, lane_num] | |
| * col_sample_w | |
| * cfg.img_w | |
| / 800 | |
| ) | |
| - 1, | |
| int( | |
| cfg.img_h | |
| * ( | |
| cfg.row_anchor[cfg.cls_num_per_lane - 1 - point_num] | |
| / 288 | |
| ) | |
| ) | |
| - 1, | |
| ] | |
| lane_points.append(lane_point) | |
| else: | |
| lanes_detected.append(False) | |
| lanes_points.append(lane_points) | |
| return lanes_points, np.array(lanes_detected) | |
| def draw_lanes(input_img, lanes_points, lanes_detected, cfg, draw_points=True): | |
| # Write the detected line points in the image | |
| visualization_img = cv2.resize( | |
| input_img, (cfg.img_w, cfg.img_h), interpolation=cv2.INTER_AREA | |
| ) | |
| # Draw a mask for the current lane | |
| if lanes_detected[1] and lanes_detected[2]: | |
| lane_segment_img = visualization_img.copy() | |
| cv2.fillPoly( | |
| lane_segment_img, | |
| pts=[np.vstack((lanes_points[1], np.flipud(lanes_points[2])))], | |
| color=(255, 191, 0), | |
| ) | |
| visualization_img = cv2.addWeighted( | |
| visualization_img, 0.7, lane_segment_img, 0.3, 0 | |
| ) | |
| if draw_points: | |
| for lane_num, lane_points in enumerate(lanes_points): | |
| for lane_point in lane_points: | |
| cv2.circle( | |
| visualization_img, | |
| (lane_point[0], lane_point[1]), | |
| 3, | |
| lane_colors[lane_num], | |
| -1, | |
| ) | |
| return visualization_img | |