"""
Some utility functions, e.g. for normalizing angles.
Functions for detecting red lights are adapted from the scenario runner's
atomic_criteria.py.
"""
import math
import carla
import numpy as np
import torch
import torch.nn.functional as F
from torch import nn
import cv2
from collections import deque
from shapely.geometry import Polygon, Point
import shapely.affinity
import itertools
from copy import deepcopy
def normalize_angle(x):
x = x % (2 * np.pi) # force in range [0, 2 pi)
if x > np.pi: # move to [-pi, pi)
x -= 2 * np.pi
return x
def normalize_angle_degree(x):
x = x % 360.0
if x > 180.0:
x -= 360.0
return x
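# Hedged illustrative sketch (not part of the original module): shows how the two
# normalization helpers wrap an out-of-range heading back into the canonical interval.
def _example_normalize_angles():
  wrapped_rad = normalize_angle(3.0 * np.pi / 2.0)  # 270 deg in radians -> -pi/2
  wrapped_deg = normalize_angle_degree(270.0)  # -> -90.0
  return wrapped_rad, wrapped_deg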
def rotate_point(point, angle):
"""
rotate a given point by a given angle (in degrees)
"""
x_ = math.cos(math.radians(angle)) * point.x - math.sin(math.radians(angle)) * point.y
y_ = math.sin(math.radians(angle)) * point.x + math.cos(math.radians(angle)) * point.y
return carla.Vector3D(x_, y_, point.z)
def get_traffic_light_waypoints(traffic_light, carla_map):
"""
get the trigger volume location and the waypoints of the lanes affected by a given traffic light
"""
base_transform = traffic_light.get_transform()
base_loc = traffic_light.get_location()
base_rot = base_transform.rotation.yaw
area_loc = base_transform.transform(traffic_light.trigger_volume.location)
# Discretize the trigger box into points
area_ext = traffic_light.trigger_volume.extent
x_values = np.arange(-0.9 * area_ext.x, 0.9 * area_ext.x, 1.0) # 0.9 to avoid crossing to adjacent lanes
area = []
for x in x_values:
point = rotate_point(carla.Vector3D(x, 0, area_ext.z), base_rot)
point_location = area_loc + carla.Location(x=point.x, y=point.y)
area.append(point_location)
# Get the waypoints of these points, removing duplicates
ini_wps = []
for pt in area:
wpx = carla_map.get_waypoint(pt)
# As x_values are arranged in order, only the last one has to be checked
if not ini_wps or ini_wps[-1].road_id != wpx.road_id or ini_wps[-1].lane_id != wpx.lane_id:
ini_wps.append(wpx)
# Advance them until the intersection
wps = []
eu_wps = []
for wpx in ini_wps:
distance_to_light = base_loc.distance(wpx.transform.location)
eu_wps.append(wpx)
next_distance_to_light = distance_to_light + 1.0
while not wpx.is_intersection:
next_wp = wpx.next(0.5)[0]
next_distance_to_light = base_loc.distance(next_wp.transform.location)
if next_wp and not next_wp.is_intersection \
and next_distance_to_light <= distance_to_light:
eu_wps.append(next_wp)
distance_to_light = next_distance_to_light
wpx = next_wp
else:
break
if not next_distance_to_light <= distance_to_light and len(eu_wps) >= 4:
wps.append(eu_wps[-4])
else:
wps.append(wpx)
return area_loc, wps
def lidar_to_ego_coordinate(config, lidar):
"""
Converts the LiDAR points given by the simulator into the ego agent's
coordinate system.
:param config: GlobalConfig, used to read out the LiDAR orientation and location
:param lidar: the LiDAR point cloud as provided in the input of run_step
:return: LiDAR points expressed w.r.t. 0/0/0 of the car in the CARLA
coordinate system.
"""
yaw = np.deg2rad(config.lidar_rot[2])
rotation_matrix = np.array([[np.cos(yaw), -np.sin(yaw), 0.0], [np.sin(yaw), np.cos(yaw), 0.0], [0.0, 0.0, 1.0]])
translation = np.array(config.lidar_pos)
# The double transpose is a trick to compute all the points together.
ego_lidar = (rotation_matrix @ lidar[1][:, :3].T).T + translation
return ego_lidar
def algin_lidar(lidar, translation, yaw):
"""
Translates and rotates a LiDAR point cloud into a new coordinate system.
The applied transform is the inverse of the given translation and yaw.
:param lidar: numpy LiDAR point cloud (N,3)
:param translation: (x, y, z) translation in meters
:param yaw: yaw angle in radians
:return: numpy LiDAR point cloud in the new coordinate system.
"""
rotation_matrix = np.array([[np.cos(yaw), -np.sin(yaw), 0.0], [np.sin(yaw), np.cos(yaw), 0.0], [0.0, 0.0, 1.0]])
aligned_lidar = (rotation_matrix.T @ (lidar - translation).T).T
return aligned_lidar
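# Hedged illustrative sketch (not part of the original module): aligns a point cloud recorded
# at a previous ego pose into the current ego frame. The relative pose values are made up.
def _example_align_previous_lidar(previous_lidar):
  relative_translation = np.array([1.5, 0.0, 0.0])  # ego moved 1.5 m forward since the scan
  relative_yaw = np.deg2rad(5.0)  # and turned by 5 degrees
  return algin_lidar(previous_lidar, relative_translation, relative_yaw)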
def inverse_conversion_2d(point, translation, yaw):
"""
Converts a global 2D point into the coordinate system defined by the given
translation and yaw (the inverse of that frame's pose).
:param point: Point to be converted
:param translation: 2D translation vector of the new coordinate system
:param yaw: yaw in radians of the new coordinate system
:return: Converted point
"""
rotation_matrix = np.array([[np.cos(yaw), -np.sin(yaw)], [np.sin(yaw), np.cos(yaw)]])
converted_point = rotation_matrix.T @ (point - translation)
return converted_point
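# Hedged illustrative sketch (not part of the original module): converts a point given in
# global coordinates into a local frame defined by its global position and yaw.
def _example_point_to_local_frame():
  global_point = np.array([10.0, 5.0])
  frame_origin = np.array([8.0, 5.0])
  frame_yaw = np.deg2rad(90.0)
  # The point lies 2 m ahead of the origin along global x; in a frame rotated by 90 degrees
  # it ends up at approximately (0, -2).
  return inverse_conversion_2d(global_point, frame_origin, frame_yaw)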
def preprocess_compass(compass):
"""
Checks the compass for NaNs and rotates it into the default CARLA coordinate
system with range [-pi, pi].
:param compass: compass value provided by the IMU, in radians
:return: yaw of the car in radian in the CARLA coordinate system.
"""
if math.isnan(compass): # simulation bug
compass = 0.0
# The minus 90.0 degrees is because the compass sensor uses a different
# coordinate system than CARLA. Check the coordinate_sytems.txt file
compass = normalize_angle(compass - np.deg2rad(90.0))
return compass
def get_relative_transform(ego_matrix, vehicle_matrix):
"""
Returns the position of the vehicle matrix in the ego coordinate system.
:param ego_matrix: ndarray 4x4 Matrix of the ego vehicle in global
coordinates
:param vehicle_matrix: ndarray 4x4 Matrix of another actor in global
coordinates
:return: ndarray position of the other vehicle in the ego coordinate system
"""
relative_pos = vehicle_matrix[:3, 3] - ego_matrix[:3, 3]
rot = ego_matrix[:3, :3].T
relative_pos = rot @ relative_pos
return relative_pos
def extract_yaw_from_matrix(matrix):
"""Extracts the yaw from a CARLA world matrix"""
yaw = math.atan2(matrix[1, 0], matrix[0, 0])
yaw = normalize_angle(yaw)
return yaw
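# Hedged illustrative sketch (not part of the original module): derives the relative position
# and heading of another actor from two 4x4 world matrices
# (e.g. np.array(carla.Transform.get_matrix())).
def _example_relative_pose(ego_matrix, vehicle_matrix):
  relative_position = get_relative_transform(ego_matrix, vehicle_matrix)
  relative_yaw = normalize_angle(extract_yaw_from_matrix(vehicle_matrix) - extract_yaw_from_matrix(ego_matrix))
  return relative_position, relative_yaw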
# Taken from https://stackoverflow.com/a/47381058/9173068
def trapez(y, y0, w):
return np.clip(np.minimum(y + 1 + w / 2 - y0, -y + 1 + w / 2 + y0), 0, 1)
def weighted_line(r0, c0, r1, c1, w, rmin=0, rmax=np.inf):
# The algorithm below works fine if c1 >= c0 and c1-c0 >= abs(r1-r0).
# If either of these conditions is violated, do some switches.
if abs(c1 - c0) < abs(r1 - r0):
# Switch x and y, and switch again when returning.
xx, yy, val = weighted_line(c0, r0, c1, r1, w, rmin=rmin, rmax=rmax) # pylint: disable=locally-disabled, arguments-out-of-order
return (yy, xx, val)
# At this point we know that the distance in columns (x) is greater
# than that in rows (y). Possibly one more switch if c0 > c1.
if c0 > c1:
return weighted_line(r1, c1, r0, c0, w, rmin=rmin, rmax=rmax) # pylint: disable=locally-disabled, arguments-out-of-order
# The following is now always < 1 in abs
if (c1 - c0) != 0.0:
slope = (r1 - r0) / (c1 - c0)
else:
slope = 0.0
# Adjust weight by the slope
w *= np.sqrt(1 + np.abs(slope)) / 2
# We write y as a function of x, because the slope is always <= 1
# (in absolute value)
x = np.arange(c0, c1 + 1, dtype=float)
if (c1 - c0) != 0.0:
y = x * slope + (c1 * r0 - c0 * r1) / (c1 - c0)
else:
y = np.zeros_like(x)
# Now instead of 2 values for y, we have 2*np.ceil(w/2).
# All values are 1 except the uppermost and bottommost.
thickness = np.ceil(w / 2)
yy = (np.floor(y).reshape(-1, 1) + np.arange(-thickness - 1, thickness + 2).reshape(1, -1))
xx = np.repeat(x, yy.shape[1])
vals = trapez(yy, y.reshape(-1, 1), w).flatten()
yy = yy.flatten()
# Exclude useless parts and those outside of the interval
# to avoid parts outside of the picture
mask = np.logical_and.reduce((yy >= rmin, yy < rmax, vals > 0))
return (yy[mask].astype(int), xx[mask].astype(int), vals[mask])
def draw_line(img, start_row, start_column, end_row, end_column, color=(255, 255, 255), thickness=1, rmax=256):
if start_row == end_row and start_column == end_column:
rr, cc, val = start_row, start_column, 1.0
else:
rr, cc, val = weighted_line(r0=start_row, c0=start_column, r1=end_row, c1=end_column, w=thickness, rmax=rmax)
img[rr, cc, 0] = val * color[0] + (1.0 - val) * img[rr, cc, 0]
img[rr, cc, 1] = val * color[1] + (1.0 - val) * img[rr, cc, 1]
img[rr, cc, 2] = val * color[2] + (1.0 - val) * img[rr, cc, 2]
return img
def draw_box(img, box, color=(255, 255, 255), pixel_per_meter=4, thickness=1):
translation = np.array([[box[0], box[1]]])
width = box[2]
height = box[3]
yaw = box[4]
rotation_matrix = np.array([[np.cos(yaw), -np.sin(yaw)], [np.sin(yaw), np.cos(yaw)]])
speed = box[5] * pixel_per_meter
speed_coords = np.array([[0.0, 0.0], [0.0, speed]])
corners = np.array([[-width, -height], [width, -height], [width, height], [-width, height]])
corner_global = (rotation_matrix @ corners.T).T + translation
speed_coords_global = (rotation_matrix @ speed_coords.T).T + translation
corner_global = corner_global.astype(np.int64)
speed_coords_global = speed_coords_global.astype(np.int64)
# Only the center is guaranteed to be within the image. Need to clip the corner points.
max_row = img.shape[0]
max_column = img.shape[1]
corner_global[:, 0] = np.clip(corner_global[:, 0], a_min=0, a_max=max_row - 1)
corner_global[:, 1] = np.clip(corner_global[:, 1], a_min=0, a_max=max_column - 1)
speed_coords_global[:, 0] = np.clip(speed_coords_global[:, 0], a_min=0, a_max=max_row - 1)
speed_coords_global[:, 1] = np.clip(speed_coords_global[:, 1], a_min=0, a_max=max_column - 1)
img = draw_line(img,
start_row=corner_global[0, 0],
start_column=corner_global[0, 1],
end_row=corner_global[1, 0],
end_column=corner_global[1, 1],
color=color,
thickness=thickness,
rmax=max_row)
img = draw_line(img,
start_row=corner_global[1, 0],
start_column=corner_global[1, 1],
end_row=corner_global[2, 0],
end_column=corner_global[2, 1],
color=color,
thickness=thickness,
rmax=max_row)
img = draw_line(img,
start_row=corner_global[2, 0],
start_column=corner_global[2, 1],
end_row=corner_global[3, 0],
end_column=corner_global[3, 1],
color=color,
thickness=thickness,
rmax=max_row)
img = draw_line(img,
start_row=corner_global[3, 0],
start_column=corner_global[3, 1],
end_row=corner_global[0, 0],
end_column=corner_global[0, 1],
color=color,
thickness=thickness,
rmax=max_row)
img = draw_line(img,
start_row=speed_coords_global[0, 0],
start_column=speed_coords_global[0, 1],
end_row=speed_coords_global[1, 0],
end_column=speed_coords_global[1, 1],
color=color,
thickness=thickness,
rmax=max_row)
return img
class PIDController(object):
"""
PID controller that converts waypoints to steer, brake and throttle commands
"""
def __init__(self, k_p=1.0, k_i=0.0, k_d=0.0, n=20):
self.k_p = k_p
self.k_i = k_i
self.k_d = k_d
self.window = deque([0 for _ in range(n)], maxlen=n)
def step(self, error):
self.window.append(error)
if len(self.window) >= 2:
integral = np.mean(self.window)
derivative = self.window[-1] - self.window[-2]
else:
integral = 0.0
derivative = 0.0
return self.k_p * error + self.k_i * integral + self.k_d * derivative
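# Hedged illustrative sketch (not part of the original module): a minimal longitudinal control
# step built on PIDController. Gains and clipping are illustrative, not the agent's values.
def _example_longitudinal_control(current_speed, target_speed, speed_controller):
  # speed_controller is a PIDController instance, e.g. PIDController(k_p=1.0, k_i=0.05, k_d=0.1)
  control = speed_controller.step(target_speed - current_speed)
  throttle = float(np.clip(control, 0.0, 1.0))
  brake = float(np.clip(-control, 0.0, 1.0))
  return throttle, brake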
def gaussian_focal_loss(pred, gaussian_target, alpha=2.0, gamma=4.0, reduction='mean'):
""" Adapted from mmdetection
Args:
pred (torch.Tensor): The prediction.
gaussian_target (torch.Tensor): The learning target of the prediction
in gaussian distribution.
alpha (float, optional): A balanced form for Focal Loss.
Defaults to 2.0.
gamma (float, optional): The gamma for calculating the modulating
factor. Defaults to 4.0.
"""
eps = 1e-12
pos_weights = gaussian_target.eq(1)
neg_weights = (1 - gaussian_target).pow(gamma)
pos_loss = -(pred + eps).log() * (1 - pred).pow(alpha) * pos_weights
neg_loss = -(1 - pred + eps).log() * pred.pow(alpha) * neg_weights
loss = pos_loss + neg_loss
if reduction == 'mean':
loss = loss.mean()
elif reduction == 'sum':
loss = loss.sum()
# All other reductions will be no reduction.
return loss
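# Hedged illustrative sketch (not part of the original module): evaluates the focal loss on a
# dummy center-point heatmap. Shapes and values are illustrative only.
def _example_gaussian_focal_loss():
  pred = torch.sigmoid(torch.randn(1, 1, 64, 64))  # predicted heatmap with values in (0, 1)
  target = torch.zeros(1, 1, 64, 64)
  target[0, 0, 32, 32] = 1.0  # single positive center; Gaussian tails omitted for brevity
  return gaussian_focal_loss(pred, target)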
def bb_vehicle_to_image_system(box, pixels_per_meter, min_x, min_y):
"""
Changes a bounding box from the vehicle x front, y right coordinate system
to the x back, y right coordinate system of an image, where the center of
the car is in the center of the image.
:return:
"""
# Multiply position and extent by pixels_per_meter to convert the unit from meters to pixels
box[:4] = box[:4] * pixels_per_meter
# Pixel coordinates is y front, x right. CARLA is x front, y right.
# So we need to swap the axes to convert the coordinates.
box[0], box[1] = box[1], box[0]
box[2], box[3] = box[3], box[2]
# Compute pixel location that represents 0/0 in the image
translation = np.array([-(min_x * pixels_per_meter), -(min_y * pixels_per_meter)])
# Shift the coordinates so that the ego_vehicle is at the center of the image
box[:2] = box[:2] + translation
box[4] = -box[4]
return box
def bb_image_to_vehicle_system(box, pixels_per_meter, min_x, min_y):
"""
Changes a bounding box from the x back, y right coordinate system of an
image, where the center of the car is in the center of the image, back to
the vehicle x front, y right coordinate system.
:return:
"""
box[4] = -box[4]
# Compute pixel location that represents 0/0 in the image
translation = np.array([-(min_x * pixels_per_meter), -(min_y * pixels_per_meter)])
# Shift the coordinates so that the ego_vehicle is at [0,0]
box[:2] = box[:2] - translation
# Pixel coordinates is y front, x right. CARLA is x front, y right.
# So we need to swap the axes to convert the coordinates.
box[0], box[1] = box[1], box[0]
box[2], box[3] = box[3], box[2]
# Divide position and extent by pixels_per_meter to convert the unit from pixels to meters
box[:4] = box[:4] / pixels_per_meter
return box
def non_maximum_suppression(bounding_boxes, iou_treshhold):
filtered_boxes = []
bounding_boxes = np.array(list(itertools.chain.from_iterable(bounding_boxes)), dtype=object)
if bounding_boxes.size == 0:  # If no bounding boxes are detected, we can't do NMS
return filtered_boxes
confidences_indices = np.argsort(bounding_boxes[:, -1])
while len(confidences_indices) > 0:
idx = confidences_indices[-1]
current_bb = bounding_boxes[idx]
filtered_boxes.append(current_bb)
# Remove last element from the list
confidences_indices = confidences_indices[:-1]
if len(confidences_indices) == 0:
break
for idx2 in deepcopy(confidences_indices):
if iou_bbs(current_bb, bounding_boxes[idx2]) > iou_treshhold: # Remove BB from list
confidences_indices = confidences_indices[confidences_indices != idx2]
return filtered_boxes
def rect_polygon(x, y, width, height, angle):
"""Return a shapely Polygon describing the rectangle with centre at
(x, y) and the given width and height, rotated by angle quarter-turns.
"""
p = Polygon([(-width, -height), (width, -height), (width, height), (-width, height)])
# Shapely is very inefficient at these operations, worth rewriting
return shapely.affinity.translate(shapely.affinity.rotate(p, angle, use_radians=True), x, y)
def iou_bbs(bb1, bb2):
a = rect_polygon(bb1[0], bb1[1], bb1[2], bb1[3], bb1[4])
b = rect_polygon(bb2[0], bb2[1], bb2[2], bb2[3], bb2[4])
intersection_area = a.intersection(b).area
union_area = a.union(b).area
iou = intersection_area / union_area
return iou
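# Hedged illustrative sketch (not part of the original module): IoU between two axis-aligned
# boxes in the [x, y, extent_x, extent_y, yaw] format consumed by rect_polygon / iou_bbs.
def _example_iou():
  box_a = np.array([0.0, 0.0, 1.0, 1.0, 0.0])  # spans [-1, 1] x [-1, 1]
  box_b = np.array([1.0, 0.0, 1.0, 1.0, 0.0])  # spans [0, 2] x [-1, 1]
  # Intersection area 2, union area 6 -> IoU = 1/3.
  return iou_bbs(box_a, box_b)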
def dot_product(vector1, vector2):
return vector1.x * vector2.x + vector1.y * vector2.y + vector1.z * vector2.z
def cross_product(vector1, vector2):
return carla.Vector3D(x=vector1.y * vector2.z - vector1.z * vector2.y,
y=vector1.z * vector2.x - vector1.x * vector2.z,
z=vector1.x * vector2.y - vector1.y * vector2.x)
def get_separating_plane(r_pos, plane, obb1, obb2):
''' Checks if there is a separating plane
r_pos Vec3
plane Vec3
obb1 Bounding Box
obb2 Bounding Box
'''
return (abs(dot_product(r_pos, plane)) >
(abs(dot_product((obb1.rotation.get_forward_vector() * obb1.extent.x), plane)) +
abs(dot_product((obb1.rotation.get_right_vector() * obb1.extent.y), plane)) +
abs(dot_product((obb1.rotation.get_up_vector() * obb1.extent.z), plane)) +
abs(dot_product((obb2.rotation.get_forward_vector() * obb2.extent.x), plane)) +
abs(dot_product((obb2.rotation.get_right_vector() * obb2.extent.y), plane)) +
abs(dot_product((obb2.rotation.get_up_vector() * obb2.extent.z), plane))))
def check_obb_intersection(obb1, obb2):
  '''
  Checks whether two bounding boxes intersect.
  Rather complex looking because it is the general separating-axis algorithm for 3D oriented bounding boxes.
  '''
  r_pos = obb2.location - obb1.location
  obb1_axes = (obb1.rotation.get_forward_vector(), obb1.rotation.get_right_vector(), obb1.rotation.get_up_vector())
  obb2_axes = (obb2.rotation.get_forward_vector(), obb2.rotation.get_right_vector(), obb2.rotation.get_up_vector())
  # Candidate separating axes: the face normals of both boxes and the cross products of their edge directions.
  candidate_axes = list(obb1_axes) + list(obb2_axes) + [cross_product(a, b) for a in obb1_axes for b in obb2_axes]
  # The boxes intersect if and only if no candidate axis separates them.
  return not any(get_separating_plane(r_pos, axis, obb1, obb2) for axis in candidate_axes)
def command_to_one_hot(command):
if command < 0:
command = 4
command -= 1
if command not in [0, 1, 2, 3, 4, 5]:
command = 3
cmd_one_hot = [0.0, 0.0, 0.0, 0.0, 0.0, 0.0]
cmd_one_hot[command] = 1.0
return np.array(cmd_one_hot)
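# Hedged illustrative sketch (not part of the original module): assuming the usual CARLA
# RoadOption numbering (1=LEFT, 2=RIGHT, 3=STRAIGHT, 4=LANEFOLLOW, 5=CHANGELANELEFT,
# 6=CHANGELANERIGHT), LANEFOLLOW is encoded at index 3 of the one-hot vector.
def _example_command_encoding():
  return command_to_one_hot(4)  # -> array([0., 0., 0., 1., 0., 0.])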
class InfoDummy(object):
""" Info dummy that tries to mimic TIMMs info class"""
def __init__(self, info):
super().__init__()
self.info = info
def calculate_intrinsic_matrix(fov, height, width):
""" Intrinsics and extrinsics for a single camera.
adapted from MILE
https://github.com/wayveai/mile/blob/247280758b40ae999a5de14a8423f0d4db2655ac/mile/data/dataset.py#L194
"""
# Intrinsics
f = width / (2.0 * np.tan(fov * np.pi / 360.0))
cx = width / 2.0
cy = height / 2.0
intrinsics = np.array([[f, 0.0, cx], [0.0, f, cy], [0.0, 0.0, 1.0]])
return intrinsics
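# Hedged illustrative sketch (not part of the original module): intrinsics for a hypothetical
# camera with a 100 degree horizontal FOV and a 1024x256 image; the principal point sits at
# the image center and the focal length follows from f = width / (2 * tan(fov / 2)).
def _example_intrinsics():
  return calculate_intrinsic_matrix(fov=100.0, height=256, width=1024)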
def normalize_imagenet(x):
""" Normalize input images according to ImageNet standards.
Args:
x (tensor): input images
"""
x = x.clone()
x[:, 0] = ((x[:, 0] / 255.0) - 0.485) / 0.229
x[:, 1] = ((x[:, 1] / 255.0) - 0.456) / 0.224
x[:, 2] = ((x[:, 2] / 255.0) - 0.406) / 0.225
return x
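# Hedged illustrative sketch (not part of the original module): normalizes a dummy batch of
# RGB images in [0, 255] with shape (batch, 3, height, width) to ImageNet statistics.
def _example_normalize_batch():
  images = torch.rand(2, 3, 224, 224) * 255.0
  return normalize_imagenet(images)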
class CarlaActorDummy(object):
"""
Actor dummy structure used to simulate a CARLA actor for data augmentation
"""
world = None
bounding_box = None
transform = None
id = None
def __init__(self, world, bounding_box, transform, id): # pylint: disable=locally-disabled, redefined-builtin
self.world = world
self.bounding_box = bounding_box
self.transform = transform
self.id = id
def get_world(self):
return self.world
def get_transform(self):
return self.transform
def get_bounding_box(self):
return self.bounding_box
def convert_depth(data):
"""
Computes the normalized depth from a CARLA depth map.
"""
data = data.astype(np.float32)
normalized = np.dot(data, [65536.0, 256.0, 1.0])
normalized /= (256 * 256 * 256 - 1)
# in_meters = 1000 * normalized
# clip to 50 meters
normalized = np.clip(normalized, a_min=0.0, a_max=0.05)
normalized = normalized * 20.0 # Rescale map to lie in [0,1]
return normalized
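# Hedged worked example (not part of the original module): decodes a single depth pixel.
# The first channel is weighted by 65536, the second by 256 and the third by 1, the sum is
# divided by 2^24 - 1, clipped at 0.05 (i.e. 50 m of the 1000 m range) and rescaled by 20.
def _example_convert_depth_pixel():
  pixel = np.array([[[0, 50, 0]]], dtype=np.uint8)  # shape (1, 1, 3)
  return convert_depth(pixel)  # 50 * 256 / 16777215 / 0.05 -> roughly 0.0153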
def create_projection_grid(config):
"""
Creates a voxel grid around the car with each voxel containing the pixel index indicating the pixel
it would land on if you project it into the camera of the car with a pinhole camera model.
Also returns a valid mask indicating which voxels are visible from the camera.
Because the coordinates are in normalized display coordinates, the image can also be a down-sampled version.
:return: grid: voxel grid around the car. Each voxel contains the index of the corresponding camera pixel (x, y, 0).
Coordinates are in normalized display coordinates [-1, 1].
(-1,-1) is the top left pixel, (1,1) is the bottom right pixel.
all_valid: The same voxel grid containing a bool that indicates whether the voxel is visible from the
camera.
"""
meters_per_pixel = 1.0 / config.pixels_per_meter
# + half a pixel because we want the center of the voxel.
depths = torch.arange(config.min_x, config.max_x, meters_per_pixel) + (meters_per_pixel * 0.5)
widths = torch.arange(config.min_y, config.max_y, meters_per_pixel) + (meters_per_pixel * 0.5)
meters_per_pixel_height = meters_per_pixel * config.bev_grid_height_downsample_factor
heights = torch.arange(config.min_z_projection, config.max_z_projection,
meters_per_pixel_height) + (meters_per_pixel_height * 0.5)
depths, widths, heights = torch.meshgrid(depths, widths, heights, indexing='ij')
test_cloud = torch.stack((depths, widths, heights), dim=0) # CARLA coordinate system
_, d, w, h = test_cloud.shape # channel, depth, width, height
# If you rotate the camera adjust the rotation matrix here
assert config.camera_rot_0[0] == config.camera_rot_0[1] == config.camera_rot_0[2] == 0.0
rotation_matrix = torch.tensor([[1.0, 0.0, 0.0], [0.0, 1.0, 0.0], [0.0, 0.0, 1.0]])
t = torch.tensor(config.camera_pos).unsqueeze(1)
test_cloud2 = (rotation_matrix.T @ test_cloud.view(3, -1)) - (rotation_matrix.T @ t)
# Convert CARLA coordinate system x front, y right, z up to pinhole coordinate system: x right, y down, z front
test_cloud2 = torch.stack((test_cloud2[1], test_cloud2[2], test_cloud2[0]))
# Apply intrinsic camera matrix
intrinsic_matrix = torch.from_numpy(
calculate_intrinsic_matrix(fov=config.camera_fov, height=config.camera_height,
width=config.camera_width)).to(dtype=torch.float32)
test_cloud2 = intrinsic_matrix @ test_cloud2
depths = test_cloud2[2:3]
grid = torch.zeros_like(test_cloud2).to(dtype=torch.float32)
# Project to image coordinates using pinhole camera model
# The depth grid is designed so that the smallest number is +-0.125. Prevent division by 0 if you change it.
grid[:2] = test_cloud2[:2] / depths
# Note that the points themselves are in pinhole camera coordinates, but the index in the grid represents the voxel
# in the 3D volume
grid = grid.view(3, d, w, h)
width_valid = grid[0:1] >= 0.0
width_valid2 = grid[0:1] < config.camera_width
width_valid = torch.logical_and(width_valid, width_valid2)
height_valid = grid[1:2] >= 0.0
height_valid2 = grid[1:2] < config.camera_height
height_valid = torch.logical_and(height_valid, height_valid2)
depths = depths.view(1, d, w, h)
depth_valid = depths > 0.0
all_valid = torch.logical_and(width_valid, height_valid)
all_valid = torch.logical_and(all_valid, depth_valid)
# Normalizes pixel values to [-1, 1] normalized display coordinates
grid[0:1] = (grid[0:1] / (0.5 * config.camera_width - 0.5)) - 1.0
grid[1:2] = (grid[1:2] / (0.5 * config.camera_height - 0.5)) - 1.0
grid = torch.reshape(grid, [1, 3, d, w, h, 1])
grid = torch.transpose(grid, 1, 5).squeeze(1)
return grid, all_valid.to(dtype=torch.float32)
class PerspectiveDecoder(nn.Module):
"""
Decodes a low resolution perspective grid to a full resolution output. E.g. semantic segmentation, depth
"""
def __init__(self, in_channels, out_channels, inter_channel_0, inter_channel_1, inter_channel_2, scale_factor_0,
scale_factor_1):
super().__init__()
self.scale_factor_0 = scale_factor_0
self.scale_factor_1 = scale_factor_1
self.deconv1 = nn.Sequential(
nn.Conv2d(in_channels, inter_channel_0, 3, 1, 1),
nn.ReLU(True),
nn.Conv2d(inter_channel_0, inter_channel_1, 3, 1, 1),
nn.ReLU(True),
)
self.deconv2 = nn.Sequential(
nn.Conv2d(inter_channel_1, inter_channel_2, 3, 1, 1),
nn.ReLU(True),
nn.Conv2d(inter_channel_2, inter_channel_2, 3, 1, 1),
nn.ReLU(True),
)
self.deconv3 = nn.Sequential(
nn.Conv2d(inter_channel_2, inter_channel_2, 3, 1, 1),
nn.ReLU(True),
nn.Conv2d(inter_channel_2, out_channels, 3, 1, 1),
)
def forward(self, x):
x = self.deconv1(x)
x = F.interpolate(x, scale_factor=self.scale_factor_0, mode='bilinear', align_corners=False)
x = self.deconv2(x)
x = F.interpolate(x, scale_factor=self.scale_factor_1, mode='bilinear', align_corners=False)
x = self.deconv3(x)
return x
def draw_probability_boxes(img, speed_prob, target_speeds, color=(128, 128, 128), color_selected=(255, 165, 0)):
speed_index = np.argmax(speed_prob)
colors = [color for _ in range(len(speed_prob))]
colors[speed_index] = color_selected
start_x = 0
start_y = img.shape[0] - 155 - 150  # start_x and start_y specify the position of the upper left corner of the box
width_bar = 20 * 4
width_space = 10
cv2.rectangle(img, (start_x, start_y), (1024, start_y + 155), (255, 255, 255), cv2.FILLED)
for idx, s in enumerate(speed_prob):
start = start_x + idx * (width_space + width_bar)
cv2.rectangle(img, (start, start_y + 130), (start + width_bar, start_y + 130 - int(s * 100)), colors[idx],
cv2.FILLED)
cv2.putText(img, f'{s:.2f}', (int(start + 0.33 * width_bar), start_y + 127 - int(s * 100)),
cv2.FONT_HERSHEY_SIMPLEX, 0.4, (0, 0, 0), 1, cv2.LINE_AA)
# 3.6 is conversion from m/s to km/h
cv2.putText(img, f'{int(round(target_speeds[idx] * 3.6)):02d}', (int(start + 0.33 * width_bar), start_y + 150),
cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 0), 1, cv2.LINE_AA)
cv2.putText(img, 'km/h', (start + width_bar + width_space, start_y + 150), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 0),
1, cv2.LINE_AA)
def plant_quant_to_box(config, pred_bounding_boxes):
"""Convert a plant auxiliary class to an x,y location of a box"""
pred_bb_x = F.softmax(pred_bounding_boxes[0][0], dim=1)
pred_bb_y = F.softmax(pred_bounding_boxes[1][0], dim=1)
pred_bb_ext_x = F.softmax(pred_bounding_boxes[2][0], dim=1)
pred_bb_ext_y = F.softmax(pred_bounding_boxes[3][0], dim=1)
pred_bb_yaw = F.softmax(pred_bounding_boxes[4][0], dim=1)
pred_bb_speed = F.softmax(pred_bounding_boxes[5][0], dim=1)
pred_bb_x = torch.argmax(pred_bb_x, dim=1)
pred_bb_y = torch.argmax(pred_bb_y, dim=1)
pred_bb_ext_x = torch.argmax(pred_bb_ext_x, dim=1)
pred_bb_ext_y = torch.argmax(pred_bb_ext_y, dim=1)
pred_bb_yaw = torch.argmax(pred_bb_yaw, dim=1)
pred_bb_speed = torch.argmax(pred_bb_speed, dim=1)
x_step = (config.max_x - config.min_x) / pow(2, config.plant_precision_pos)
y_step = (config.max_y - config.min_y) / pow(2, config.plant_precision_pos)
extent_step = (30) / pow(2, config.plant_precision_pos)
yaw_step = (2 * np.pi) / pow(2, config.plant_precision_angle)
speed_step = (config.plant_max_speed_pred / 3.6) / pow(2, config.plant_precision_speed)
pred_bb_x = pred_bb_x * x_step - config.max_x
pred_bb_y = pred_bb_y * y_step - config.max_y
pred_bb_ext_x = pred_bb_ext_x * extent_step
pred_bb_ext_y = pred_bb_ext_y * extent_step
pred_bb_yaw = pred_bb_yaw * yaw_step - np.pi
pred_bb_speed = pred_bb_speed * speed_step
pred_bb_center = torch.stack((pred_bb_x, pred_bb_y, pred_bb_ext_x, pred_bb_ext_y, pred_bb_yaw, pred_bb_speed), dim=1)
return pred_bb_center
def circle_line_segment_intersection(circle_center, circle_radius, pt1, pt2, full_line=True, tangent_tol=1e-9):
""" Find the points at which a circle intersects a line-segment. This can happen at 0, 1, or 2 points.
:param circle_center: The (x, y) location of the circle center
:param circle_radius: The radius of the circle
:param pt1: The (x, y) location of the first point of the segment
:param pt2: The (x, y) location of the second point of the segment
:param full_line: True to find intersections along full line - not just in the segment.
False will just return intersections within the segment.
:param tangent_tol: Numerical tolerance at which we decide the intersections are close enough to consider it a
tangent
:return Sequence[Tuple[float, float]]: A list of length 0, 1, or 2, where each element is a point at which the
circle intercepts a line segment.
Note: We follow: http://mathworld.wolfram.com/Circle-LineIntersection.html
Credit: https://stackoverflow.com/a/59582674/9173068
"""
if np.linalg.norm(pt1 - pt2) < 0.000000001:
print('Problem')
(p1x, p1y), (p2x, p2y), (cx, cy) = pt1, pt2, circle_center
(x1, y1), (x2, y2) = (p1x - cx, p1y - cy), (p2x - cx, p2y - cy)
dx, dy = (x2 - x1), (y2 - y1)
dr = (dx**2 + dy**2)**.5
big_d = x1 * y2 - x2 * y1
discriminant = circle_radius**2 * dr**2 - big_d**2
if discriminant < 0: # No intersection between circle and line
return []
else: # There may be 0, 1, or 2 intersections with the segment
# This makes sure the order along the segment is correct
intersections = [(cx + (big_d * dy + sign * (-1 if dy < 0 else 1) * dx * discriminant**.5) / dr**2,
cy + (-big_d * dx + sign * abs(dy) * discriminant**.5) / dr**2)
for sign in ((1, -1) if dy < 0 else (-1, 1))]
if not full_line: # If only considering the segment, filter out intersections that do not fall within the segment
fraction_along_segment = [(xi - p1x) / dx if abs(dx) > abs(dy) else (yi - p1y) / dy for xi, yi in intersections]
intersections = [pt for pt, frac in zip(intersections, fraction_along_segment) if 0 <= frac <= 1]
# If line is tangent to circle, return just one point (as both intersections have same location)
if len(intersections) == 2 and abs(discriminant) <= tangent_tol:
return [intersections[0]]
else:
return intersections
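# Hedged illustrative sketch (not part of the original module): intersects the unit circle with
# a horizontal segment through its center; the two crossings are at (-1, 0) and (1, 0).
def _example_circle_intersection():
  segment_start = np.array([-2.0, 0.0])
  segment_end = np.array([2.0, 0.0])
  return circle_line_segment_intersection(np.array([0.0, 0.0]), 1.0, segment_start, segment_end, full_line=False)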
def crop_array(config, images_i): # images_i must have dimensions (H,W,C) or (H,W)
"""
Crop rgb images to the desired height and width
"""
if config.crop_image:
# crops rgb/depth/semantics from the bottom to cropped_height and symmetrically from both sides to cropped_width
assert config.cropped_height <= images_i.shape[0]
assert config.cropped_width <= images_i.shape[1]
side_crop_amount = (images_i.shape[1] - config.cropped_width) // 2
if len(images_i.shape) > 2: # for rgb, we have 3 channels
return images_i[0:config.cropped_height, side_crop_amount:images_i.shape[1] - side_crop_amount, :]
else: # for depth and semantics, there is no channel dimension
return images_i[0:config.cropped_height, side_crop_amount:images_i.shape[1] - side_crop_amount]
else:
return images_i