# Uploaded with huggingface_hub by unknownuser6666 (commit 663494c, verified).
import copy
import math
# import pickle5 as pickle
import pickle
from typing import Dict, Tuple
import numpy as np
# Print numpy arrays with 2 decimals and no scientific notation (debug readability).
np.set_printoptions(precision=2, suppress=True)
def create_transform(location: np.ndarray, rotation: np.ndarray) -> np.ndarray:
    """Create 4x4 transformation matrix from location and rotation
    Args:
        location: (3, ) xyz in the world coordinate (Carla left-handed coords)
        rotation: (3, ) pitch, yaw, roll in degrees
    Returns:
        transform: 4 x 4, the transformation from object to world coordinate
    """
    pitch, yaw, roll = rotation
    c_y, s_y = np.cos(np.radians(yaw)), np.sin(np.radians(yaw))
    c_r, s_r = np.cos(np.radians(roll)), np.sin(np.radians(roll))
    c_p, s_p = np.cos(np.radians(pitch)), np.sin(np.radians(pitch))
    # Use a plain ndarray instead of the deprecated np.matrix; np.matrix also
    # changes slicing semantics downstream (e.g. transform[:3, 3] would be a
    # (3, 1) matrix rather than a (3,) vector).
    transform = np.identity(4)
    # translation part
    transform[:3, 3] = location
    # rotation part (yaw about z, pitch about y, roll about x)
    transform[0, 0] = c_p * c_y
    transform[0, 1] = c_y * s_p * s_r - s_y * c_r
    transform[0, 2] = -c_y * s_p * c_r - s_y * s_r
    transform[1, 0] = s_y * c_p
    transform[1, 1] = s_y * s_p * s_r + c_y * c_r
    transform[1, 2] = -s_y * s_p * c_r + c_y * s_r
    transform[2, 0] = s_p
    transform[2, 1] = -c_p * s_r
    transform[2, 2] = c_p * c_r
    return transform
def transform_matrix_to_vector(transform: np.ndarray) -> Tuple[np.ndarray, np.ndarray]:
    """Recover (location, rotation) from a 4x4 transformation matrix.

    Assumes zero pitch and roll, so the 3x3 rotation block reduces to
        [c_y, -s_y, 0]
        [s_y,  c_y, 0]
        [  0,    0, 1]
    and yaw can be read off the top-left 2x2 block.
    """
    location: np.ndarray = transform[:3, 3]  # (3, )
    # yaw from the 2x2 rotation sub-block
    rot2d: np.ndarray = transform[:2, :2]  # (2, 2)
    yaw: float = math.atan2(rot2d[1, 0], rot2d[0, 0])
    rotation = np.array([0, np.rad2deg(yaw), 0])
    return (location, rotation)
def get_transform_A2C(A2B: np.ndarray, B2C: np.ndarray):
    """Compose two 4x4 transforms: A->C applies A2B first, then B2C.

    Uses the identity (A2B^T @ B2C^T)^T == B2C @ A2B.
    """
    return np.dot(B2C, A2B)
################## GPS
def gps_offset(carla_version: str) -> Tuple[np.ndarray, np.ndarray]:
    """GPS sensor normalization parameters.

    Args:
        carla_version: "0.9.10" (challenge 1.0) or "0.9.9" (old evaluation)
    Returns:
        (mean, scale): each (2, ); applied downstream as (gps - mean) * scale
    Raises:
        ValueError: for an unsupported carla version (previously this surfaced
            as an opaque UnboundLocalError)
    """
    # challenge 1.0
    if carla_version == "0.9.10":
        mean = np.array([0.0, 0.0])  # for carla 9.10
        scale = np.array([111324.60662786, 111319.490945])  # for carla 9.10
    # for old carla evaluation
    elif carla_version == "0.9.9":
        mean = np.array([49.0, 8.0])  # for carla 9.9
        scale = np.array([111324.60662786, 73032.1570362])  # for carla 9.9
    else:
        raise ValueError(f"Unsupported carla version: {carla_version!r}")
    return (mean, scale)
def gps_normalize(gps: np.ndarray, carla_version="0.9.10") -> np.ndarray:
    """Normalize GPS (latitude & longitude) to the typical x,y scale"""
    mean, scale = gps_offset(carla_version)
    normalized: np.ndarray = copy.copy(gps)  # (3, ) — do not mutate the caller's array
    normalized[:2] = (normalized[:2] - mean) * scale
    return normalized
def gps_to_world(gps: np.ndarray) -> np.ndarray:
    """Convert normalized GPS coordinate to world coordinate
    Args:
        gps: (3, )
    """
    out = copy.copy(gps)  # keep the input untouched
    # 90-degree rotation: world x = gps y, world y = -gps x; z unchanged
    out[0], out[1] = gps[1], -gps[0]
    return out
def world_to_gps(gps_world: np.ndarray) -> np.ndarray:
    """Convert world coordinate to normalized GPS coordinate
    Args:
        gps_world: (3, )
    """
    out = copy.copy(gps_world)  # keep the input untouched
    # inverse of gps_to_world: gps x = -world y, gps y = world x; z unchanged
    out[0], out[1] = -gps_world[1], gps_world[0]
    return out
################## IMU
def accelerometer_to_world(accelerometer: np.ndarray) -> np.ndarray:
    """Convert accelerometer from the IMU coords. to world coords

    NOTE(review): mutates `accelerometer` in place and returns the same array;
    callers should not expect the input to be preserved.
    """
    # TODO: accelerometer depends on the yaw
    # accelerometer = gps_to_world(accelerometer)
    # remove gravity (standard gravity constant, 9.80665 m/s^2, from component 2)
    accelerometer[2] -= 9.80665
    return accelerometer
def gyroscope_to_world(gyroscope: np.ndarray) -> np.ndarray:
    """Convert gyroscope from the IMU coords. to world coords

    NOTE(review): mutates `gyroscope` in place — copies component 2 into
    component 1 and zeroes component 2; the mapping is flagged as unverified
    by the TODO below.
    """
    # TODO: check transformation
    gyroscope[1] = gyroscope[2]
    gyroscope[2] = 0
    return gyroscope
def compass_to_rotation(compass: float) -> np.ndarray:
    """Convert a raw compass reading to a (pitch, yaw, roll) rotation.

    The compass is reported in the same frame as GPS, hence the pi/2 offset,
    and is in radians, hence the conversion to degrees.
    """
    yaw = math.degrees(compass - np.pi / 2.0)
    # wrap yaw into [-180, 180]
    if yaw > 180:
        yaw -= 360
    elif yaw < -180:
        yaw += 360
    return np.array([0, yaw, 0])
################## Camera
def get_camera_intrinsics(cam_param: Dict, dim: int = 4) -> np.ndarray:
    """Returns the camera intrinsics matrix
    Args:
        cam_param: include width/height/fov of a camera
        dim: 3 or 4, 4 leads to producing matrix in the homogeneous coordinate
    Returns:
        intrinsics: shape of (3, 3) or (4, 4)
    """
    # principal point: image center
    cx = cam_param["width"] / 2.0
    cy = cam_param["height"] / 2.0
    # focal length from horizontal FOV; square pixels, so fx == fy
    focal = cam_param["width"] / (2.0 * np.tan(cam_param["fov"] * np.pi / 360.0))
    intrinsics = np.identity(dim)
    intrinsics[0, 0] = focal
    intrinsics[1, 1] = focal
    intrinsics[0, 2] = cx
    intrinsics[1, 2] = cy
    return intrinsics
def get_camera_param() -> Dict[str, Dict]:
    """Returns our camera configuration (v1.1), fixed.

    Each entry maps a camera name to:
        width/height: image resolution in pixels
        fov: horizontal field of view in degrees
        yaw/pitch: mounting rotation in degrees
        x/y/z: mounting position w.r.t. the ego vehicle

    Earlier iterations (a 120-degree large-FOV rig that made traffic lights
    too small to detect, a community 64-degree rig with resolution too low
    for 3D detection, and a combined rig from our initial submission) were
    removed as dead code.
    """
    cam_param = {
        "left": {
            "width": 400,
            "height": 300,
            "fov": 100,
            "yaw": -100.0,
            "pitch": 0.0,
            "x": 1.3,
            "y": -0.2,
            "z": 2.3,
        },
        "front": {
            "width": 400,
            "height": 300,
            "fov": 100,
            "yaw": 0.0,
            "pitch": 0.0,
            "x": 1.3,
            "y": 0.0,
            "z": 2.3,
        },
        "right": {
            "width": 400,
            "height": 300,
            "fov": 100,
            "yaw": 100.0,
            "pitch": 0.0,
            "x": 1.3,
            "y": 0.2,
            "z": 2.3,
        },
        # pitched upwards a bit to better leverage the space along height
        "tele": {
            "width": 400,
            "height": 300,
            "fov": 45,
            "yaw": 0.0,
            "pitch": 5,
            "x": 1.5,
            "y": 0.0,
            "z": 2.4,
        },
    }
    return cam_param
def camera_to_ego_transform(cam_param: Dict[str, float]) -> np.ndarray:
    """Build the camera -> ego 4x4 homogeneous transformation matrix.

    Rotation is composed as pitch_rot @ yaw_rot (no roll); the translation is
    the camera mounting position (x, y, z) in the ego frame.
    """
    # yaw: rotation about the z axis
    yaw_rad: float = math.radians(cam_param["yaw"])
    cy, sy = math.cos(yaw_rad), math.sin(yaw_rad)
    yaw_mat = np.array(
        [
            [cy, -sy, 0.0],
            [sy, cy, 0.0],
            [0.0, 0.0, 1.0],
        ]
    )
    # pitch: rotation about the y axis; sign flipped to match CARLA's convention
    pitch_rad: float = math.radians(-cam_param["pitch"])
    cp, sp = math.cos(pitch_rad), math.sin(pitch_rad)
    pitch_mat = np.array(
        [
            [cp, 0.0, sp],
            [0.0, 1.0, 0.0],
            [-sp, 0.0, cp],
        ]
    )
    transform = np.eye(4)
    transform[:3, :3] = np.matmul(pitch_mat, yaw_mat)
    transform[:3, 3] = [cam_param["x"], cam_param["y"], cam_param["z"]]
    return transform
def camera_to_lidar_transform(cam_param: Dict[str, float]) -> np.ndarray:
    """Get camera to lidar 4 x 4 transformation matrix."""
    cam2ego: np.ndarray = camera_to_ego_transform(cam_param)  # 4 x 4
    ego2lidar: np.ndarray = ego_to_lidar_transform()  # 4 x 4
    # (A^T B^T)^T == B A: camera->ego applied first, then ego->lidar
    return np.dot(ego2lidar, cam2ego)
################## LiDAR
def get_lidar_param() -> Dict[str, float]:
    """Returns our lidar configuration, fixed"""
    return {
        "yaw": -90.0,  # mounting rotation in degrees
        "x": 1.3,  # mounting position w.r.t. the ego vehicle
        "y": 0.0,
        "z": 2.5,
    }
def lidar_to_ego_transform() -> np.ndarray:
    """Get lidar to ego 4 x 4 transformation matrix"""
    param: Dict[str, float] = get_lidar_param()
    yaw = math.radians(param["yaw"])
    cy, sy = math.cos(yaw), math.sin(yaw)
    transform = np.eye(4)
    # rotation of the lidar about the z axis
    transform[:3, :3] = np.array(
        [
            [cy, -sy, 0.0],
            [sy, cy, 0.0],
            [0.0, 0.0, 1.0],
        ]
    )
    # mounting position of the lidar w.r.t. the ego vehicle
    transform[:3, 3] = [param["x"], param["y"], param["z"]]
    return transform
def lidar_to_camera_transform(cam_param: Dict[str, float]) -> np.ndarray:
    """Get lidar to camera 4 x 4 transformation matrix (inverse of camera->lidar)."""
    cam2lidar = camera_to_lidar_transform(cam_param)
    return np.linalg.inv(cam2lidar)
def lidar_to_image_transform(cam_param: Dict[str, float]) -> np.ndarray:
    """Get lidar to image (after projection) 4 x 4 transformation matrix"""
    lidar2camera: np.ndarray = lidar_to_camera_transform(cam_param)  # 4 x 4
    intrinsics: np.ndarray = get_camera_intrinsics(cam_param, dim=4)  # 4 x 4
    # (A^T B^T)^T == B A: lidar->camera first, then project with the intrinsics
    return np.dot(intrinsics, lidar2camera)  # 4 x 4
################## Ego
def load_ego2world_transform(ego_file: str) -> np.ndarray:
    """Load pickled ego data and build the ego -> world 4x4 transform.

    NOTE(review): pickle.load is only safe on trusted, locally generated files.
    """
    with open(ego_file, "rb") as fp:
        ego_data: Dict = pickle.load(fp)
    location: np.ndarray = ego_data["location"]  # (3, )
    # the recorded location is at the object's center; shift down by half the
    # height so the transform is anchored at the vehicle's bottom
    location[2] -= ego_data["size"][2] / 2
    rotation: np.ndarray = ego_data["rotation"]  # (3, )
    return create_transform(location, rotation)  # 4 x 4
def ego_to_lidar_transform() -> np.ndarray:
    """Get ego to lidar 4 x 4 transformation matrix (inverse of lidar->ego)."""
    lidar2ego = lidar_to_ego_transform()
    return np.linalg.inv(lidar2ego)
def ego_to_camera_transform(cam_param: Dict[str, float]) -> np.ndarray:
    """Get ego to camera 4 x 4 transformation matrix (inverse of camera->ego)."""
    cam2ego = camera_to_ego_transform(cam_param)
    return np.linalg.inv(cam2ego)