R2SE_model / scripts /data_converter /nuplan /utils /canvas_3d.py

Upload folder using huggingface_hub

663494c verified 2 months ago

17.1 kB

	"""
	Written by Jinhyung Park

	Simple 3D visualization for 3D points & boxes. Intended as a simple, hackable
	alternative to mayavi for certain point cloud tasks.
	"""

	import numpy as np
	import cv2
	import copy
	from functools import partial
	import matplotlib


	class Canvas_3D(object):
	    """
	    A virtual pinhole camera plus an RGB image ("canvas") to draw on.

	    3D points, line segments and boxes given in world coordinates are
	    projected through the camera's extrinsic / intrinsic matrices and
	    rasterized onto ``self.canvas`` (an ``(H, W, 3)`` uint8 array).
	    """

	    # Pairs of corner indices that form the 12 edges of a box, using the
	    # corner ordering produced by _boxes_to_corners.
	    _BOX_EDGES = (
	        (0, 1),
	        (1, 2),
	        (2, 3),
	        (3, 0),
	        (0, 4),
	        (1, 5),
	        (2, 6),
	        (3, 7),
	        (4, 5),
	        (5, 6),
	        (6, 7),
	        (7, 4),
	    )

	    def __init__(
	        self,
	        canvas_shape=(500, 1000),
	        camera_center_coords=(20, -40, 15),
	        camera_focus_coords=(-4 + 0.9396926, 0, 4 - 0.34202014),
	        focal_length=None,
	        canvas_bg_color=(0, 0, 0),
	    ):
	        """
	        Args:
	            canvas_shape (Tuple[Int]): Canvas image size - height & width.
	            camera_center_coords (Tuple[Float]): Location of camera center in
	                3D space. x -> right, y -> front, z -> height
	            camera_focus_coords (Tuple[Float]): Intuitively, what point in 3D
	                space is the camera pointed at? These are absolute coordinates,
	                not relative to camera center.
	            focal_length (None | Int):
	                None: Half of the max of height & width of canvas_shape. This
	                    seems to be a decent default.
	                Int: Specified directly.
	            canvas_bg_color (Tuple[Int]): RGB (0 ~ 255) of canvas background
	                color.
	        """
	        self.canvas_shape = canvas_shape
	        self.H, self.W = self.canvas_shape
	        self.canvas_bg_color = canvas_bg_color

	        self.camera_center_coords = camera_center_coords
	        self.camera_focus_coords = camera_focus_coords

	        if focal_length is None:
	            self.focal_length = max(self.H, self.W) // 2
	        else:
	            self.focal_length = focal_length

	        # Setup extrinsics and intrinsics of this virtual camera.
	        self.ext_matrix = self.get_extrinsic_matrix(
	            self.camera_center_coords, self.camera_focus_coords
	        )
	        # 3 x 4 intrinsics; the principal point is the canvas center.
	        self.int_matrix = np.array(
	            [
	                [self.focal_length, 0, self.W // 2, 0],
	                [0, self.focal_length, self.H // 2, 0],
	                [0, 0, 1, 0],
	            ]
	        )

	        self.clear_canvas()

	    def get_canvas(self):
	        """Returns the current (H, W, 3) uint8 canvas image."""
	        return self.canvas

	    def clear_canvas(self):
	        """Resets the canvas to a solid image of canvas_bg_color."""
	        self.canvas = np.zeros((self.H, self.W, 3), dtype=np.uint8)
	        self.canvas[..., :] = self.canvas_bg_color

	    @staticmethod
	    def _resolve_colors(colors, count):
	        """
	        Normalizes a color specification to a (count, 3) uint8 array.

	        Args:
	            colors:
	                None: every row is white.
	                Tuple: RGB (0 ~ 255), repeated for every row.
	                ndarray: (count, 3) array of RGB values, cast to uint8.
	            count (Int): Number of items that need a color.
	        Raises:
	            TypeError: If colors is of any other type.
	        """
	        if colors is None:
	            return np.full((count, 3), fill_value=255, dtype=np.uint8)
	        if isinstance(colors, tuple):
	            assert len(colors) == 3
	            tiled = np.zeros((count, 3), dtype=np.uint8)
	            tiled[...] = np.array(colors)
	            return tiled
	        if isinstance(colors, np.ndarray):
	            assert len(colors) == count
	            return colors.astype(np.uint8)
	        raise TypeError(
	            "colors type {} was not an expected type".format(type(colors))
	        )

	    @staticmethod
	    def _cmap_colors(cmap_name, operand):
	        """
	        Maps per-point scalar values to RGB using a matplotlib colormap.

	        Args:
	            cmap_name (String): Name of a matplotlib cmap, e.g. "Spectral".
	            operand (ndarray): (N,) values; min-max normalized to 0 ~ 1
	                before the cmap is applied.
	        Returns:
	            (N, 3) uint8 array of RGB values.
	        """
	        # Local import so the cm submodule is guaranteed to be loaded for the
	        # get_cmap fallback below.
	        import matplotlib.cm

	        # Prefer the colormap registry; matplotlib.cm.get_cmap is not
	        # available in recent matplotlib releases.
	        registry = getattr(matplotlib, "colormaps", None)
	        if registry is not None:
	            cmap = registry[cmap_name]
	        else:
	            cmap = matplotlib.cm.get_cmap(cmap_name)

	        # Normalize 0 ~ 1 for cmap. Floats are required: a cmap treats
	        # integer input as lookup-table indices.
	        operand = np.asarray(operand, dtype=np.float64)
	        operand = operand - operand.min()
	        span = operand.max()
	        if span > 0:  # all-equal operands stay at 0 instead of becoming NaN
	            operand = operand / span

	        # cmap returns (*input_shape, 4), with colors scaled 0 ~ 1
	        return (cmap(operand)[:, :3] * 255).astype(np.uint8)

	    def get_canvas_coords(self, xyz, depth_min=0.1, return_depth=False):
	        """
	        Projects XYZ points onto the canvas and returns the projected canvas
	        coordinates.

	        Args:
	            xyz (ndarray): (N, 3+) array of coordinates. Additional columns
	                beyond the first three are ignored. The input is not modified.
	            depth_min (Float): Only points with a projected depth larger
	                than this value are "valid".
	            return_depth (Boolean): Whether to additionally return depth of
	                projected points.
	        Returns:
	            canvas_xy (ndarray): (N, 2) int32 array of projected canvas
	                coordinates. "x" is dim0, "y" is dim1 of canvas. Rows whose
	                valid_mask entry is False are not meaningful.
	            valid_mask (ndarray): (N,) boolean mask indicating which of
	                canvas_xy fits into canvas (are visible from virtual camera).
	            depth (ndarray): Optionally returned (N,) array of depth values
	        """
	        xyz = np.asarray(xyz)[:, :3]

	        ones = np.ones((xyz.shape[0], 1), dtype=np.float32)
	        xyz_hom = np.concatenate([xyz, ones], axis=1)
	        img_pts = (self.int_matrix @ self.ext_matrix @ xyz_hom.T).T

	        depth = img_pts[:, 2]

	        # Points at zero depth produce inf / NaN here; they are rejected by
	        # valid_mask below, so the floating point warnings are just noise.
	        with np.errstate(divide="ignore", invalid="ignore"):
	            xy = img_pts[:, :2] / depth[:, None]

	            # Flip X and Y so "x" is dim0, "y" is dim1 of canvas
	            row_col = xy.round()[:, ::-1]

	            # Bounds are checked on the float values, before the int cast, so
	            # that NaN / inf / out-of-int32-range projections can never be
	            # mistaken for on-canvas pixels.
	            valid_mask = (
	                (depth > depth_min)
	                & (row_col[:, 0] >= 0)
	                & (row_col[:, 0] < self.H)
	                & (row_col[:, 1] >= 0)
	                & (row_col[:, 1] < self.W)
	            )
	            xy_int = row_col.astype(np.int32)

	        if return_depth:
	            return xy_int, valid_mask, depth
	        return xy_int, valid_mask

	    def draw_canvas_points(
	        self, canvas_xy, radius=-1, colors=None, colors_operand=None
	    ):
	        """
	        Draws canvas_xy onto self.canvas.

	        Args:
	            canvas_xy (ndarray): (N, 2) array of valid canvas coordinates.
	                "x" is dim0, "y" is dim1 of canvas.
	            radius (Int):
	                -1: Each point is visualized as a single pixel.
	                r: Each point is visualized as a circle with radius r.
	            colors:
	                None: colors all points white.
	                Tuple: RGB (0 ~ 255), indicating a single color for all points.
	                ndarray: (N, 3) array of RGB values for each point.
	                String: Such as "Spectral", uses a matplotlib cmap, with the
	                    operand (the value cmap is called on for each point) being
	                    colors_operand.
	            colors_operand (ndarray): (N,) array of values corresponding to
	                canvas_xy, to be used only if colors is a cmap. Unlike
	                Canvas_BEV, cannot be None if colors is a String.
	        """
	        if len(canvas_xy) == 0:
	            return
	        canvas_xy = np.asarray(canvas_xy)

	        if isinstance(colors, str):
	            assert colors_operand is not None
	            colors = self._cmap_colors(colors, colors_operand)
	        else:
	            colors = self._resolve_colors(colors, len(canvas_xy))

	        if radius == -1:
	            self.canvas[canvas_xy[:, 0], canvas_xy[:, 1], :] = colors
	        else:
	            for color, (x, y) in zip(colors.tolist(), canvas_xy.tolist()):
	                # cv2 expects (column, row) ordering.
	                self.canvas = cv2.circle(
	                    self.canvas, (y, x), radius, color, -1, lineType=cv2.LINE_AA
	                )

	    def draw_lines(self, start_xyz, end_xyz, colors=(255, 255, 255), thickness=1):
	        """
	        Draws lines between provided 3D points.

	        A line is drawn only if both of its end points project onto the
	        canvas.

	        Args:
	            start_xyz (ndarray): Shape (N, 3) of 3D points to start from.
	            end_xyz (ndarray): Shape (N, 3) of 3D points to end at. Same length
	                as start_xyz.
	            colors:
	                None: colors all lines white.
	                Tuple: RGB (0 ~ 255), indicating a single color for all lines.
	                ndarray: (N, 3) array of RGB values for each line.
	            thickness (Int):
	                Thickness of drawn cv2 line.
	        Raises:
	            ValueError: If start_xyz and end_xyz differ in length.
	        """
	        start_xyz = np.asarray(start_xyz)
	        end_xyz = np.asarray(end_xyz)
	        if len(start_xyz) != len(end_xyz):
	            raise ValueError(
	                "start_xyz and end_xyz must have the same length, got "
	                "{} and {}".format(len(start_xyz), len(end_xyz))
	            )
	        if len(start_xyz) == 0:
	            return

	        colors = self._resolve_colors(colors, len(start_xyz))

	        start_pts_xy, start_pts_valid_mask = self.get_canvas_coords(start_xyz)
	        end_pts_xy, end_pts_valid_mask = self.get_canvas_coords(end_xyz)

	        drawable = start_pts_valid_mask & end_pts_valid_mask
	        for idx in np.flatnonzero(drawable):
	            # Canvas coords are (row, col); cv2 expects (col, row).
	            self.canvas = cv2.line(
	                self.canvas,
	                tuple(start_pts_xy[idx, ::-1].tolist()),
	                tuple(end_pts_xy[idx, ::-1].tolist()),
	                color=colors[idx].tolist(),
	                thickness=thickness,
	                lineType=cv2.LINE_AA,
	            )

	    @staticmethod
	    def _boxes_to_corners(boxes):
	        """
	        Converts (N, 7) bottom-center boxes to (N, 8, 3) corner coordinates.

	        Each row of boxes is (x, y, z, x_size, y_size, z_size, yaw).
	        """
	        boxes = np.asarray(boxes)
	        assert len(boxes.shape) == 2

	        dims = boxes[:, 3:6]
	        corners_norm = np.stack(np.unravel_index(np.arange(8), [2] * 3), axis=1)
	        # Reorder so consecutive corners within each group of four are
	        # adjacent, which is what _BOX_EDGES relies on.
	        corners_norm = corners_norm[[0, 1, 3, 2, 4, 5, 7, 6]]
	        # use relative origin [0.5, 0.5, 0], assuming bottom center
	        corners_norm = corners_norm - np.array([0.5, 0.5, 0])
	        corners = dims.reshape(-1, 1, 3) * corners_norm.reshape([1, 8, 3])

	        # rotate around z axis
	        angles = boxes[:, 6]
	        rot_sin = np.sin(angles)
	        rot_cos = np.cos(angles)
	        ones = np.ones_like(rot_cos)
	        zeros = np.zeros_like(rot_cos)
	        rot_mat_T = np.stack(
	            [
	                np.stack([rot_cos, -rot_sin, zeros]),
	                np.stack([rot_sin, rot_cos, zeros]),
	                np.stack([zeros, zeros, ones]),
	            ]
	        )
	        corners = np.einsum("aij,jka->aik", corners, rot_mat_T)
	        corners += boxes[:, :3].reshape(-1, 1, 3)  # N x 8 x 3
	        return corners

	    def draw_boxes(
	        self,
	        boxes=None,
	        corners=None,
	        colors=None,
	        texts=None,
	        depth_min=0.1,
	        draw_incomplete_boxes=True,
	        box_line_thickness=2,
	        box_text_size=0.5,
	        text_corner=1,
	    ):
	        """
	        Draws 3D boxes.

	        Args:
	            boxes (ndarray): Shape (N, 7), each row representing a box of
	                format (x, y, z, x_size, y_size, z_size, yaw). This function
	                assumes bottom center - the xyz center of the provided box
	                is the center of the bottom face of the 3D box, not the
	                floating true center of the 3D box.
	            corners (ndarray): Shape (N, 8, 3) of precomputed box corners.
	                Only used when boxes is None.
	            colors:
	                None: colors all boxes white.
	                Tuple: RGB (0 ~ 255), indicating a single color for all boxes.
	                ndarray: (N, 3) array of RGB values for each box.
	            texts (List[String]): Length N; text to write next to boxes.
	            depth_min (Float): Only box corners with a projected depth larger
	                than this value are drawn if draw_incomplete_boxes is True.
	            draw_incomplete_boxes (Boolean): If any boxes are incomplete,
	                meaning it has a corner that does not project onto the canvas,
	                decide whether to draw them at all.
	            box_line_thickness (int): cv2 line/text thickness
	            box_text_size (float): cv2 putText size
	            text_corner (int): 0 ~ 7. Which corner of 3D box to write text at.
	        Raises:
	            ValueError: If neither boxes nor corners is provided.
	        """
	        if boxes is None and corners is None:
	            raise ValueError("Either boxes or corners must be provided")

	        num_boxes = len(boxes) if boxes is not None else len(corners)
	        if num_boxes == 0:
	            return

	        colors = self._resolve_colors(colors, num_boxes)

	        if boxes is not None:
	            corners = self._boxes_to_corners(boxes)
	        else:
	            corners = np.asarray(corners)

	        # Now we have corners. Need them on the canvas 2D space.
	        corners_xy, valid_mask = self.get_canvas_coords(
	            corners.reshape(-1, 3), depth_min=depth_min
	        )
	        corners_xy = corners_xy.reshape(-1, 8, 2)
	        valid_mask = valid_mask.reshape(-1, 8)

	        # Now draw them with lines in correct places
	        for i, (color, curr_corners_xy, curr_valid_mask) in enumerate(
	            zip(colors.tolist(), corners_xy.tolist(), valid_mask.tolist())
	        ):
	            if not draw_incomplete_boxes and not all(curr_valid_mask):
	                # Some corner is invalid, don't draw the box at all.
	                continue

	            for start, end in self._BOX_EDGES:
	                if not (curr_valid_mask[start] and curr_valid_mask[end]):
	                    continue  # start or end is not valid

	                # Canvas coords are (row, col); cv2 expects (col, row).
	                self.canvas = cv2.line(
	                    self.canvas,
	                    (curr_corners_xy[start][1], curr_corners_xy[start][0]),
	                    (curr_corners_xy[end][1], curr_corners_xy[end][0]),
	                    color=color,
	                    thickness=box_line_thickness,
	                    lineType=cv2.LINE_AA,
	                )

	            # Label the box as soon as at least one of its corners is valid.
	            if texts is not None and any(curr_valid_mask):
	                self.canvas = cv2.putText(
	                    self.canvas,
	                    str(texts[i]),
	                    (
	                        curr_corners_xy[text_corner][1],
	                        curr_corners_xy[text_corner][0],
	                    ),
	                    cv2.FONT_HERSHEY_SIMPLEX,
	                    box_text_size,
	                    color,
	                    thickness=box_line_thickness,
	                )

	    @staticmethod
	    def cart2sph(xyz):
	        """
	        Converts (N, 3) cartesian vectors to spherical components.

	        Returns:
	            az (ndarray): (N,) negated arctan2(y, x).
	            el (ndarray): (N,) arcsin(z / depth).
	            depth (ndarray): (N,) euclidean norm of each row.
	        """
	        x, y, z = xyz[:, 0], xyz[:, 1], xyz[:, 2]

	        depth = np.linalg.norm(xyz, 2, axis=1)
	        az = -np.arctan2(y, x)
	        el = np.arcsin(z / depth)
	        return az, el, depth

	    @staticmethod
	    def get_extrinsic_matrix(
	        camera_center_coords,
	        camera_focus_coords,
	    ):
	        """
	        Builds the 4 x 4 world -> camera matrix of the virtual camera.

	        Args:
	            camera_center_coords: (x, y, z) of where camera should be located
	                in 3D space.
	            camera_focus_coords: (x, y, z) of where camera should look at from
	                camera_center_coords

	        Thoughts:
	            Remember that in camera coordinates, pos x is right, pos y is up,
	            pos z is forward.
	        """
	        center_x, center_y, center_z = camera_center_coords
	        focus_x, focus_y, focus_z = camera_focus_coords
	        az, el, _ = Canvas_3D.cart2sph(
	            np.array([[focus_x - center_x, focus_y - center_y, focus_z - center_z]])
	        )
	        # cart2sph returns length-1 arrays; index them explicitly, since
	        # float() on a non-0-d array is deprecated in NumPy.
	        az = float(az[0])
	        el = float(el[0])

	        ### First, construct extrinsics
	        ## Rotation matrix

	        z_rot = np.array(
	            [[np.cos(az), -np.sin(az), 0], [np.sin(az), np.cos(az), 0], [0, 0, 1]]
	        )

	        # el is rotation around y axis.
	        y_rot = np.array(
	            [
	                [np.cos(-el), 0, -np.sin(-el)],
	                [0, 1, 0],
	                [np.sin(-el), 0, np.cos(-el)],
	            ]
	        )

	        ## Now, how the z_rot and y_rot work (spherical coordinates), is it
	        ## computes rotations starting from the positive x axis and rotates
	        ## positive x axis to the desired direction. The desired direction is
	        ## the "looking direction" of the camera, which should actually be the
	        ## z-axis. So should convert the points so that the x axis is the new z
	        ## axis, and after the transformations.
	        ## Why x -> z for points? If we think about rotating the camera, z
	        ## should become x, so reverse when moving points.
	        last_rot = np.array([[0, -1, 0], [0, 0, -1], [1, 0, 0]])  # x -> z

	        # Put them together. Order matters. Make it hom.
	        rot_matrix = np.eye(4, dtype=np.float32)
	        rot_matrix[:3, :3] = last_rot @ y_rot @ z_rot

	        ## Translation matrix
	        trans_matrix = np.array(
	            [
	                [1, 0, 0, -center_x],
	                [0, 1, 0, -center_y],
	                [0, 0, 1, -center_z],
	                [0, 0, 0, 1],
	            ]
	        )

	        ## Finally, extrinsics matrix. Order matters - do trans then rot
	        return rot_matrix @ trans_matrix