# unknownuser6666's picture
# Upload folder using huggingface_hub
# 663494c verified
from typing import Dict, List, Optional, Tuple, Union
import cv2
import utils.transform as box_transform
import utils.calibration as calib_utils
import utils.bev as bev_vis
import utils.canvas_3d as vis_3d
import utils.color as color_vis
import matplotlib.pyplot as plt
plt.switch_backend('agg')
import numpy as np
import scipy
from PIL import Image
from pathlib import Path
import os
def get_color_object(obj_id: int, color_list: List) -> np.ndarray:
    """Pick a deterministic per-object color for visualization.

    The color is chosen from ``color_list`` by ``obj_id`` modulo the list
    length, so the same object ID always maps to the same color.

    Args:
        obj_id: integer object/tracklet ID.
        color_list: list of (r, g, b) float tuples with channels in [0, 1].

    Returns:
        np.ndarray of shape (3,) with integer RGB channels in [0, 255].
        (Return annotation fixed: ``np.array`` is a function, not a type.)
    """
    color_float: Tuple[float, float, float] = color_list[obj_id % len(color_list)]
    # scale each float channel from [0, 1] to [0, 255], truncating like int()
    return np.array([int(channel * 255) for channel in color_float[:3]])
def vis_box_on_lidar(
    lidar: Union[str, np.ndarray],
    save_path: str,
    bbox_det_in_ego_list: Optional[List[np.ndarray]] = None,
    bbox_gt_in_ego_list: Optional[List[np.ndarray]] = None,
    id_list: Optional[List[int]] = None,
    state_list: Optional[List[np.ndarray]] = None,
    fut_traj: Optional[List[np.ndarray]] = None,  # xy coordinate
    fut_traj_mask: Optional[List[np.ndarray]] = None,
    pre_traj: Optional[List[np.ndarray]] = None,
    pre_traj_mask: Optional[List[np.ndarray]] = None,
    ego2lidar: Optional[np.ndarray] = None,
    bev: bool = True,
    box_order_nuscenes: bool = False,
    left_hand: bool = True,  # carla
    vis_text: bool = True,
    command: Optional[int] = 2,
    # NOTE(review): mutable default argument; read-only here, but consider
    # replacing with None + an in-function default to be safe.
    command_dict: Optional[Dict[int, str]] = {0: 'TURN RIGHT', 1: 'TURN LEFT', 2: 'KEEP FORWARD'},
    bev_map: Optional[np.ndarray] = None,  # H x W x 3
) -> None:
    """Visualize detection/GT boxes on the LiDAR point cloud and save to disk.

    Renders the point cloud (BEV or 3D canvas), optionally overlays detection
    boxes, ground-truth boxes, per-object ID/state text, past/future
    trajectory points, a driving-command caption, and an optional BEV map
    blended on top of the saved image.

    Args:
        lidar: str -> path to the data (raw float32 XYZI binary),
               np array -> N x 3 data already loaded
        save_path: output image path; parent directories are created.
        bbox_det_in_ego_list / bbox_gt_in_ego_list: per-object 8-corner boxes
            in ego coordinates (8 x 4 homogeneous, per the helper comments).
        id_list: object IDs used for per-object colors and text labels.
        state_list: a list of array including velocity/acceleration/angular_velocity
        fut_traj: N x 12 x 4 or N, 12 x 4
        past_traj: N x 8 x 2 or N, 8 x 2
        ego2lidar: ego-to-lidar transform forwarded to box conversion.
        bev: True -> 2D bird's-eye-view canvas, False -> 3D canvas.
        box_order_nuscenes: use the nuScenes corner ordering for BEV corners.
        left_hand: flip horizontally (carla's left-handed convention).
        vis_text: draw ID/state text next to boxes.
        command / command_dict: driving command index and its caption text.
        bev_map: optional H x W x 3 (or H x W) map, blended into the output.

    Note that carla lidar coordinate is
    +x -> left
    +y -> front
    +z -> up

    NOTE(review): per-object colors are only built when id_list is given AND
    at least one of det/GT lists is missing; if BOTH lists are passed,
    ``colors`` stays None and the trajectory branches below would fail on
    ``colors[obj_index]`` — confirm intended call patterns.
    NOTE(review): ``height_all_lidar`` is only defined when a det or GT list
    is present; 3D trajectory visualization without boxes would raise
    NameError — presumably never called that way; verify.
    """
    # load lidar
    if isinstance(lidar, str):
        # try:
        #     lidar = np.load(lidar, allow_pickle=True)[..., :3]  # XYZI, N x 3 now
        # except:
        # raw binary assumed to be float32 XYZI records
        lidar = np.fromfile(lidar, dtype=np.float32)
        lidar = lidar.reshape(-1, 4)  # N x 4
        lidar = lidar[:, :3]  # N x 3 now
    else:
        assert isinstance(lidar, np.ndarray), "the detection is either str or dict"

    # pre-load color for each object when visualizing tracklets
    # only when id_list is provided and visualizing either GT/tracklets
    if id_list is not None and (
        bbox_det_in_ego_list is None or bbox_gt_in_ego_list is None
    ):
        # get the list of colors to choose for each tracklet/prediction
        color_list: List[Tuple[float, float, float]] = color_vis.random_colors()
        if bbox_gt_in_ego_list is None:
            num_obj = len(bbox_det_in_ego_list)
        else:
            num_obj = len(bbox_gt_in_ego_list)
        colors = np.zeros((num_obj, 3), dtype=np.uint8)  # N x 3
        assert len(id_list) == num_obj, "number of objects is wrong"
        for obj_index, obj_id in enumerate(id_list):
            color: np.ndarray = get_color_object(obj_id, color_list)  # (3, )
            colors[obj_index, :] = color
    else:
        colors = None

    # convert the ID_list to list of strings to visualize
    # only if id_list is provided
    text_corner = 1
    if id_list is not None and vis_text:
        texts = [str(obj_id) for obj_id in id_list]
        # add the list of states to the text
        if state_list is not None:
            for index in range(len(state_list)):
                states: Union[np.ndarray, List] = state_list[index]
                state_str: str = " ".join(["%.2f" % state for state in states])
                texts[index] = texts[index] + " " + state_str
    else:
        texts = None

    # visualize lidar points only, default color ORANGE
    if bev:
        canvas = bev_vis.Canvas_BEV()
        canvas_xy, valid_mask = canvas.get_canvas_coords(lidar)  # Get Canvas coords
        canvas.draw_canvas_points(canvas_xy[valid_mask])  # Only draw valid points
    else:  # 3D
        canvas = vis_3d.Canvas_3D()
        canvas_xyz, valid_mask = canvas.get_canvas_coords(lidar)  # Get Canvas coords
        # grayscale each point by its last channel as intensity
        # NOTE(review): lidar was reduced to N x 3 (xyz) above when loaded
        # from file, so "-1" is the z column there, not intensity — confirm.
        color_based_on_intensity = (
            (lidar[valid_mask, -1] * 255).astype("uint8").reshape((-1, 1))
        )  # N x 1
        color_based_on_intensity = np.repeat(
            color_based_on_intensity, 3, axis=1
        )  # N x 3
        canvas.draw_canvas_points(
            canvas_xyz[valid_mask], colors=color_based_on_intensity
        )  # Only draw valid points

    # extract height from the bbox (used to lift 2D trajectories in 3D view)
    if (bbox_det_in_ego_list is not None) or (bbox_gt_in_ego_list is not None):
        if bbox_det_in_ego_list is not None:
            num_obj = len(bbox_det_in_ego_list)
        else:
            num_obj = len(bbox_gt_in_ego_list)
        height_all_lidar = np.zeros((num_obj), dtype='float32')

    # visualize detection bbox on lidar, default color WHITE
    if bbox_det_in_ego_list is not None:
        bbox_det_in_lidar_list: List[np.ndarray] = list()
        count = 0
        box_in_ego: np.ndarray
        for box_in_ego in bbox_det_in_ego_list:
            # convert box in ego to lidar coordinate
            box_in_lidar: np.ndarray = box_transform.box_in_ego_to_lidar(
                box_in_ego,
                ego2lidar=ego2lidar,
            )  # 8 x 4
            # record box-center height for trajectory lifting later
            height_all_lidar[count] = np.average(box_in_lidar, axis=0)[2]
            if bev:
                if box_order_nuscenes:
                    box_in_lidar = box_in_lidar[
                        [1, 2, 6, 5], :2
                    ]  # 4 x 2, nuScenes boxinstances
                else:
                    box_in_lidar = box_in_lidar[:4, :2]  # 4 x 2, take only BEV corners
            else:
                box_in_lidar = box_in_lidar[:, :3]  # 8 x 3, take only xyz
            bbox_det_in_lidar_list.append(np.array(box_in_lidar))
            count += 1
        if len(bbox_det_in_lidar_list) > 0:
            bbox_det_in_lidar = np.stack(bbox_det_in_lidar_list, axis=0)  # N x 4 x 2
            if colors is None:
                # default: yellow (R and G channels at 255)
                colors_det = np.full(
                    (len(bbox_det_in_lidar), 3), fill_value=0, dtype=np.uint8
                )
                colors_det[:, :2] = 255  # (N x 3)
            else:
                colors_det = colors
            canvas.draw_boxes(
                corners=bbox_det_in_lidar,
                colors=colors_det,
                texts=texts,
                text_corner=text_corner,
            )  # Draw Boxes

    # visualize GT bbox on lidar, default color BLUE
    if bbox_gt_in_ego_list is not None:
        bbox_gt_in_lidar_list: List[np.ndarray] = list()
        box_in_ego: np.ndarray
        count = 0
        for box_in_ego in bbox_gt_in_ego_list:
            # convert box in ego to lidar coordinate
            box_in_lidar: np.ndarray = box_transform.box_in_ego_to_lidar(
                box_in_ego,
                ego2lidar=ego2lidar,
            )  # 8 x 4
            # NOTE(review): overwrites the det heights written above when both
            # lists are given — confirm GT heights are the intended source.
            height_all_lidar[count] = np.average(box_in_lidar, axis=0)[2]
            # convert to BEV
            if bev:
                if box_order_nuscenes:
                    box_in_lidar = box_in_lidar[
                        [1, 2, 6, 5], :2
                    ]  # 4 x 2, nuScenes boxinstances
                else:
                    box_in_lidar = box_in_lidar[:4, :2]  # 4 x 2, take only BEV corners
                    # box_in_lidar = box_in_lidar[[0, 3, 4, 7], :2]  # 4 x 2, take left side corners
                    # box_in_lidar = box_in_lidar[[0, 1, 4, 5], :2]  # 4 x 2, take front side corners
            else:
                box_in_lidar = box_in_lidar[:, :3]
            # if count >= 10 and count < 13:
            #     print("box_in_lidar", box_in_lidar)
            bbox_gt_in_lidar_list.append(np.array(box_in_lidar))
            count += 1
        if len(bbox_gt_in_lidar_list) > 0:
            bbox_gt_in_lidar = np.stack(bbox_gt_in_lidar_list, axis=0)  # N x 4 x 2
            if colors is None:
                # default: blue (B channel at 255)
                colors_gt = np.full(
                    (len(bbox_gt_in_lidar), 3), fill_value=0, dtype=np.uint8
                )
                colors_gt[:, 2] = 255  # N x 3
            else:
                colors_gt = colors
            canvas.draw_boxes(
                corners=bbox_gt_in_lidar,
                colors=colors_gt,
                texts=texts,
                text_corner=text_corner,
            )  # Draw Boxes

    # draw points for past/future trajectories in lidar coordinate
    if fut_traj is not None:
        fut_traj_obj: np.ndarray  # F x 4
        obj_index = 0
        for fut_traj_obj in fut_traj:
            # add height to the trajectory in the 3D vis cases
            if fut_traj_obj.shape[1] == 2 and not bev:
                fut_traj_obj_addh = np.concatenate([fut_traj_obj, np.zeros((fut_traj_obj.shape[0], 1))], axis=1)
                fut_traj_obj_addh[:, -1] = height_all_lidar[obj_index]
                fut_traj_obj = fut_traj_obj_addh
            # Get Canvas coords and mask within the visualization range
            canvas_xy, valid_mask = canvas.get_canvas_coords(
                fut_traj_obj
            )  # canvas_xy: N x 2, valid_mask: N
            valid_mask = valid_mask.astype("bool")
            # get valid mask for every timestamp
            fut_traj_mask_obj: np.ndarray = fut_traj_mask[obj_index, :, 0].astype(
                "bool"
            )  # N
            mask_combined = fut_traj_mask_obj & valid_mask
            # visualize
            canvas.draw_canvas_points(
                canvas_xy[mask_combined], colors=tuple(colors[obj_index]), radius=2
            )  # Only draw valid points
            obj_index += 1

    if pre_traj is not None:
        pre_traj_obj: np.ndarray  # F x 4
        obj_index = 0
        for pre_traj_obj in pre_traj:
            # add height to the trajectory in the 3D vis cases
            if pre_traj_obj.shape[1] == 2 and not bev:
                pre_traj_obj_addh = np.concatenate([pre_traj_obj, np.zeros((pre_traj_obj.shape[0], 1))], axis=1)
                pre_traj_obj_addh[:, -1] = height_all_lidar[obj_index]
                pre_traj_obj = pre_traj_obj_addh
            canvas_xy, valid_mask = canvas.get_canvas_coords(
                pre_traj_obj
            )  # Get Canvas coords
            valid_mask = valid_mask.astype("bool")
            # get valid mask for every timestamp
            pre_traj_mask_obj: np.ndarray = pre_traj_mask[obj_index, :, 0].astype(
                "bool"
            )  # N
            mask_combined = pre_traj_mask_obj & valid_mask
            canvas.draw_canvas_points(
                canvas_xy[mask_combined], colors=tuple(colors[obj_index]), radius=2
            )  # Only draw valid points
            obj_index += 1

    # rotate to make the view consistent with the image
    # now +x -> left (ego), +y -> front (ego)
    if bev:
        canvas.canvas = np.flip(canvas.canvas, axis=(0))
    # now +x -> right (ego), +y -> front (ego)
    if left_hand:
        canvas.canvas = np.flip(canvas.canvas, axis=(1))
    # now +x -> right (ego), +y -> back (ego)

    # draw figure
    plt.figure(figsize=(20, 20))
    plt.axis("off")
    plt.imshow(canvas.canvas)
    plt.tight_layout()
    # add text for commands
    plt.text(30, 50, command_dict[int(command)], fontsize=45, color=(1, 1, 1))

    # save figure (create parent directories if needed)
    save_dir = Path(save_path).resolve().parent
    if not os.path.exists(save_dir):
        os.makedirs(save_dir)
    plt.savefig(save_path, transparent=False)
    plt.close()

    # overlay visualization with map
    if bev_map is not None and bev:
        # re-read the just-saved figure so map and figure share resolution
        traj_vis = cv2.imread(save_path)
        # convert the bev map to match with the higher-resolution visualization image
        bev_map = cv2.resize(bev_map, traj_vis.shape[1::-1])  # 2000 x 2000
        bev_map = (bev_map * 255).astype('uint8')
        # make up the third dimension if only one channel is given
        if len(bev_map.shape) == 2:
            bev_map = np.expand_dims(bev_map, axis=-1)  # 2000 x 2000 x 1
            bev_map = np.repeat(bev_map, 3, axis=-1)  # 2000 x 2000 x 3
        # synchronize with the lidar visualization (same flips as above)
        if bev:
            bev_map = np.flip(bev_map, axis=0)  # H x W x 3
        if left_hand:
            bev_map = np.flip(bev_map, axis=1)  # H x W x 3
        # blend & save
        dst = cv2.addWeighted(traj_vis, 0.7, bev_map, 0.3, 0)
        cv2.imwrite(save_path, dst)
def vis_box_on_camera(
    cameras: Dict[str, np.ndarray],
    save_path: str,
    cam_param_all: Dict[str, Dict],
    bbox_det_in_ego_list: Optional[List[np.ndarray]] = None,
    bbox_gt_in_ego_list: Optional[List[np.ndarray]] = None,
    left_hand_system: bool = True,
) -> None:
    """Visualize detection/GT boxes on the multiple cameras and save one image.

    Each ego-frame box is transformed to every camera's frame, projected to
    2D, and drawn on that camera's image; all camera images are then
    concatenated horizontally and saved.

    Args:
        camera: keys can be ["left", "front", "right", "back"]
                values are H x W x 3 (BGR; converted to RGB before saving)
        save_path: output image path; parent directories are created.
        cam_param_all: per-camera parameter dicts; must contain "height" and
            "width", and either "intrinsics" or enough fields for
            calib_utils.get_camera_intrinsics to build them.
        bbox_det_in_ego_list / bbox_gt_in_ego_list: 8-corner boxes in ego frame.
        left_hand_system: forwarded to the projection helper (carla convention).
    """
    # process each camera
    cam_name: str
    cam_param: Dict[str, float]
    for cam_name, cam_param in cam_param_all.items():
        # if we already have ego2cam for visualization, no need to construct the transform
        if "intrinsics" not in cam_param:
            # build a 4-dim intrinsics matrix from the raw camera parameters
            intrinsics: np.ndarray = calib_utils.get_camera_intrinsics(cam_param, dim=4)
        else:
            intrinsics: np.ndarray = cam_param["intrinsics"]

        # visualize each box for detection, default color ORANGE
        if bbox_det_in_ego_list is not None:
            box_in_ego: np.ndarray
            for box_in_ego in bbox_det_in_ego_list:
                # first convert to the camera coordinate
                # and then 3D -> 2D projection to the image coordinate
                box_in_camera: np.ndarray = box_transform.box_in_ego_to_camera(
                    box_in_ego, cam_param
                )  # 8 x 4
                # camera projection
                box_2d_in_image: np.ndarray = box_transform.box_projection_to_image(
                    box_in_camera,
                    intrinsics,
                    left_hand_system=left_hand_system,
                )  # 8 x 2
                # check if box is in front of the camera for visualization
                if box_2d_in_image is not None:
                    cameras[cam_name], _ = vis_box_on_single_image(
                        cameras[cam_name],
                        box_2d_in_image,
                        img_size=(cam_param["height"], cam_param["width"]),
                        color=(255, 255, 0),
                        thickness=2,
                    )

        # visualize each box for GT, default color BLUE
        if bbox_gt_in_ego_list is not None:
            box_in_ego: np.ndarray
            for box_in_ego in bbox_gt_in_ego_list:
                # first convert to the camera coordinate
                # and then 3D -> 2D projection to the image coordinate
                box_in_camera: np.ndarray = box_transform.box_in_ego_to_camera(
                    box_in_ego, cam_param
                )  # 8 x 4
                # camera projection
                box_2d_in_image: np.ndarray = box_transform.box_projection_to_image(
                    box_in_camera,
                    intrinsics,
                    left_hand_system=left_hand_system,
                )  # 8 x 2
                # check if box is in front of the camera for visualization
                if box_2d_in_image is not None:
                    cameras[cam_name], _ = vis_box_on_single_image(
                        cameras[cam_name],
                        box_2d_in_image,
                        img_size=(cam_param["height"], cam_param["width"]),
                        color=(0, 0, 255),
                        thickness=2,
                    )

    # visualize all images together
    # TODO (Xinshuo): remove this assumption
    # assume all cameras have the same width and height
    # NOTE(review): cam_param below is the loop variable left over from the
    # last camera — correct only under the same-size assumption above.
    image = np.concatenate(list(cameras.values()), axis=1)  # H x 3W x 3
    image = image[:, :, ::-1]  # convert bgr to rgb
    image = Image.fromarray(image)
    image = image.resize(
        (cam_param["width"] * len(cameras.keys()), cam_param["height"])
    )
    save_dir = Path(save_path).resolve().parent
    if not os.path.exists(save_dir):
        os.makedirs(save_dir)
    image.save(save_path)
def check_outside_image(x, y, height, width):
    """Return True if pixel (x, y) lies outside a height x width image.

    Args:
        x: column coordinate (valid range [0, width)).
        y: row coordinate (valid range [0, height)).
        height: image height in pixels.
        width: image width in pixels.

    Returns:
        bool: True when outside. The original fell through and implicitly
        returned None for in-bounds points; an explicit False is returned
        instead (both falsy, so truthiness-based callers are unaffected).
    """
    if x < 0 or x >= width:
        return True
    if y < 0 or y >= height:
        return True
    return False
def vis_box_on_single_image(
    image, qs, img_size=(900, 1600), color=(255, 255, 255), thickness=4
):
    """Draw a 3D bounding box (12 edges) on a single image.

    qs: (8,2) array of vertices for the 3d box in following order:
        1 -------- 0
       /|         /|
      2 -------- 3 .
      | |        | |
      . 5 -------- 4
      |/         |/
      6 -------- 7

    Args:
        image: image to draw on (modified in place by cv2.line).
        qs: (8, 2) corner pixel coordinates, or None.
        img_size: (height, width) used for the visibility test.
        color: BGR line color.
        thickness: line thickness in pixels.

    Returns:
        (image, drawn): drawn is False when the box was skipped (no corners,
        or mostly outside the image), True after drawing.
    """
    # bug fix: the original checked ``qs is not None`` only AFTER indexing
    # qs in the visibility loop, so the guard could never trigger; check first
    if qs is None:
        return image, False
    # if 6 points of the box are outside the image, then do not draw
    height, width = img_size
    pts_outside = 0
    for index in range(8):
        x, y = qs[index, 0], qs[index, 1]
        if x < 0 or x >= width or y < 0 or y >= height:
            pts_outside += 1
    if pts_outside >= 6:
        return image, False
    # actually draw: top face, bottom face, then the vertical pillar per corner
    qs = qs.astype(np.int32)
    for k in range(0, 4):
        # top-face edge k -> (k+1) mod 4
        i, j = k, (k + 1) % 4
        cv2.line(
            image,
            (qs[i, 0], qs[i, 1]),
            (qs[j, 0], qs[j, 1]),
            color,
            thickness,
            cv2.LINE_AA,
        )  # use LINE_AA for opencv3
        # bottom-face edge k+4 -> (k+1) mod 4 + 4
        i, j = k + 4, (k + 1) % 4 + 4
        cv2.line(
            image,
            (qs[i, 0], qs[i, 1]),
            (qs[j, 0], qs[j, 1]),
            color,
            thickness,
            cv2.LINE_AA,
        )
        # vertical pillar k -> k+4
        i, j = k, k + 4
        cv2.line(
            image,
            (qs[i, 0], qs[i, 1]),
            (qs[j, 0], qs[j, 1]),
            color,
            thickness,
            cv2.LINE_AA,
        )
    return image, True