R3PM-Net / tools /metrics.py
YasiiKB's picture
initial commit
97aa5af verified
import open3d as o3d
import torch
import numpy as np
import matplotlib.pyplot as plt
from math import atan2
from scipy.spatial.transform import Rotation as R
import warnings
def get_rotaion(est):
# Extract the rotation matrices
try:
estimated_rotation = est[:3, :3]
except TypeError:
try:
estimation_transformation = est.transformation # for open3d
except AttributeError:
try:
estimation_transformation = est.rot # for Probreg
except: # for learning 3d
detached_est = est['est_T'].detach().cpu().numpy()[0]
estimation_transformation = detached_est.reshape(4,4)
estimated_rotation = estimation_transformation[:3, :3]
return estimated_rotation
def get_translation(est):
# Extract the translation vectors
try:
estimated_translation = est[:3, 3]
except TypeError:
try:
estimated_translation = est.t # for Probreg
except AttributeError:
try:
estimation_transformation = est.transformation # for open3d
except: # for learning 3d
detached_est = est['est_T'].detach().cpu().numpy()[0]
estimation_transformation = detached_est.reshape(4,4)
estimated_translation = estimation_transformation[:3, 3]
return estimated_translation
def compute_rmse(result, target, corres):
'''
This function computes the root-mean-square error (RMSE) between the (transforemed) source and target point clouds based on the correspondences.
Based on C++ code in Open3D https://github.com/isl-org/Open3D/blob/c8856fc0d4ec89f8d53591db245fd29ad946f9cb/cpp/open3d/pipelines/registration/TransformationEstimation.cpp#L20
args:
result (point cloud data): the transformed point cloud
target (point cloud data): the target point cloud
corres (Vector2iVector): the point-to-point correspondences between the source and target point clouds
returns:
rmse: the root-mean-square error (centimeters or meters based on the source and target point clouds)
'''
err = 0.0
for c in corres:
diff = np.asarray(result.points)[c[0]] - np.asarray(target.points)[c[1]] # Euclidean distance
err += np.sum(diff**2) # sum of squared distances
rmse = np.sqrt(err / len(corres))
return rmse
def rotation_error(gt_transformation, est):
'''
This function computes the rotation error as the Geodesic distance between the estimated and the ground truth rotation matrices in 3D space.
Based on formula on this page http://www.boris-belousov.net/2016/12/01/quat-dist/
args:
gt_transformation: the ground truth transformation (rotation matrix will be extracted from this)
est: the estimated transformation (rotation matrix will be extracted from this)
returns:
rotation_error_deg: the rotation error (degrees)
'''
estimated_rotation = get_rotaion(est)
ground_truth_rotation = gt_transformation[:3, :3]
# Compute the angular distance between the two rotation matrices
R = np.dot(ground_truth_rotation, estimated_rotation.T) # Compute the relative rotation matrix (np.matmul(gt.T, est))
trace = np.trace(R)
normalized_trace = min(max(((trace - 1) / 2), -1.0), 1.0) # Normalize and clamp the trace to avoid numerical errors
theta = np.arccos(normalized_trace)
rotation_error = abs(theta)
rotation_error_deg = np.rad2deg(rotation_error) # Convert to degrees
return rotation_error_deg
def translation_error(gt_transformation, est):
'''
This function computes the translation error as the Euclidean distance between Ground Truth & Estimated translation.
Based on definitions in this paper https://arxiv.org/pdf/2103.02690
args:
gt_transformation: the ground truth transformation (translation vector will be extracted from this)
est: the estimated transformation (translation vector will be extracted from this)
returns:
abs(translation_error): the absolute translation error (centimeters)
'''
estimated_translation = get_translation(est)
ground_truth_translation = gt_transformation[:3, 3]
# Compute the translation error
translation_error = np.linalg.norm(estimated_translation - ground_truth_translation)
return abs(translation_error)
def residual_error(cloud1: o3d.geometry.PointCloud, cloud2: o3d.geometry.PointCloud) -> float:
'''
This metric combines the rotation and translation errors so that different approaches can be compared.
It uses root mean squared distance between homologous points of the source point cloud, after the execution of an algorithm, and the same point cloud at the ground truth pose.
Based on papers:
https://www.sciencedirect.com/science/article/pii/S0921889021000191?via=ihub (3.3. Error metric) (main paper) -> https://github.com/iralabdisco/point_clouds_registration_benchmark/tree/master
https://link.springer.com/article/10.1007/s11370-024-00562-1 [14]
'''
if len(cloud1.points) != len(cloud2.points):
if len(cloud1.points) > len(cloud2.points):
cloud1.points = cloud1.points[:len(cloud2.points)]
else:
cloud2.points = cloud2.points[:len(cloud1.points)]
assert len(cloud1.points) == len(cloud2.points), "len(cloud1.points) != len(cloud2.points)"
centroid, _ = cloud1.compute_mean_and_covariance()
weights = np.linalg.norm(np.asarray(cloud1.points) - centroid, 2, axis=1)
distances = np.linalg.norm(np.asarray(cloud1.points) - np.asarray(cloud2.points), 2, axis=1)/len(weights)
return np.sum(distances/weights)
def chamfer_distance(pcd1, pcd2):
'''
Computes the Chamfer Distance between two point clouds using Open3D and PyTorch.
The Chamfer Distance is a metric that measures the similarity between two point clouds.
It is calculated as the sum of the mean squared distances from each point in one point cloud
to its nearest neighbor in the other point cloud, in both directions.
Args:
pcd1 (o3d.geometry.PointCloud): The first point cloud.
pcd2 (o3d.geometry.PointCloud): The second point cloud.
Returns:
chamfer_distance (float): The Chamfer distance between the two point clouds.
'''
dist1 = pcd1.compute_point_cloud_distance(pcd2)
dist2 = pcd2.compute_point_cloud_distance(pcd1)
dist1 = torch.tensor(np.asarray(dist1), dtype=torch.float32)
dist2 = torch.tensor(np.asarray(dist2), dtype=torch.float32)
chamfer_distance = torch.mean(dist1) + torch.mean(dist2)
chamfer_distance = chamfer_distance.item()
return chamfer_distance
def all_evaluations(source, target, result, time, gt_transformation = None, est_transformation = None, corres = None):
cd = chamfer_distance(result, target)
error = residual_error(target, result)
computation_time = time
max_treshold = 0.5
inlier_rmse = o3d.pipelines.registration.evaluate_registration(result, target, max_treshold, np.eye(4)).inlier_rmse
fitness = o3d.pipelines.registration.evaluate_registration(result, target, max_treshold, np.eye(4)).fitness
if gt_transformation is not None:
rmse = 1
rotation_err = rotation_error(gt_transformation, est_transformation)
translation_err = translation_error(gt_transformation, est_transformation)
return rmse, rotation_err, translation_err, computation_time, cd, error, fitness, inlier_rmse #8
else:
return cd, fitness, inlier_rmse, computation_time #4
def summerize_results(results: np.ndarray) -> dict:
if results.shape[2] == 8:
mean_rmse = np.round(np.mean(results[:, :, 0]), 4)
mean_rotation_error = np.round(np.mean(results[:, :, 1]), 4)
mean_translation_error = np.round(np.mean(results[:, :, 2]), 4)
mean_computation_time = np.round(np.mean(results[:, :, 3]), 4)
mean_cd = np.round(np.mean(results[:, :, 4]), 4)
mean_error = np.round(np.mean(results[:, :, 5]), 4)
mean_fitness = np.round(np.mean(results[:, :, 6]), 4)
mean_inlier_rmse = np.round(np.mean(results[:, :, 7]), 4)
return {
'mean_rmse': mean_rmse,
'mean_rotation_error': mean_rotation_error,
'mean_translation_error': mean_translation_error,
'mean_computation_time': mean_computation_time,
'mean_cd': mean_cd,
'mean_error': mean_error,
'mean_fitness': mean_fitness,
'mean_inlier_rmse': mean_inlier_rmse
}
elif results.shape[2] == 5:
mean_cd = np.round(np.mean(results[:, :, 0]), 4)
mean_error = np.round(np.mean(results[:, :, 1]), 4)
mean_fitness = np.round(np.mean(results[:, :, 2]), 4)
mean_inlier_rmse = np.round(np.mean(results[:, :, 3]), 4)
mean_computation_time = np.round(np.mean(results[:, :, 4]), 4)
return {
'mean_cd': mean_cd,
'mean_error': mean_error,
'mean_fitness': mean_fitness,
'mean_inlier_rmse': mean_inlier_rmse,
'mean_computation_time': mean_computation_time
}
else:
raise ValueError('Invalid results shape. Expected shape (N, M, 8) or (N, M, 5).')
def inlier_ratio(pcd, all_errors, threshold = 5):
'''
This function calculates the inlier ratio based on a given threshold.
args:
pcd (point cloud data): the point cloud
all_errors (list): the errors between the two point clouds (from error_histogram)
threshold (float): the threshold for inliers
returns:
inlier_ratio (float): the ratio of inliers (set at 5 cm)
'''
inliers = []
for error in all_errors:
# if the error is below the threshold, the pair is an inlier
if error < threshold:
inliers.append(error)
inlier_ratio = len(inliers) / len(pcd.points)
return inlier_ratio
def calculate_snr(clean_pcd, noisy_pcd):
'''
This function calculates the signal-to-noise ratio (SNR) between two point clouds.
SNR is defined as the ratio of the RMS power of the signal (clean point cloud) to the RMS power of the noise (difference between clean and noisy point clouds).
args:
clean_pcd (point cloud): the clean point cloud
noisy_pcd (point cloud): the noisy point cloud
returns:
snr_db (float): the signal-to-noise ratio in decibels
'''
# Convert point clouds to numpy arrays
clean_points = np.asarray(clean_pcd.points)
noisy_points = np.asarray(noisy_pcd.points)
# Calculate the RMS power of the signal (clean point cloud)
signal_amplitude = np.sqrt(np.mean(np.sum(clean_points**2, axis=1)))
# Calculate the RMS power of the noise (difference between clean and noisy point clouds)
noise_amplitude = np.sqrt(np.mean(np.sum((clean_points - noisy_points)**2, axis=1)))
# Compute the SNR
snr = (signal_amplitude / noise_amplitude)**2
snr_db = 10 * np.log10(snr)
return snr_db
def rotation_error_along_axis(gt_transformation, est_transformation, convention = 'zyx', verbose = False):
'''
This function calculates the rotation error along the each axis (Euler angle) between the estimated and ground truth rotation matrices.
It gives a warning if gimbal lock is detected (90 or 270 degrees).
Based on formulas and discussions in:
https://www.youtube.com/watch?v=wg9bI8-Qx2Q (10:29)
Args:
gt_transformation: the ground truth transformation
est_transformation: the estimated transformation
convention: the convention for the Euler angles (default and only one supported is 'zyx')
verbose: if True, the Euler angles are printed
Returns:
theta_x_deg: the rotation error along the x-axis (degrees) rounded to 3 decimal places
theta_y_deg: the rotation error along the y-axis (degrees) rounded to 3 decimal places
theta_z_deg: the rotation error along the z-axis (degrees) rounded to 3 decimal places
'''
if convention != 'zyx':
raise ValueError("Invalid convention. Only 'zyx' is supported.")
estimated_rotation = get_rotaion(est_transformation)
ground_truth_rotation = gt_transformation[:3, :3]
R_relative = np.dot(ground_truth_rotation, estimated_rotation.T)
theta_z = atan2(R_relative[1, 0], R_relative[0, 0]) # Euler angles = atan2(r21, r11)
theta_x = atan2(R_relative[2, 1], R_relative[2, 2]) # Euler angles = atan2(r32, r33)
if np.isclose(np.cos(theta_z), 0.0, atol=1e-6):
second_term = R_relative[1, 0]/np.sin(theta_z)
theta_y = atan2(-R_relative[2, 0], second_term)
else:
second_term = R_relative[0, 0]/np.cos(theta_z)
theta_y = atan2(-R_relative[2, 0], second_term)
# Convert to degrees
theta_x_deg = np.round(abs(np.rad2deg(theta_x)), 3)
theta_y_deg = np.round(abs(np.rad2deg(theta_y)), 3)
theta_z_deg = np.round(abs(np.rad2deg(theta_z)), 3)
if verbose:
if np.round(theta_y_deg, 3) == 90 or np.round(theta_y_deg, 3) == 270:
print("Warning: Gimbal lock detected! It might not be possible to uniquely and accurately determine all angles.")
print(f'{theta_x_deg}° error along x-axis, {theta_y_deg}° error along y-axis and {theta_z_deg}° error along z-axis.')
return theta_x_deg, theta_y_deg, theta_z_deg
def angle_diff(a, b):
'''
This function calculates the smallest unsigned angle difference in degrees.
'''
diff = abs(a - b) % 360
return min(diff, 360 - diff)
def signed_angle_diff(a, b):
'''
This function calculates the signed angle difference in degrees.
'''
diff = (b - a + 180) % 360 - 180
return diff
def decompose_rotation_error(gt_transformation, est_transformation, signed = True, convention = 'zyx', verbose = False):
'''
This fuction calculates Euler angles (rotation) differences between the estimated and ground truth transformation matrices.
It uses the scipy.spatial.transform.Rotation class to extract the Euler angles from the rotation matrices.
If Gimbal lock is detected, it uses a manual calculation of the angles.
Args:
gt_transformation: the ground truth transformation matrix
est: the estimated transformation matrix
signed: if True, the signed angle difference is calculated
convention: the convention for the Euler angles (default and only supported is 'zyx')
This restriction is because the rotation matrix applied to simulate data is 'xyz' order which is the inverse of 'zyx' - because initrinsic and extrinsic rotations are inverted. Source: https://dominicplein.medium.com/extrinsic-intrinsic-rotation-do-i-multiply-from-right-or-left-357c38c1abfd
verbose: if True, the Euler angles are printed
Returns:
x_diff: the difference in the x-axis rotation (degrees)
y_diff: the difference in the y-axis rotation (degrees)
z_diff: the difference in the z-axis rotation (degrees)
OR if Gimbal lock is detected:
re_along_x: the rotation error along the x-axis (degrees)
re_along_y: the rotation error along the y-axis (degrees)
re_along_z: the rotation error along the z-axis (degrees)
Raises:
RuntimeError: if Gimbal lock is detected.
'''
if convention != 'zyx':
raise ValueError("Invalid convention. Only 'zyx' is supported.")
# Get rotation matrices
estimated_rotation = get_rotaion(est_transformation)
gt_rotation = gt_transformation[:3, :3]
# Get Euler degrees using scipy
try:
with warnings.catch_warnings(record=True) as w:
warnings.simplefilter("always")
gt_euler = R.from_matrix(gt_rotation).as_euler(convention, degrees=True)
gt_z, gt_y, gt_x = np.round(gt_euler, 3)
est_euler = R.from_matrix(estimated_rotation).as_euler(convention, degrees=True)
est_z, est_y, est_x = np.round(est_euler, 3)
# Check for Gimbal lock warning
gimal_lock_warning = any("Gimbal lock detected" in str(warn.message) for warn in w)
if gimal_lock_warning:
raise RuntimeError("Gimbal lock detected!")
if verbose:
print(f"Extracted Ground Truth Euler angles (deg): x={gt_x}, y={gt_y}, z={gt_z}")
print(f"Extracted Estimated Euler angles (deg): x={est_x}, y={est_y}, z={est_z}")
# compute differences
diff_fn = signed_angle_diff if signed else angle_diff
x_diff = diff_fn(gt_x, est_x)
y_diff = diff_fn(gt_y, est_y)
z_diff = diff_fn(gt_z, est_z)
# Use manual calculation of angles if Gimbal lock is detected
except RuntimeError as e:
print(f'{e} - Trying manual calculation of angles.') if verbose else None
x_diff, y_diff, z_diff = rotation_error_along_axis(gt_transformation, est_transformation, convention)
if verbose:
print(f'{x_diff}° error along x-axis, {y_diff}° error along y-axis and {z_diff}° error along z-axis.')
return x_diff, y_diff, z_diff
# --------- UNUSED FUNCTIONS ---------
def error_histogram(source, target, result, dis_type ='mse', bins = 200):
'''
This function creates a histogram of the errors between the target and result point clouds.
args:
target: the target point cloud
result: the result point cloud
dis_type: the type of distance to calculate the error (mse or mae)
bins: the number of bins for the histogram
returns:
histogram (Plot): the histogram plot of the errors
all_errors (list): the errors between the source and target point clouds (for inlier ratio calculation)
'''
# Calcualte error between the correspondences
all_errors = []
for i in range(len(source.points)):
if dis_type =='mse':
# Error as root mean square error
error = np.sqrt(np.sum((np.asarray(result.points[i]) - np.asarray(target.points[i]))**2))
elif dis_type == 'mae':
# Error as mean absolute error
error = np.mean(np.abs(np.asarray(result.points[i]) - np.asarray(target.points[i])))
all_errors.append(error)
# Make a histogram of the errors
plt.hist(all_errors, bins = bins)
plt.xlabel('Error')
plt.ylabel('Frequency')
plt.show()
return all_errors
def rotation_error_along_z (gt_transformation, est, symmetry = None):
'''
This function calculates the rotation error along the z-axis (Euler angle) between the estimated and ground truth rotation matrices.
Based on formulas and discussions in:
https://math.stackexchange.com/questions/31001/finding-the-cos-angle-between-two-matrices-using-the-euclidean-inner-product
https://stackoverflow.com/questions/15022630/how-to-calculate-the-angle-from-rotation-matrix
https://www.youtube.com/watch?v=wg9bI8-Qx2Q (10:29)
For C2 and C4 symmetries, the explanation is here:
https://www2.math.upenn.edu/~mlazar/math170/notes07-4.pdf
https://web.stanford.edu/~kaleeg/chem32/groupT/
'''
estimated_rotation = get_rotaion(est)
ground_truth_rotation = gt_transformation[:3, :3]
R = np.dot(ground_truth_rotation, estimated_rotation.T)
theta_z = atan2(R[1, 0], R[0, 0]) # Euler angles
theta_z_deg = abs(np.rad2deg(theta_z))
if symmetry == 'C2':
theta_z_deg = min(theta_z_deg, abs(180 - theta_z_deg))
elif symmetry == 'C4':
theta_z_deg = min(theta_z_deg, abs(90 - theta_z_deg), abs(180 - theta_z_deg), abs(270 - theta_z_deg))
return np.round(theta_z_deg, 3)
def rotation_error_along_x (gt_transformation, est):
'''
This function calculates the rotation error along the x-axis (Euler angle) between the estimated and ground truth rotation matrices.
Based on formulas and discussions in:
https://www.youtube.com/watch?v=wg9bI8-Qx2Q (10:29)
Args:
est: the estimated transformation
gt_transformation: the ground truth transformation
Returns:
theta_x_deg: the rotation error along the x-axis (degrees) rounded to 3 decimal places
'''
estimated_rotation = get_rotaion(est)
ground_truth_rotation = gt_transformation[:3, :3]
R = np.dot(ground_truth_rotation, estimated_rotation.T)
theta_x = atan2(R[2, 1], R[2, 2]) # Euler angles = atan2(r32, r33)
theta_x_deg = abs(np.rad2deg(theta_x))
return np.round(theta_x_deg, 3)
def rotation_error_along_y (gt_transformation, est, theta_z_deg):
'''
This function calculates the rotation error along the y-axis (Euler angle) between the estimated and ground truth rotation matrices.
It gives a warning if gimbal lock is detected (90 or 270 degrees).
Based on formulas and discussions in:
https://www.youtube.com/watch?v=wg9bI8-Qx2Q
Args:
est: the estimated transformation
gt_transformation: the ground truth transformation
theta_z_deg: the rotation error along the z-axis (degrees)
Returns:
theta_y_deg: the rotation error along the y-axis (degrees) rounded to 3 decimal places
'''
estimated_rotation = get_rotaion(est)
ground_truth_rotation = gt_transformation[:3, :3]
R = np.dot(ground_truth_rotation, estimated_rotation.T)
if np.cos(np.deg2rad(theta_z_deg)) == 0:
second_term = R[1, 0]/np.sin(np.deg2rad(theta_z_deg))
theta_y = atan2(-R[2, 0], second_term)
else:
second_term = R[0, 0]/np.cos(np.deg2rad(theta_z_deg))
theta_y = atan2(-R[2, 0], second_term)
theta_y_deg = abs(np.rad2deg(theta_y))
if np.round(theta_y_deg, 3) == 90 or np.round(theta_y_deg, 3) == 270:
print("Warning: Gimbal lock detected! It might not be possible to uniquely and accurately determine all angles.")
return np.round(theta_y_deg, 3)
# Construct the transformation matrix from the rotation matrix, translation vector, and scale (for Probreg)
def reconstruct_transformation_propreg(rot, t, scale):
scaled_rotation = scale * rot
T = np.eye(4)
T[:3, :3] = scaled_rotation
T[:3, 3] = t
return T
def get_transformation(est):
# Extract the transformation matrices
try:
estimation_transformation = est.transformation # for open3d
except AttributeError:
try:
estimation_transformation = reconstruct_transformation_propreg(est.rot, est.t, est.scale) # for Probreg
except: # for learning 3d
estimation_transformation = est['est_T'].detach().cpu().numpy()[0]
estimation_transformation = estimation_transformation.reshape(4,4)
return estimation_transformation
def transformation_error(est, gt_transformation): # ATTENTION: not a good metric because transformations consist of rotation and translation, which have different metrics (one is radian, the other centimeters).
'''
This function calculates transformation error as the root-mean-square error between estimated transformation and ground truth transformation
Based on definitions in this paper https://arxiv.org/pdf/2103.02690
args:
est: the estimation object
gt_transformation: the ground truth transformation
returns:
transformation_error: the transformation error
'''
estimation_transformation = get_transformation(est)
rmseT = np.sqrt(np.mean(np.square(estimation_transformation - gt_transformation)))
return rmseT
def remove_outliers(data):
'''
This function removes outliers from the data based on the interquartile range (IQR).
Based on https://medium.com/@davidnh8/outlier-detection-101-median-and-interquartile-range-cc9dde94c0ac
Args:
data (np.array): The data to remove outliers from.
Returns:
clear_data (np.array): The data without outliers.
outlier_index (np.array): The indices of the outliers.
'''
q1 = np.percentile(data, 25)
q3 = np.percentile(data, 75)
iqr = q3 - q1
lower_bound = q1 - 1.5 * iqr
upper_bound = q3 + 1.5 * iqr
outlier_index = np.where((data <= lower_bound) | (data >= upper_bound))
clear_data = np.delete(data, outlier_index)
return clear_data, outlier_index
def get_overlap_ratio(source,target,threshold):
"""
- Overlap is defined as the ratio of the number of points in each point cloud that cover a region of the scene,
which is also covered by the other point cloud, to the total number of points in the point cloud.
- Overlap is computed as the ratio of the number of points in the source point cloud that are within a distance
threshold to the target point cloud to the total number of points in the source point cloud.
Taken from https://github.com/prs-eth/OverlapPredator/blob/main/scripts/cal_overlap.py
Based on https://www.open3d.org/docs/latest/tutorial/Basic/kdtree.html
"""
pcd_tree = o3d.geometry.KDTreeFlann(target)
match_count=0
for i, point in enumerate(source.points):
[count, _, _] = pcd_tree.search_radius_vector_3d(point, threshold)
if(count!=0):
match_count+=1
overlap_ratio = match_count / len(source.points) *100
return overlap_ratio