Vincentqyw
fix: roma
8b973ee
raw
history blame
9.09 kB
import torch
import cv2
import numpy as np
from collections import OrderedDict
from loguru import logger
from kornia.geometry.epipolar import numeric
from kornia.geometry.conversions import convert_points_to_homogeneous
# --- METRICS ---
def relative_pose_error(T_0to1, R, t, ignore_gt_t_thr=0.0):
# angle error between 2 vectors
t_gt = T_0to1[:3, 3]
n = np.linalg.norm(t) * np.linalg.norm(t_gt)
t_err = np.rad2deg(np.arccos(np.clip(np.dot(t, t_gt) / n, -1.0, 1.0)))
t_err = np.minimum(t_err, 180 - t_err) # handle E ambiguity
if np.linalg.norm(t_gt) < ignore_gt_t_thr: # pure rotation is challenging
t_err = 0
# angle error between 2 rotation matrices
R_gt = T_0to1[:3, :3]
cos = (np.trace(np.dot(R.T, R_gt)) - 1) / 2
cos = np.clip(cos, -1.0, 1.0) # handle numercial errors
R_err = np.rad2deg(np.abs(np.arccos(cos)))
return t_err, R_err
def symmetric_epipolar_distance(pts0, pts1, E, K0, K1):
"""Squared symmetric epipolar distance.
This can be seen as a biased estimation of the reprojection error.
Args:
pts0 (torch.Tensor): [N, 2]
E (torch.Tensor): [3, 3]
"""
pts0 = (pts0 - K0[[0, 1], [2, 2]][None]) / K0[[0, 1], [0, 1]][None]
pts1 = (pts1 - K1[[0, 1], [2, 2]][None]) / K1[[0, 1], [0, 1]][None]
pts0 = convert_points_to_homogeneous(pts0)
pts1 = convert_points_to_homogeneous(pts1)
Ep0 = pts0 @ E.T # [N, 3]
p1Ep0 = torch.sum(pts1 * Ep0, -1) # [N,]
Etp1 = pts1 @ E # [N, 3]
d = p1Ep0**2 * (
1.0 / (Ep0[:, 0] ** 2 + Ep0[:, 1] ** 2)
+ 1.0 / (Etp1[:, 0] ** 2 + Etp1[:, 1] ** 2)
) # N
return d
def compute_symmetrical_epipolar_errors(data):
"""
Update:
data (dict):{"epi_errs": [M]}
"""
Tx = numeric.cross_product_matrix(data["T_0to1"][:, :3, 3])
E_mat = Tx @ data["T_0to1"][:, :3, :3]
m_bids = data["m_bids"]
pts0 = data["mkpts0_f"]
pts1 = data["mkpts1_f"]
epi_errs = []
for bs in range(Tx.size(0)):
mask = m_bids == bs
epi_errs.append(
symmetric_epipolar_distance(
pts0[mask], pts1[mask], E_mat[bs], data["K0"][bs], data["K1"][bs]
)
)
epi_errs = torch.cat(epi_errs, dim=0)
data.update({"epi_errs": epi_errs})
def compute_symmetrical_epipolar_errors_offset(data):
"""
Update:
data (dict):{"epi_errs": [M]}
"""
Tx = numeric.cross_product_matrix(data["T_0to1"][:, :3, 3])
E_mat = Tx @ data["T_0to1"][:, :3, :3]
m_bids = data["offset_bids"]
l_ids = data["offset_lids"]
pts0 = data["offset_kpts0_f"]
pts1 = data["offset_kpts1_f"]
epi_errs = []
layer_num = data["predict_flow"][0].shape[0]
for bs in range(Tx.size(0)):
for ls in range(layer_num):
mask_b = m_bids == bs
mask_l = l_ids == ls
mask = mask_b & mask_l
epi_errs.append(
symmetric_epipolar_distance(
pts0[mask], pts1[mask], E_mat[bs], data["K0"][bs], data["K1"][bs]
)
)
epi_errs = torch.cat(epi_errs, dim=0)
data.update({"epi_errs_offset": epi_errs}) # [b*l*n]
def compute_symmetrical_epipolar_errors_offset_bidirectional(data):
"""
Update
data (dict):{"epi_errs": [M]}
"""
_compute_symmetrical_epipolar_errors_offset(data, "left")
_compute_symmetrical_epipolar_errors_offset(data, "right")
def _compute_symmetrical_epipolar_errors_offset(data, side):
"""
Update
data (dict):{"epi_errs": [M]}
"""
assert side == "left" or side == "right", "invalid side"
Tx = numeric.cross_product_matrix(data["T_0to1"][:, :3, 3])
E_mat = Tx @ data["T_0to1"][:, :3, :3]
m_bids = data["offset_bids_" + side]
l_ids = data["offset_lids_" + side]
pts0 = data["offset_kpts0_f_" + side]
pts1 = data["offset_kpts1_f_" + side]
epi_errs = []
layer_num = data["predict_flow"][0].shape[0]
for bs in range(Tx.size(0)):
for ls in range(layer_num):
mask_b = m_bids == bs
mask_l = l_ids == ls
mask = mask_b & mask_l
epi_errs.append(
symmetric_epipolar_distance(
pts0[mask], pts1[mask], E_mat[bs], data["K0"][bs], data["K1"][bs]
)
)
epi_errs = torch.cat(epi_errs, dim=0)
data.update({"epi_errs_offset_" + side: epi_errs}) # [b*l*n]
def estimate_pose(kpts0, kpts1, K0, K1, thresh, conf=0.99999):
if len(kpts0) < 5:
return None
# normalize keypoints
kpts0 = (kpts0 - K0[[0, 1], [2, 2]][None]) / K0[[0, 1], [0, 1]][None]
kpts1 = (kpts1 - K1[[0, 1], [2, 2]][None]) / K1[[0, 1], [0, 1]][None]
# normalize ransac threshold
ransac_thr = thresh / np.mean([K0[0, 0], K1[1, 1], K0[0, 0], K1[1, 1]])
# compute pose with cv2
E, mask = cv2.findEssentialMat(
kpts0, kpts1, np.eye(3), threshold=ransac_thr, prob=conf, method=cv2.RANSAC
)
if E is None:
print("\nE is None while trying to recover pose.\n")
return None
# recover pose from E
best_num_inliers = 0
ret = None
for _E in np.split(E, len(E) / 3):
n, R, t, _ = cv2.recoverPose(_E, kpts0, kpts1, np.eye(3), 1e9, mask=mask)
if n > best_num_inliers:
ret = (R, t[:, 0], mask.ravel() > 0)
best_num_inliers = n
return ret
def compute_pose_errors(data, config):
"""
Update:
data (dict):{
"R_errs" List[float]: [N]
"t_errs" List[float]: [N]
"inliers" List[np.ndarray]: [N]
}
"""
pixel_thr = config.TRAINER.RANSAC_PIXEL_THR # 0.5
conf = config.TRAINER.RANSAC_CONF # 0.99999
data.update({"R_errs": [], "t_errs": [], "inliers": []})
m_bids = data["m_bids"].cpu().numpy()
pts0 = data["mkpts0_f"].cpu().numpy()
pts1 = data["mkpts1_f"].cpu().numpy()
K0 = data["K0"].cpu().numpy()
K1 = data["K1"].cpu().numpy()
T_0to1 = data["T_0to1"].cpu().numpy()
for bs in range(K0.shape[0]):
mask = m_bids == bs
ret = estimate_pose(
pts0[mask], pts1[mask], K0[bs], K1[bs], pixel_thr, conf=conf
)
if ret is None:
data["R_errs"].append(np.inf)
data["t_errs"].append(np.inf)
data["inliers"].append(np.array([]).astype(np.bool))
else:
R, t, inliers = ret
t_err, R_err = relative_pose_error(T_0to1[bs], R, t, ignore_gt_t_thr=0.0)
data["R_errs"].append(R_err)
data["t_errs"].append(t_err)
data["inliers"].append(inliers)
# --- METRIC AGGREGATION ---
def error_auc(errors, thresholds):
"""
Args:
errors (list): [N,]
thresholds (list)
"""
errors = [0] + sorted(list(errors))
recall = list(np.linspace(0, 1, len(errors)))
aucs = []
thresholds = [5, 10, 20]
for thr in thresholds:
last_index = np.searchsorted(errors, thr)
y = recall[:last_index] + [recall[last_index - 1]]
x = errors[:last_index] + [thr]
aucs.append(np.trapz(y, x) / thr)
return {f"auc@{t}": auc for t, auc in zip(thresholds, aucs)}
def epidist_prec(errors, thresholds, ret_dict=False, offset=False):
precs = []
for thr in thresholds:
prec_ = []
for errs in errors:
correct_mask = errs < thr
prec_.append(np.mean(correct_mask) if len(correct_mask) > 0 else 0)
precs.append(np.mean(prec_) if len(prec_) > 0 else 0)
if ret_dict:
return (
{f"prec@{t:.0e}": prec for t, prec in zip(thresholds, precs)}
if not offset
else {f"prec_flow@{t:.0e}": prec for t, prec in zip(thresholds, precs)}
)
else:
return precs
def aggregate_metrics(metrics, epi_err_thr=5e-4):
"""Aggregate metrics for the whole dataset:
(This method should be called once per dataset)
1. AUC of the pose error (angular) at the threshold [5, 10, 20]
2. Mean matching precision at the threshold 5e-4(ScanNet), 1e-4(MegaDepth)
"""
# filter duplicates
unq_ids = OrderedDict((iden, id) for id, iden in enumerate(metrics["identifiers"]))
unq_ids = list(unq_ids.values())
logger.info(f"Aggregating metrics over {len(unq_ids)} unique items...")
# pose auc
angular_thresholds = [5, 10, 20]
pose_errors = np.max(np.stack([metrics["R_errs"], metrics["t_errs"]]), axis=0)[
unq_ids
]
aucs = error_auc(pose_errors, angular_thresholds) # (auc@5, auc@10, auc@20)
# matching precision
dist_thresholds = [epi_err_thr]
precs = epidist_prec(
np.array(metrics["epi_errs"], dtype=object)[unq_ids], dist_thresholds, True
) # (prec@err_thr)
# offset precision
try:
precs_offset = epidist_prec(
np.array(metrics["epi_errs_offset"], dtype=object)[unq_ids],
[2e-3],
True,
offset=True,
)
return {**aucs, **precs, **precs_offset}
except:
return {**aucs, **precs}