% LDLT / UCI_N4 / jmlr_tables.tex
% SuperComputer's picture
% Add files using upload-large-folder tool
% a1efe59 verified
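% JMLR-ready tables for two-column papers
% Required packages (no siunitx):
% \usepackage{booktabs}
% \usepackage{threeparttable}
% \usepackage{threeparttablex} % for TableNotes + longtable
% \usepackage{longtable}
% \usepackage{amsmath}  % \text in the Wilcoxon table headers
% \usepackage{amssymb}  % \blacktriangle, \blacktriangledown in the pairwise-outcome tables
% \usepackage{xcolor}   % \textcolor in the pairwise-outcome tables
% Optional for landscape: \usepackage{pdflscape}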
\begin{table*}[t]
  % Full-width float: per-algorithm size summary. Each numeric cell is a
  % min--max range (see caption); all six rows share the same Width, Depth,
  % Padding, Input dim and Output dim ranges and differ only in Parameters.
  \centering
  \begin{threeparttable}
    \caption{Model dimension ranges (min--max across all datasets and folds). Input/Output dimensions follow dataset label spaces.}
    \label{tab:model-ranges}
    \begin{tabular}{lrrrrrr}
      \toprule
      Algorithm  & Width   & Depth & Parameters    & Padding & Input dim & Output dim \\
      \midrule
      AOL        & 32--512 & 4--4  & 282--694837   & 10--524 & 3--262    & 2--100 \\
      Orthogonal & 32--512 & 4--4  & 285--694840   & 10--524 & 3--262    & 2--100 \\
      Sandwich   & 32--512 & 4--4  & 615--1520140  & 10--524 & 3--262    & 2--100 \\
      SLL        & 32--512 & 4--4  & 1558--1084073 & 10--524 & 3--262    & 2--100 \\
      LDLT-L     & 32--512 & 4--4  & 3366--929297  & 10--524 & 3--262    & 2--100 \\
      LDLT-R     & 32--512 & 4--4  & 3463--1063442 & 10--524 & 3--262    & 2--100 \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table*}
\begin{table*}[t]
  % Full-width float: mean +/- std of clean accuracy and of certified accuracy
  % at four radii. In each cell the "+/- std" part is set in \tiny; the
  % declaration is scoped by the cell (or by the enclosing \textbf group).
  % Bold marks the largest mean in each column.
  \centering
  \begin{threeparttable}
    \caption{Sorted mean$\pm$std across $N$ datasets for each algorithm.}
    \label{tab:metric_summary}
    \begin{tabular}{lrlllll}
      \toprule
      % Spanning header over the four certified-accuracy columns (4-7).
      & & & \multicolumn{4}{c}{Certified Accuracy} \\
      \cmidrule(lr){4-7}
      Algorithm & $N$ & Accuracy & 36/255 & 72/255 & 108/255 & 255/255 \\
      \midrule
      AOL & 121 & 0.6295\,\tiny$\pm$0.2278 & 0.3669\,\tiny$\pm$0.2895 & 0.2660\,\tiny$\pm$0.2953 & 0.2076\,\tiny$\pm$0.2819 & 0.0999\,\tiny$\pm$0.1875 \\
      Orthogonal & 121 & 0.6969\,\tiny$\pm$0.1938 & 0.5973\,\tiny$\pm$0.2386 & 0.5073\,\tiny$\pm$0.2617 & 0.4300\,\tiny$\pm$0.2702 & 0.1970\,\tiny$\pm$0.2288 \\
      Sandwich & 121 & 0.7215\,\tiny$\pm$0.1871 & \textbf{0.6375\,\tiny$\pm$0.2305} & \textbf{0.5593\,\tiny$\pm$0.2503} & \textbf{0.4836\,\tiny$\pm$0.2659} & \textbf{0.2496\,\tiny$\pm$0.2471} \\
      SLL & 121 & 0.6978\,\tiny$\pm$0.1998 & 0.5885\,\tiny$\pm$0.2451 & 0.4975\,\tiny$\pm$0.2649 & 0.4146\,\tiny$\pm$0.2715 & 0.1918\,\tiny$\pm$0.2222 \\
      \midrule
      % The two LDLT variants are set apart from the four rows above by a rule.
      LDLT-L & 121 & \textbf{0.7223\,\tiny$\pm$0.1868} & 0.5301\,\tiny$\pm$0.2920 & 0.4293\,\tiny$\pm$0.3049 & 0.3535\,\tiny$\pm$0.3003 & 0.1652\,\tiny$\pm$0.2281 \\
      LDLT-R & 121 & 0.7022\,\tiny$\pm$0.1944 & 0.6107\,\tiny$\pm$0.2314 & 0.5292\,\tiny$\pm$0.2525 & 0.4492\,\tiny$\pm$0.2655 & 0.2172\,\tiny$\pm$0.2312 \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table*}
\begin{table}[t]
  % Overall ranking on Mean Accuracy. Rows are ordered by average rank.
  % In every row: net wins = sig wins - sig losses, and win share = sig wins / 5.
  % NOTE(review): the reported p equals 2^{-53} (about 1.11e-16), which looks
  % like a floating-point floor rather than an exact value -- confirm, and
  % consider reporting it as $p < 10^{-15}$.
  \centering
  \begin{threeparttable}
    \small % scoped by the threeparttable environment; applies to caption and body
    \caption{Overall comparison on Mean Accuracy: average rank (lower is better) with Iman--Davenport $F(5,600)=44.33$, $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_test_acc}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      % Negative counts are set in math mode so they get a minus sign, not a hyphen.
      LDLT-L     & 2.434 & 4 & 0 & 4    & 0.800 & 0.577 \\
      Sandwich   & 2.566 & 4 & 0 & 4    & 0.800 & 0.517 \\
      LDLT-R     & 3.438 & 1 & 2 & $-1$ & 0.200 & 0.629 \\
      SLL        & 3.624 & 1 & 2 & $-1$ & 0.200 & 0.678 \\
      Orthogonal & 3.831 & 1 & 2 & $-1$ & 0.200 & 0.639 \\
      AOL        & 5.107 & 0 & 5 & $-5$ & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table}[t]
  % Overall ranking on Mean Certified Accuracy (36/255). Rows are ordered by average rank.
  % In every row: net wins = sig wins - sig losses, and win share = sig wins / 5.
  % NOTE(review): the reported p equals 2^{-53} (about 1.11e-16), which looks
  % like a floating-point floor rather than an exact value -- confirm, and
  % consider reporting it as $p < 10^{-15}$.
  \centering
  \begin{threeparttable}
    \small % scoped by the threeparttable environment; applies to caption and body
    \caption{Overall comparison on Mean Certified Accuracy (36/255): average rank (lower is better) with Iman--Davenport $F(5,600)=89.22$, $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_cert_acc_36}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      % Negative counts are set in math mode so they get a minus sign, not a hyphen.
      Sandwich   & 2.021 & 5 & 0 & 5    & 1.000 & 0.626 \\
      LDLT-R     & 2.715 & 4 & 1 & 3    & 0.800 & 0.514 \\
      Orthogonal & 3.417 & 2 & 2 & 0    & 0.400 & 0.627 \\
      SLL        & 3.426 & 2 & 2 & 0    & 0.400 & 0.602 \\
      LDLT-L     & 3.785 & 1 & 4 & $-3$ & 0.200 & 0.732 \\
      AOL        & 5.636 & 0 & 5 & $-5$ & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table}[t]
  % Overall ranking on Mean Certified Accuracy (72/255). Rows are ordered by average rank.
  % In every row: net wins = sig wins - sig losses, and win share = sig wins / 5.
  % NOTE(review): the reported p equals 2^{-53} (about 1.11e-16), which looks
  % like a floating-point floor rather than an exact value -- confirm, and
  % consider reporting it as $p < 10^{-15}$.
  \centering
  \begin{threeparttable}
    \small % scoped by the threeparttable environment; applies to caption and body
    \caption{Overall comparison on Mean Certified Accuracy (72/255): average rank (lower is better) with Iman--Davenport $F(5,600)=101.00$, $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_cert_acc_72}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      % Negative counts are set in math mode so they get a minus sign, not a hyphen.
      Sandwich   & 1.926 & 5 & 0 & 5    & 1.000 & 0.670 \\
      LDLT-R     & 2.628 & 4 & 1 & 3    & 0.800 & 0.557 \\
      Orthogonal & 3.376 & 2 & 2 & 0    & 0.400 & 0.643 \\
      SLL        & 3.409 & 2 & 2 & 0    & 0.400 & 0.640 \\
      LDLT-L     & 4.058 & 1 & 4 & $-3$ & 0.200 & 0.732 \\
      AOL        & 5.603 & 0 & 5 & $-5$ & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table}[t]
  % Overall ranking on Mean Certified Accuracy (108/255). Rows are ordered by average rank.
  % In every row: net wins = sig wins - sig losses, and win share = sig wins / 5.
  % NOTE(review): the reported p equals 2^{-53} (about 1.11e-16), which looks
  % like a floating-point floor rather than an exact value -- confirm, and
  % consider reporting it as $p < 10^{-15}$.
  \centering
  \begin{threeparttable}
    \small % scoped by the threeparttable environment; applies to caption and body
    \caption{Overall comparison on Mean Certified Accuracy (108/255): average rank (lower is better) with Iman--Davenport $F(5,600)=125.70$, $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_cert_acc_108}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      % Negative counts are set in math mode so they get a minus sign, not a hyphen.
      Sandwich   & 1.868 & 5 & 0 & 5    & 1.000 & 0.675 \\
      LDLT-R     & 2.562 & 4 & 1 & 3    & 0.800 & 0.548 \\
      Orthogonal & 3.347 & 2 & 2 & 0    & 0.400 & 0.674 \\
      SLL        & 3.360 & 2 & 2 & 0    & 0.400 & 0.660 \\
      LDLT-L     & 4.136 & 1 & 4 & $-3$ & 0.200 & 0.801 \\
      AOL        & 5.727 & 0 & 5 & $-5$ & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table}[t]
  % Overall ranking on Mean Certified Accuracy (255/255). Rows are ordered by average rank.
  % In every row: net wins = sig wins - sig losses, and win share = sig wins / 5.
  % NOTE(review): the reported p equals 2^{-53} (about 1.11e-16), which looks
  % like a floating-point floor rather than an exact value -- confirm, and
  % consider reporting it as $p < 10^{-15}$.
  \centering
  \begin{threeparttable}
    \small % scoped by the threeparttable environment; applies to caption and body
    \caption{Overall comparison on Mean Certified Accuracy (255/255): average rank (lower is better) with Iman--Davenport $F(5,600)=105.79$, $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_cert_acc_255}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      % Negative counts are set in math mode so they get a minus sign, not a hyphen.
      Sandwich   & 1.909 & 5 & 0 & 5    & 1.000 & 0.671 \\
      LDLT-R     & 2.550 & 4 & 1 & 3    & 0.800 & 0.575 \\
      SLL        & 3.310 & 2 & 2 & 0    & 0.400 & 0.662 \\
      Orthogonal & 3.471 & 2 & 2 & 0    & 0.400 & 0.607 \\
      LDLT-L     & 4.202 & 1 & 4 & $-3$ & 0.200 & 0.796 \\
      AOL        & 5.558 & 0 & 5 & $-5$ & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table}[t]
  % Pairwise outcome matrix for Mean Accuracy (row algorithm vs. column algorithm).
  % Cell shorthands, local to this float:
  %   \PWwin  = green up-triangle (win), \PWloss = red down-triangle (loss),
  %   \PWnone = centred dot (none; also used on the diagonal).
  \centering
  \newcommand*{\PWwin}{\textcolor{green}{$\blacktriangle$}}%
  \newcommand*{\PWloss}{\textcolor{red}{$\blacktriangledown$}}%
  \newcommand*{\PWnone}{$\cdot$}%
  \begin{threeparttable}
    \caption{Pairwise Wilcoxon outcomes for Mean Accuracy (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_test_acc}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}lcccccc@{}}
      \toprule
                 & AOL     & LDLT-L  & LDLT-R  & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL        & \PWnone & \PWloss & \PWloss & \PWloss    & \PWloss  & \PWloss \\
      LDLT-L     & \PWwin  & \PWnone & \PWwin  & \PWwin     & \PWnone  & \PWwin \\
      LDLT-R     & \PWwin  & \PWloss & \PWnone & \PWnone    & \PWloss  & \PWnone \\
      Orthogonal & \PWwin  & \PWloss & \PWnone & \PWnone    & \PWloss  & \PWnone \\
      Sandwich   & \PWwin  & \PWnone & \PWwin  & \PWwin     & \PWnone  & \PWwin \\
      SLL        & \PWwin  & \PWloss & \PWnone & \PWnone    & \PWloss  & \PWnone \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table}[t]
  % Pairwise outcome matrix for Mean Certified Accuracy (36/255)
  % (row algorithm vs. column algorithm).
  % Cell shorthands, local to this float:
  %   \PWwin  = green up-triangle (win), \PWloss = red down-triangle (loss),
  %   \PWnone = centred dot (none; also used on the diagonal).
  \centering
  \newcommand*{\PWwin}{\textcolor{green}{$\blacktriangle$}}%
  \newcommand*{\PWloss}{\textcolor{red}{$\blacktriangledown$}}%
  \newcommand*{\PWnone}{$\cdot$}%
  \begin{threeparttable}
    \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (36/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_cert_acc_36}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}lcccccc@{}}
      \toprule
                 & AOL     & LDLT-L  & LDLT-R  & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL        & \PWnone & \PWloss & \PWloss & \PWloss    & \PWloss  & \PWloss \\
      LDLT-L     & \PWwin  & \PWnone & \PWloss & \PWloss    & \PWloss  & \PWloss \\
      LDLT-R     & \PWwin  & \PWwin  & \PWnone & \PWwin     & \PWloss  & \PWwin \\
      Orthogonal & \PWwin  & \PWwin  & \PWloss & \PWnone    & \PWloss  & \PWnone \\
      Sandwich   & \PWwin  & \PWwin  & \PWwin  & \PWwin     & \PWnone  & \PWwin \\
      SLL        & \PWwin  & \PWwin  & \PWloss & \PWnone    & \PWloss  & \PWnone \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table}[t]
  % Pairwise outcome matrix for Mean Certified Accuracy (72/255)
  % (row algorithm vs. column algorithm).
  % Cell shorthands, local to this float:
  %   \PWwin  = green up-triangle (win), \PWloss = red down-triangle (loss),
  %   \PWnone = centred dot (none; also used on the diagonal).
  \centering
  \newcommand*{\PWwin}{\textcolor{green}{$\blacktriangle$}}%
  \newcommand*{\PWloss}{\textcolor{red}{$\blacktriangledown$}}%
  \newcommand*{\PWnone}{$\cdot$}%
  \begin{threeparttable}
    \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (72/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_cert_acc_72}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}lcccccc@{}}
      \toprule
                 & AOL     & LDLT-L  & LDLT-R  & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL        & \PWnone & \PWloss & \PWloss & \PWloss    & \PWloss  & \PWloss \\
      LDLT-L     & \PWwin  & \PWnone & \PWloss & \PWloss    & \PWloss  & \PWloss \\
      LDLT-R     & \PWwin  & \PWwin  & \PWnone & \PWwin     & \PWloss  & \PWwin \\
      Orthogonal & \PWwin  & \PWwin  & \PWloss & \PWnone    & \PWloss  & \PWnone \\
      Sandwich   & \PWwin  & \PWwin  & \PWwin  & \PWwin     & \PWnone  & \PWwin \\
      SLL        & \PWwin  & \PWwin  & \PWloss & \PWnone    & \PWloss  & \PWnone \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table}[t]
  % Pairwise outcome matrix for Mean Certified Accuracy (108/255)
  % (row algorithm vs. column algorithm).
  % Cell shorthands, local to this float:
  %   \PWwin  = green up-triangle (win), \PWloss = red down-triangle (loss),
  %   \PWnone = centred dot (none; also used on the diagonal).
  \centering
  \newcommand*{\PWwin}{\textcolor{green}{$\blacktriangle$}}%
  \newcommand*{\PWloss}{\textcolor{red}{$\blacktriangledown$}}%
  \newcommand*{\PWnone}{$\cdot$}%
  \begin{threeparttable}
    \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (108/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_cert_acc_108}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}lcccccc@{}}
      \toprule
                 & AOL     & LDLT-L  & LDLT-R  & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL        & \PWnone & \PWloss & \PWloss & \PWloss    & \PWloss  & \PWloss \\
      LDLT-L     & \PWwin  & \PWnone & \PWloss & \PWloss    & \PWloss  & \PWloss \\
      LDLT-R     & \PWwin  & \PWwin  & \PWnone & \PWwin     & \PWloss  & \PWwin \\
      Orthogonal & \PWwin  & \PWwin  & \PWloss & \PWnone    & \PWloss  & \PWnone \\
      Sandwich   & \PWwin  & \PWwin  & \PWwin  & \PWwin     & \PWnone  & \PWwin \\
      SLL        & \PWwin  & \PWwin  & \PWloss & \PWnone    & \PWloss  & \PWnone \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table}[t]
  % Pairwise outcome matrix for Mean Certified Accuracy (255/255)
  % (row algorithm vs. column algorithm).
  % Cell shorthands, local to this float:
  %   \PWwin  = green up-triangle (win), \PWloss = red down-triangle (loss),
  %   \PWnone = centred dot (none; also used on the diagonal).
  \centering
  \newcommand*{\PWwin}{\textcolor{green}{$\blacktriangle$}}%
  \newcommand*{\PWloss}{\textcolor{red}{$\blacktriangledown$}}%
  \newcommand*{\PWnone}{$\cdot$}%
  \begin{threeparttable}
    \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (255/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_cert_acc_255}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}lcccccc@{}}
      \toprule
                 & AOL     & LDLT-L  & LDLT-R  & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL        & \PWnone & \PWloss & \PWloss & \PWloss    & \PWloss  & \PWloss \\
      LDLT-L     & \PWwin  & \PWnone & \PWloss & \PWloss    & \PWloss  & \PWloss \\
      LDLT-R     & \PWwin  & \PWwin  & \PWnone & \PWwin     & \PWloss  & \PWwin \\
      Orthogonal & \PWwin  & \PWwin  & \PWloss & \PWnone    & \PWloss  & \PWnone \\
      Sandwich   & \PWwin  & \PWwin  & \PWwin  & \PWwin     & \PWnone  & \PWwin \\
      SLL        & \PWwin  & \PWwin  & \PWloss & \PWnone    & \PWloss  & \PWnone \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table}
\begin{table*}[t]
  % Pairwise Wilcoxon signed-rank results for Mean Accuracy, one row per
  % algorithm pair (15 pairs), ordered by increasing W.
  % Typesetting conventions used in the body:
  %   - p-values keep E-notation but use an upright "e" and a braced sign
  %     (\mathrm{e}{-}17) so TeX does not set the sign as a binary operator;
  %   - negative median differences are in math mode to get a true minus sign.
  % NOTE(review): some p-value cells print as exactly 0 even though a
  % Holm-adjusted p-value cannot be smaller than its raw p-value (first row:
  % raw 2.3e-17, global-adjusted 0). These look like values lost to the
  % exporter's display precision -- regenerate or report as an upper bound.
  \centering
  \begin{threeparttable}
    \caption[Mean Accuracy]{Wilcoxon signed-rank tests (two-sided) for Mean Accuracy; $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_test_acc}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & LDLT-L & 121 & 16 & 105 & 0 & 0.1322 & $-0.0568$ & 412 & $2.3\mathrm{e}{-}17^{***}$ & $3.4\mathrm{e}{-}16^{***}$ & $0^{***}$ & 0.7708 \\
      AOL & Sandwich & 121 & 18 & 103 & 0 & 0.1488 & $-0.0595$ & 518 & $2.3\mathrm{e}{-}16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7459 \\
      AOL & SLL & 121 & 22 & 99 & 0 & 0.1818 & $-0.0351$ & 806 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6782 \\
      AOL & Orthogonal & 121 & 27 & 94 & 0 & 0.2231 & $-0.0265$ & 971 & $0^{***}$ & $0^{***}$ & $1.0\mathrm{e}{-}10^{***}$ & 0.6394 \\
      AOL & LDLT-R & 121 & 25 & 96 & 0 & 0.2066 & $-0.0313$ & 1013 & $0^{***}$ & $0^{***}$ & $2.0\mathrm{e}{-}10^{***}$ & 0.6295 \\
      Orthogonal & Sandwich & 121 & 31 & 89 & 1 & 0.2603 & $-0.0126$ & 1269 & $6.0\mathrm{e}{-}10^{***}$ & $6.3\mathrm{e}{-}09^{***}$ & $2.2\mathrm{e}{-}08^{***}$ & 0.5643 \\
      LDLT-L & Orthogonal & 121 & 94 & 27 & 0 & 0.7769 & 0.0139 & 1309 & $7.0\mathrm{e}{-}10^{***}$ & $6.6\mathrm{e}{-}09^{***}$ & $2.5\mathrm{e}{-}08^{***}$ & 0.5599 \\
      LDLT-L & SLL & 121 & 86 & 35 & 0 & 0.7107 & 0.0111 & 1503 & $1.5\mathrm{e}{-}08^{***}$ & $1.2\mathrm{e}{-}07^{***}$ & $4.9\mathrm{e}{-}07^{***}$ & 0.5143 \\
      LDLT-L & LDLT-R & 121 & 87 & 33 & 1 & 0.7231 & 0.0108 & 1689 & $3.7\mathrm{e}{-}07^{***}$ & $2.6\mathrm{e}{-}06^{***}$ & $1.1\mathrm{e}{-}05^{***}$ & 0.4639 \\
      Sandwich & SLL & 121 & 83 & 38 & 0 & 0.6860 & 0.0090 & 1789 & $8.8\mathrm{e}{-}07^{***}$ & $5.3\mathrm{e}{-}06^{***}$ & $2.3\mathrm{e}{-}05^{***}$ & 0.4470 \\
      LDLT-R & Sandwich & 121 & 43 & 78 & 0 & 0.3554 & $-0.0068$ & 2364 & $6.0\mathrm{e}{-}04^{***}$ & $3.0\mathrm{e}{-}03^{**}$ & $7.2\mathrm{e}{-}03^{**}$ & 0.3118 \\
      LDLT-R & SLL & 121 & 66 & 54 & 1 & 0.5496 & 0.0019 & 3070 & $1.4\mathrm{e}{-}01$ & $5.7\mathrm{e}{-}01$ & $8.7\mathrm{e}{-}01$ & 0.1338 \\
      LDLT-R & Orthogonal & 121 & 71 & 50 & 0 & 0.5868 & 0.0025 & 3138 & $1.5\mathrm{e}{-}01$ & $5.7\mathrm{e}{-}01$ & $8.7\mathrm{e}{-}01$ & 0.1298 \\
      Orthogonal & SLL & 121 & 60 & 61 & 0 & 0.4959 & $-0.0004$ & 3623 & $8.6\mathrm{e}{-}01$ & $1.0\mathrm{e}{+}00$ & $1.0\mathrm{e}{+}00$ & 0.0158 \\
      LDLT-L & Sandwich & 121 & 59 & 62 & 0 & 0.4876 & $-0.0002$ & 3624 & $8.6\mathrm{e}{-}01$ & $1.0\mathrm{e}{+}00$ & $1.0\mathrm{e}{+}00$ & 0.0155 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}
\begin{table*}[t]
  % Pairwise Wilcoxon signed-rank results for Mean Certified Accuracy (36/255),
  % one row per algorithm pair (15 pairs), ordered by increasing W.
  % Typesetting conventions used in the body:
  %   - p-values keep E-notation but use an upright "e" and a braced sign
  %     (\mathrm{e}{-}20) so TeX does not set the sign as a binary operator;
  %   - negative median differences are in math mode to get a true minus sign.
  % NOTE(review): some p-value cells print as exactly 0 even though a
  % Holm-adjusted p-value cannot be smaller than its raw p-value (AOL vs.
  % LDLT-L: raw 8.5e-16, adjusted 0). These look like values lost to the
  % exporter's display precision -- regenerate or report as an upper bound.
  \centering
  \begin{threeparttable}
    \caption[Mean Certified Accuracy (36/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (36/255); $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_cert_acc_36}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & LDLT-R & 121 & 6 & 115 & 0 & 0.0496 & $-0.2319$ & 84 & $1.1\mathrm{e}{-}20^{***}$ & $1.6\mathrm{e}{-}19^{***}$ & $7.7\mathrm{e}{-}19^{***}$ & 0.8479 \\
      AOL & Sandwich & 121 & 6 & 115 & 0 & 0.0496 & $-0.2436$ & 88 & $1.2\mathrm{e}{-}20^{***}$ & $1.7\mathrm{e}{-}19^{***}$ & $8.4\mathrm{e}{-}19^{***}$ & 0.8470 \\
      AOL & SLL & 121 & 6 & 115 & 0 & 0.0496 & $-0.1912$ & 145 & $4.8\mathrm{e}{-}20^{***}$ & $6.2\mathrm{e}{-}19^{***}$ & $3.2\mathrm{e}{-}18^{***}$ & 0.8336 \\
      AOL & Orthogonal & 121 & 10 & 111 & 0 & 0.0826 & $-0.2187$ & 196 & $1.6\mathrm{e}{-}19^{***}$ & $1.9\mathrm{e}{-}18^{***}$ & $1.0\mathrm{e}{-}17^{***}$ & 0.8216 \\
      AOL & LDLT-L & 121 & 16 & 105 & 0 & 0.1322 & $-0.1218$ & 579 & $8.5\mathrm{e}{-}16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7315 \\
      LDLT-L & Sandwich & 121 & 28 & 93 & 0 & 0.2314 & $-0.0511$ & 884 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6598 \\
      Orthogonal & Sandwich & 121 & 24 & 96 & 1 & 0.2025 & $-0.0275$ & 1002 & $0^{***}$ & $0^{***}$ & $2.0\mathrm{e}{-}10^{***}$ & 0.6282 \\
      Sandwich & SLL & 121 & 97 & 24 & 0 & 0.8017 & 0.0199 & 1005 & $0^{***}$ & $0^{***}$ & $2.0\mathrm{e}{-}10^{***}$ & 0.6314 \\
      LDLT-L & LDLT-R & 121 & 39 & 82 & 0 & 0.3223 & $-0.0372$ & 1356 & $1.6\mathrm{e}{-}09^{***}$ & $1.1\mathrm{e}{-}08^{***}$ & $5.2\mathrm{e}{-}08^{***}$ & 0.5488 \\
      LDLT-L & Orthogonal & 121 & 47 & 74 & 0 & 0.3884 & $-0.0190$ & 1855 & $2.1\mathrm{e}{-}06^{***}$ & $1.2\mathrm{e}{-}05^{***}$ & $4.8\mathrm{e}{-}05^{***}$ & 0.4315 \\
      LDLT-R & SLL & 121 & 81 & 39 & 1 & 0.6736 & 0.0118 & 2104 & $6.5\mathrm{e}{-}05^{***}$ & $2.5\mathrm{e}{-}04^{***}$ & $1.0\mathrm{e}{-}03^{**}$ & 0.3647 \\
      LDLT-L & SLL & 121 & 49 & 72 & 0 & 0.4050 & $-0.0075$ & 2119 & $4.8\mathrm{e}{-}05^{***}$ & $2.4\mathrm{e}{-}04^{***}$ & $9.2\mathrm{e}{-}04^{***}$ & 0.3694 \\
      LDLT-R & Sandwich & 121 & 41 & 80 & 0 & 0.3388 & $-0.0168$ & 2142 & $6.2\mathrm{e}{-}05^{***}$ & $2.5\mathrm{e}{-}04^{***}$ & $1.0\mathrm{e}{-}03^{**}$ & 0.3640 \\
      LDLT-R & Orthogonal & 121 & 78 & 43 & 0 & 0.6446 & 0.0126 & 2429 & $1.1\mathrm{e}{-}03^{**}$ & $2.2\mathrm{e}{-}03^{**}$ & $1.1\mathrm{e}{-}02^{*}$ & 0.2965 \\
      Orthogonal & SLL & 121 & 60 & 61 & 0 & 0.4959 & $-0.0004$ & 3076 & $1.1\mathrm{e}{-}01$ & $1.1\mathrm{e}{-}01$ & $8.7\mathrm{e}{-}01$ & 0.1444 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}
\begin{table*}[t]
  % Pairwise Wilcoxon signed-rank results for Mean Certified Accuracy (72/255),
  % one row per algorithm pair (15 pairs), ordered by increasing W.
  % Typesetting conventions used in the body:
  %   - p-values keep E-notation but use an upright "e" and a braced sign
  %     (\mathrm{e}{-}20) so TeX does not set the sign as a binary operator;
  %   - negative median differences are in math mode to get a true minus sign.
  % NOTE(review): several p-value cells print as exactly 0 (W = 557 through
  % W = 930). These are presumably values lost to the exporter's display
  % precision rather than exact zeros -- TODO confirm and regenerate, or
  % report as an upper bound.
  \centering
  \begin{threeparttable}
    \caption[Mean Certified Accuracy (72/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (72/255); $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_cert_acc_72}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & Sandwich & 121 & 7 & 114 & 0 & 0.0579 & $-0.2614$ & 107 & $1.9\mathrm{e}{-}20^{***}$ & $2.9\mathrm{e}{-}19^{***}$ & $1.3\mathrm{e}{-}18^{***}$ & 0.8425 \\
      AOL & LDLT-R & 121 & 5 & 116 & 0 & 0.0413 & $-0.2327$ & 116 & $2.4\mathrm{e}{-}20^{***}$ & $3.3\mathrm{e}{-}19^{***}$ & $1.6\mathrm{e}{-}18^{***}$ & 0.8404 \\
      AOL & SLL & 121 & 5 & 116 & 0 & 0.0413 & $-0.1928$ & 162 & $7.1\mathrm{e}{-}20^{***}$ & $9.3\mathrm{e}{-}19^{***}$ & $4.6\mathrm{e}{-}18^{***}$ & 0.8296 \\
      AOL & Orthogonal & 121 & 11 & 110 & 0 & 0.0909 & $-0.2064$ & 214 & $2.4\mathrm{e}{-}19^{***}$ & $2.9\mathrm{e}{-}18^{***}$ & $1.5\mathrm{e}{-}17^{***}$ & 0.8174 \\
      AOL & LDLT-L & 121 & 19 & 100 & 2 & 0.1653 & $-0.1250$ & 557 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7323 \\
      Orthogonal & Sandwich & 121 & 19 & 101 & 1 & 0.1612 & $-0.0346$ & 601 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7240 \\
      LDLT-L & Sandwich & 121 & 20 & 101 & 0 & 0.1653 & $-0.0772$ & 607 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7250 \\
      Sandwich & SLL & 121 & 95 & 25 & 1 & 0.7893 & 0.0393 & 801 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6762 \\
      LDLT-L & LDLT-R & 121 & 30 & 91 & 0 & 0.2479 & $-0.0627$ & 930 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6490 \\
      LDLT-L & Orthogonal & 121 & 42 & 79 & 0 & 0.3471 & $-0.0210$ & 1696 & $2.5\mathrm{e}{-}07^{***}$ & $1.5\mathrm{e}{-}06^{***}$ & $7.5\mathrm{e}{-}06^{***}$ & 0.4689 \\
      LDLT-L & SLL & 121 & 42 & 79 & 0 & 0.3471 & $-0.0213$ & 1776 & $7.4\mathrm{e}{-}07^{***}$ & $3.7\mathrm{e}{-}06^{***}$ & $2.0\mathrm{e}{-}05^{***}$ & 0.4501 \\
      LDLT-R & SLL & 121 & 83 & 38 & 0 & 0.6860 & 0.0192 & 1938 & $5.9\mathrm{e}{-}06^{***}$ & $2.3\mathrm{e}{-}05^{***}$ & $1.3\mathrm{e}{-}04^{***}$ & 0.4120 \\
      LDLT-R & Sandwich & 121 & 40 & 81 & 0 & 0.3306 & $-0.0197$ & 2062 & $2.5\mathrm{e}{-}05^{***}$ & $7.6\mathrm{e}{-}05^{***}$ & $5.2\mathrm{e}{-}04^{***}$ & 0.3828 \\
      LDLT-R & Orthogonal & 121 & 78 & 43 & 0 & 0.6446 & 0.0178 & 2306 & $3.4\mathrm{e}{-}04^{***}$ & $6.9\mathrm{e}{-}04^{***}$ & $4.5\mathrm{e}{-}03^{**}$ & 0.3254 \\
      Orthogonal & SLL & 121 & 66 & 55 & 0 & 0.5455 & 0.0041 & 3178 & $1.9\mathrm{e}{-}01$ & $1.9\mathrm{e}{-}01$ & $8.7\mathrm{e}{-}01$ & 0.1204 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}
\begin{table*}[t]
  % Pairwise Wilcoxon signed-rank results for Mean Certified Accuracy (108/255),
  % one row per algorithm pair (15 pairs), ordered by increasing W.
  % Typesetting conventions used in the body:
  %   - p-values keep E-notation but use an upright "e" and a braced sign
  %     (\mathrm{e}{-}21) so TeX does not set the sign as a binary operator;
  %   - negative median differences are in math mode to get a true minus sign.
  % NOTE(review): some p-value cells print as exactly 0 even though a
  % Holm-adjusted p-value cannot be smaller than its raw p-value (LDLT-L vs.
  % Sandwich: raw 1.3e-16, adjusted 0). These look like values lost to the
  % exporter's display precision -- regenerate or report as an upper bound.
  \centering
  \begin{threeparttable}
    \caption[Mean Certified Accuracy (108/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (108/255); $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_cert_acc_108}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & LDLT-R & 121 & 1 & 120 & 0 & 0.0083 & $-0.2229$ & 11 & $1.8\mathrm{e}{-}21^{***}$ & $2.7\mathrm{e}{-}20^{***}$ & $1.3\mathrm{e}{-}19^{***}$ & 0.8651 \\
      AOL & SLL & 121 & 4 & 117 & 0 & 0.0331 & $-0.1616$ & 33 & $3.1\mathrm{e}{-}21^{***}$ & $4.3\mathrm{e}{-}20^{***}$ & $2.3\mathrm{e}{-}19^{***}$ & 0.8599 \\
      AOL & Orthogonal & 121 & 6 & 115 & 0 & 0.0496 & $-0.1829$ & 54 & $5.2\mathrm{e}{-}21^{***}$ & $6.8\mathrm{e}{-}20^{***}$ & $3.8\mathrm{e}{-}19^{***}$ & 0.8550 \\
      AOL & Sandwich & 121 & 5 & 116 & 0 & 0.0413 & $-0.2530$ & 63 & $6.5\mathrm{e}{-}21^{***}$ & $7.8\mathrm{e}{-}20^{***}$ & $4.7\mathrm{e}{-}19^{***}$ & 0.8529 \\
      AOL & LDLT-L & 121 & 15 & 102 & 4 & 0.1405 & $-0.0795$ & 265 & $4.5\mathrm{e}{-}18^{***}$ & $5.0\mathrm{e}{-}17^{***}$ & $2.7\mathrm{e}{-}16^{***}$ & 0.8011 \\
      LDLT-L & Sandwich & 121 & 16 & 104 & 1 & 0.1364 & $-0.0911$ & 469 & $1.3\mathrm{e}{-}16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7556 \\
      Orthogonal & Sandwich & 121 & 15 & 106 & 0 & 0.1240 & $-0.0411$ & 634 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7186 \\
      Sandwich & SLL & 121 & 95 & 25 & 1 & 0.7893 & 0.0391 & 769 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6839 \\
      LDLT-L & LDLT-R & 121 & 28 & 93 & 0 & 0.2314 & $-0.0559$ & 854 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6669 \\
      LDLT-L & Orthogonal & 121 & 39 & 82 & 0 & 0.3223 & $-0.0289$ & 1595 & $6.0\mathrm{e}{-}08^{***}$ & $3.6\mathrm{e}{-}07^{***}$ & $1.9\mathrm{e}{-}06^{***}$ & 0.4926 \\
      LDLT-L & SLL & 121 & 37 & 82 & 2 & 0.3140 & $-0.0231$ & 1675 & $5.1\mathrm{e}{-}07^{***}$ & $2.5\mathrm{e}{-}06^{***}$ & $1.4\mathrm{e}{-}05^{***}$ & 0.4605 \\
      LDLT-R & SLL & 121 & 83 & 38 & 0 & 0.6860 & 0.0187 & 2059 & $2.5\mathrm{e}{-}05^{***}$ & $9.8\mathrm{e}{-}05^{***}$ & $5.2\mathrm{e}{-}04^{***}$ & 0.3835 \\
      LDLT-R & Sandwich & 121 & 43 & 78 & 0 & 0.3554 & $-0.0213$ & 2138 & $6.0\mathrm{e}{-}05^{***}$ & $1.8\mathrm{e}{-}04^{***}$ & $1.0\mathrm{e}{-}03^{**}$ & 0.3649 \\
      LDLT-R & Orthogonal & 121 & 77 & 44 & 0 & 0.6364 & 0.0182 & 2506 & $2.2\mathrm{e}{-}03^{**}$ & $4.4\mathrm{e}{-}03^{**}$ & $2.0\mathrm{e}{-}02^{*}$ & 0.2784 \\
      Orthogonal & SLL & 121 & 65 & 56 & 0 & 0.5372 & 0.0038 & 3069 & $1.1\mathrm{e}{-}01$ & $1.1\mathrm{e}{-}01$ & $8.7\mathrm{e}{-}01$ & 0.1460 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}
\begin{table*}[t]
  % Pairwise Wilcoxon signed-rank results for Mean Certified Accuracy (255/255),
  % one row per algorithm pair (15 pairs), ordered by increasing W.
  % Typesetting conventions used in the body:
  %   - p-values keep E-notation but use an upright "e" and a braced sign
  %     (\mathrm{e}{-}20) so TeX does not set the sign as a binary operator;
  %   - negative median differences are in math mode to get a true minus sign.
  % NOTE(review): some p-value cells print as exactly 0 even though a
  % Holm-adjusted p-value cannot be smaller than its raw p-value (LDLT-L vs.
  % Sandwich: raw 1.1e-16, adjusted 0; Sandwich vs. SLL: raw 0, adjusted
  % 4.0e-10). These look like values lost to the exporter's display
  % precision -- regenerate or report as an upper bound.
  \centering
  \begin{threeparttable}
    \caption[Mean Certified Accuracy (255/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (255/255); $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_cert_acc_255}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & LDLT-R & 121 & 1 & 111 & 9 & 0.0455 & $-0.0570$ & 10 & $5.4\mathrm{e}{-}20^{***}$ & $8.2\mathrm{e}{-}19^{***}$ & $3.6\mathrm{e}{-}18^{***}$ & 0.8651 \\
      AOL & SLL & 121 & 3 & 104 & 14 & 0.0826 & $-0.0476$ & 23 & $5.3\mathrm{e}{-}19^{***}$ & $6.9\mathrm{e}{-}18^{***}$ & $3.2\mathrm{e}{-}17^{***}$ & 0.8610 \\
      AOL & Sandwich & 121 & 2 & 112 & 7 & 0.0455 & $-0.0803$ & 62 & $9.9\mathrm{e}{-}20^{***}$ & $1.4\mathrm{e}{-}18^{***}$ & $6.3\mathrm{e}{-}18^{***}$ & 0.8514 \\
      AOL & Orthogonal & 121 & 5 & 105 & 11 & 0.0868 & $-0.0363$ & 122 & $2.4\mathrm{e}{-}18^{***}$ & $2.8\mathrm{e}{-}17^{***}$ & $1.4\mathrm{e}{-}16^{***}$ & 0.8331 \\
      AOL & LDLT-L & 121 & 8 & 85 & 28 & 0.1818 & $-0.0160$ & 182 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7958 \\
      Orthogonal & Sandwich & 121 & 11 & 103 & 7 & 0.1198 & $-0.0313$ & 258 & $1.4\mathrm{e}{-}17^{***}$ & $1.5\mathrm{e}{-}16^{***}$ & $8.1\mathrm{e}{-}16^{***}$ & 0.7995 \\
      LDLT-L & Sandwich & 121 & 12 & 102 & 7 & 0.1281 & $-0.0397$ & 342 & $1.1\mathrm{e}{-}16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7772 \\
      LDLT-L & LDLT-R & 121 & 23 & 89 & 9 & 0.2273 & $-0.0242$ & 927 & $1.0\mathrm{e}{-}10^{***}$ & $6.0\mathrm{e}{-}10^{***}$ & $3.0\mathrm{e}{-}09^{***}$ & 0.6135 \\
      Sandwich & SLL & 121 & 90 & 25 & 6 & 0.7686 & 0.0240 & 977 & $0^{***}$ & $4.0\mathrm{e}{-}10^{***}$ & $1.7\mathrm{e}{-}09^{***}$ & 0.6135 \\
      LDLT-L & SLL & 121 & 27 & 79 & 15 & 0.2851 & $-0.0091$ & 1323 & $1.9\mathrm{e}{-}06^{***}$ & $9.4\mathrm{e}{-}06^{***}$ & $4.5\mathrm{e}{-}05^{***}$ & 0.4629 \\
      LDLT-R & SLL & 121 & 80 & 35 & 6 & 0.6860 & 0.0175 & 1603 & $1.4\mathrm{e}{-}06^{***}$ & $8.1\mathrm{e}{-}06^{***}$ & $3.4\mathrm{e}{-}05^{***}$ & 0.4506 \\
      LDLT-L & Orthogonal & 121 & 36 & 75 & 10 & 0.3388 & $-0.0085$ & 1741 & $5.8\mathrm{e}{-}05^{***}$ & $2.3\mathrm{e}{-}04^{***}$ & $1.0\mathrm{e}{-}03^{**}$ & 0.3816 \\
      LDLT-R & Orthogonal & 121 & 77 & 40 & 4 & 0.6529 & 0.0132 & 1982 & $6.5\mathrm{e}{-}05^{***}$ & $2.3\mathrm{e}{-}04^{***}$ & $1.0\mathrm{e}{-}03^{**}$ & 0.3694 \\
      LDLT-R & Sandwich & 121 & 45 & 73 & 3 & 0.3843 & $-0.0078$ & 2234 & $6.1\mathrm{e}{-}04^{***}$ & $1.2\mathrm{e}{-}03^{**}$ & $7.2\mathrm{e}{-}03^{**}$ & 0.3154 \\
      Orthogonal & SLL & 121 & 55 & 58 & 8 & 0.4876 & 0.0000 & 3068 & $6.6\mathrm{e}{-}01$ & $6.6\mathrm{e}{-}01$ & $1.0\mathrm{e}{+}00$ & 0.0410 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}