% JMLR-ready tables for two-column papers
%
% Required packages (no siunitx):
%   \usepackage{booktabs}
%   \usepackage{threeparttable}
%   \usepackage{threeparttablex} % for TableNotes + longtable
%   \usepackage{longtable}
%   \usepackage{amsmath}         % \text in the p_{Holm,...} column headers
%   \usepackage{amssymb}         % \blacktriangle / \blacktriangledown
%   \usepackage{xcolor}          % \textcolor in the pairwise-outcome tables
% Optional for landscape: \usepackage{pdflscape}
%
% Layout of this file:
%   1. tab:model-ranges           model size ranges per algorithm
%   2. tab:metric_summary         mean +/- std of accuracy and certified accuracy
%   3. tab:overall:*              average-rank summaries, one table per metric
%   4. tab:signif:*               pairwise win/loss matrices, one per metric
%   5. tab:wilcoxon:*             full pairwise Wilcoxon statistics, one per metric
%
% Floats are separated by comment lines (not blank lines) so that \input-ing
% this file never inserts a paragraph break.
%
% ---------------------------------------------------------------------------
% 1. Model dimension ranges
% ---------------------------------------------------------------------------
\begin{table*}[t]
  \centering
  \begin{threeparttable}
    \caption{Model dimension ranges (min--max across all datasets and folds). Input/Output dimensions follow dataset label spaces.}
    \label{tab:model-ranges}
    \begin{tabular}{l r r r r r r}
      \toprule
      Algorithm & Width & Depth & Parameters & Padding & Input dim & Output dim \\
      \midrule
      AOL & 32--512 & 6--6 & 502--1245037 & 10--524 & 3--262 & 2--100 \\
      Orthogonal & 32--512 & 6--6 & 507--1245042 & 10--524 & 3--262 & 2--100 \\
      Sandwich & 32--512 & 6--6 & 1057--2620542 & 10--524 & 3--262 & 2--100 \\
      SLL & 32--512 & 6--6 & 2326--1622697 & 10--524 & 3--262 & 2--100 \\
      LDLT-L & 32--512 & 6--6 & 5480--1454611 & 10--524 & 3--262 & 2--100 \\
      LDLT-R & 32--512 & 6--6 & 5577--1588756 & 10--524 & 3--262 & 2--100 \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table*}
%
% ---------------------------------------------------------------------------
% 2. Metric summary (mean +/- std); bold marks the largest mean per column
% ---------------------------------------------------------------------------
\begin{table*}[t]
  \centering
  \begin{threeparttable}
    \caption{Sorted mean$\pm$std across $N$ datasets for each algorithm.}
    \label{tab:metric_summary}
    \begin{tabular}{l r lllll}
      \toprule
      & & & \multicolumn{4}{c}{Certified Accuracy} \\
      \cmidrule(lr){4-7}
      Algorithm & $N$ & Accuracy & 36/255 & 72/255 & 108/255 & 255/255 \\
      \midrule
      AOL & 121 & 0.6049\,\tiny$\pm$0.2396 & 0.2876\,\tiny$\pm$0.3111 & 0.2157\,\tiny$\pm$0.2940 & 0.1739\,\tiny$\pm$0.2716 & 0.0837\,\tiny$\pm$0.1775 \\
      Orthogonal & 121 & 0.7036\,\tiny$\pm$0.1911 & 0.6021\,\tiny$\pm$0.2403 & 0.5088\,\tiny$\pm$0.2638 & 0.4229\,\tiny$\pm$0.2741 & 0.1972\,\tiny$\pm$0.2336 \\
      Sandwich & 121 & 0.7163\,\tiny$\pm$0.1879 & \textbf{0.6239\,\tiny$\pm$0.2409} & \textbf{0.5483\,\tiny$\pm$0.2616} & \textbf{0.4738\,\tiny$\pm$0.2712} & \textbf{0.2464\,\tiny$\pm$0.2506} \\
      SLL & 121 & 0.7011\,\tiny$\pm$0.1939 & 0.5816\,\tiny$\pm$0.2487 & 0.4813\,\tiny$\pm$0.2720 & 0.3961\,\tiny$\pm$0.2799 & 0.1888\,\tiny$\pm$0.2320 \\
      \midrule
      LDLT-L & 121 & \textbf{0.7245\,\tiny$\pm$0.1908} & 0.4646\,\tiny$\pm$0.3318 & 0.3865\,\tiny$\pm$0.3245 & 0.3247\,\tiny$\pm$0.3088 & 0.1584\,\tiny$\pm$0.2272 \\
      LDLT-R & 121 & 0.6970\,\tiny$\pm$0.2021 & 0.6036\,\tiny$\pm$0.2378 & 0.5202\,\tiny$\pm$0.2572 & 0.4478\,\tiny$\pm$0.2640 & 0.2175\,\tiny$\pm$0.2278 \\
      \bottomrule
    \end{tabular}
  \end{threeparttable}
\end{table*}
%
% ---------------------------------------------------------------------------
% 3. Overall rank comparisons (single-column floats, one per metric)
%    Captions typeset the p-value as 1.11\times 10^{-16} instead of the raw
%    "1.11e-16", which math mode would render as a product with the variable e.
% ---------------------------------------------------------------------------
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {\small
    \caption{Overall comparison on Mean Accuracy: average rank (lower is better) with Iman--Davenport $F=34.41$ (df${}=5,\,600$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_test_acc}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      LDLT-L & 2.525 & 4 & 0 & 4 & 0.800 & 0.533 \\
      Sandwich & 2.773 & 4 & 0 & 4 & 0.800 & 0.421 \\
      Orthogonal & 3.479 & 1 & 2 & -1 & 0.200 & 0.654 \\
      SLL & 3.545 & 1 & 2 & -1 & 0.200 & 0.621 \\
      LDLT-R & 3.628 & 1 & 2 & -1 & 0.200 & 0.560 \\
      AOL & 5.050 & 0 & 5 & -5 & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {\small
    \caption{Overall comparison on Mean Certified Accuracy (36/255): average rank (lower is better) with Iman--Davenport $F=87.35$ (df${}=5,\,600$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_cert_acc_36}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      Sandwich & 2.211 & 5 & 0 & 5 & 1.000 & 0.539 \\
      LDLT-R & 2.603 & 3 & 1 & 2 & 0.600 & 0.599 \\
      Orthogonal & 3.202 & 2 & 1 & 1 & 0.400 & 0.693 \\
      SLL & 3.289 & 2 & 2 & 0 & 0.400 & 0.704 \\
      LDLT-L & 4.091 & 1 & 4 & -3 & 0.200 & 0.648 \\
      AOL & 5.603 & 0 & 5 & -5 & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {\small
    \caption{Overall comparison on Mean Certified Accuracy (72/255): average rank (lower is better) with Iman--Davenport $F=125.56$ (df${}=5,\,600$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_cert_acc_72}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      Sandwich & 1.988 & 5 & 0 & 5 & 1.000 & 0.605 \\
      LDLT-R & 2.504 & 4 & 1 & 3 & 0.800 & 0.538 \\
      Orthogonal & 3.202 & 3 & 2 & 1 & 0.600 & 0.547 \\
      SLL & 3.355 & 2 & 3 & -1 & 0.400 & 0.724 \\
      LDLT-L & 4.198 & 1 & 4 & -3 & 0.200 & 0.769 \\
      AOL & 5.752 & 0 & 5 & -5 & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {\small
    \caption{Overall comparison on Mean Certified Accuracy (108/255): average rank (lower is better) with Iman--Davenport $F=134.70$ (df${}=5,\,600$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_cert_acc_108}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      Sandwich & 1.988 & 4 & 0 & 4 & 0.800 & 0.721 \\
      LDLT-R & 2.364 & 4 & 0 & 4 & 0.800 & 0.594 \\
      Orthogonal & 3.260 & 2 & 2 & 0 & 0.400 & 0.717 \\
      SLL & 3.388 & 2 & 2 & 0 & 0.400 & 0.696 \\
      LDLT-L & 4.256 & 1 & 4 & -3 & 0.200 & 0.826 \\
      AOL & 5.744 & 0 & 5 & -5 & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {\small
    \caption{Overall comparison on Mean Certified Accuracy (255/255): average rank (lower is better) with Iman--Davenport $F=105.28$ (df${}=5,\,600$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
    \label{tab:overall:mean_cert_acc_255}
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{@{}l r r r r r r@{}}
      \toprule
      Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
      \midrule
      Sandwich & 2.000 & 5 & 0 & 5 & 1.000 & 0.643 \\
      LDLT-R & 2.467 & 4 & 1 & 3 & 0.800 & 0.620 \\
      SLL & 3.293 & 2 & 2 & 0 & 0.400 & 0.664 \\
      Orthogonal & 3.442 & 2 & 2 & 0 & 0.400 & 0.652 \\
      LDLT-L & 4.227 & 1 & 4 & -3 & 0.200 & 0.846 \\
      AOL & 5.570 & 0 & 5 & -5 & 0.000 & 0.000 \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
% ---------------------------------------------------------------------------
% 4. Pairwise significance matrices (row vs. column), one per metric
%    Green up-triangle = row wins, red down-triangle = row loses, dot = none.
% ---------------------------------------------------------------------------
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {
    \caption{Pairwise Wilcoxon outcomes for Mean Accuracy (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_test_acc}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}l c c c c c c @{}}
      \toprule
      & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
      LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
      LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      Sandwich & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
      SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {
    \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (36/255) (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_cert_acc_36}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}l c c c c c c @{}}
      \toprule
      & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
      LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
      LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
      Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
      SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {
    \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (72/255) (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_cert_acc_72}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}l c c c c c c @{}}
      \toprule
      & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
      LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
      LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
      Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
      Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
      SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {
    \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (108/255) (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_cert_acc_108}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}l c c c c c c @{}}
      \toprule
      & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
      LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
      LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
      Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
      SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
\begin{table}[t]
  \centering
  \begin{threeparttable}
    {
    \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (255/255) (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
    \label{tab:signif:mean_cert_acc_255}
    \setlength{\tabcolsep}{3pt}
    \begin{tabular}{@{}l c c c c c c @{}}
      \toprule
      & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
      \midrule
      AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
      LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
      LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
      Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
      SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
      \bottomrule
    \end{tabular}
    }
  \end{threeparttable}
\end{table}
%
% ---------------------------------------------------------------------------
% 5. Full pairwise Wilcoxon statistics (two-column floats, one per metric)
%    Cell values are reproduced exactly as generated, including the e-notation
%    inside math mode.
%    NOTE(review): several adjusted p-values are printed as 0 although the raw
%    p in the same row is non-zero (e.g. first row of tab:wilcoxon:mean_test_acc:
%    p = 2.1e-17 but p_Holm,global = 0). A Holm adjustment cannot make a p-value
%    smaller, so these zeros look like a formatting/rounding artifact of the
%    generator -- confirm and regenerate rather than hand-editing.
% ---------------------------------------------------------------------------
\begin{table*}[t]
  \centering
  \begin{threeparttable}
    \caption[Mean Accuracy]{Wilcoxon signed-rank tests (two-sided) for Mean Accuracy; $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_test_acc}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & LDLT-L & 121 & 16 & 105 & 0 & 0.1322 & -0.0632 & 409 & $2.1e-17^{***}$ & $3.2e-16^{***}$ & $0^{***}$ & 0.7715 \\
      AOL & Sandwich & 121 & 23 & 98 & 0 & 0.1901 & -0.0656 & 698 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7036 \\
      AOL & Orthogonal & 121 & 25 & 96 & 0 & 0.2066 & -0.0525 & 908 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6542 \\
      AOL & SLL & 121 & 24 & 97 & 0 & 0.1983 & -0.0445 & 1047 & $0^{***}$ & $1.0e-10^{***}$ & $3.0e-10^{***}$ & 0.6215 \\
      AOL & LDLT-R & 121 & 27 & 94 & 0 & 0.2231 & -0.0357 & 1307 & $7.0e-10^{***}$ & $7.8e-09^{***}$ & $2.3e-08^{***}$ & 0.5604 \\
      LDLT-L & SLL & 121 & 86 & 35 & 0 & 0.7107 & 0.0103 & 1511 & $1.7e-08^{***}$ & $1.7e-07^{***}$ & $5.0e-07^{***}$ & 0.5124 \\
      LDLT-L & LDLT-R & 121 & 87 & 34 & 0 & 0.7190 & 0.0125 & 1779 & $7.7e-07^{***}$ & $6.9e-06^{***}$ & $2.0e-05^{***}$ & 0.4494 \\
      LDLT-L & Orthogonal & 121 & 78 & 43 & 0 & 0.6446 & 0.0104 & 2002 & $1.3e-05^{***}$ & $1.0e-04^{***}$ & $2.5e-04^{***}$ & 0.3969 \\
      Orthogonal & Sandwich & 121 & 39 & 81 & 1 & 0.3264 & -0.0079 & 2171 & $1.3e-04^{***}$ & $9.4e-04^{***}$ & $2.5e-03^{**}$ & 0.3487 \\
      Sandwich & SLL & 121 & 80 & 41 & 0 & 0.6612 & 0.0063 & 2279 & $2.6e-04^{***}$ & $1.6e-03^{**}$ & $4.6e-03^{**}$ & 0.3318 \\
      LDLT-R & Sandwich & 121 & 47 & 74 & 0 & 0.3884 & -0.0101 & 2411 & $9.4e-04^{***}$ & $4.7e-03^{**}$ & $1.4e-02^{*}$ & 0.3008 \\
      LDLT-L & Sandwich & 121 & 64 & 56 & 1 & 0.5331 & 0.0008 & 3145 & $2.0e-01$ & $8.2e-01$ & $1.0e+00$ & 0.1158 \\
      LDLT-R & Orthogonal & 121 & 54 & 67 & 0 & 0.4463 & -0.0024 & 3206 & $2.1e-01$ & $8.2e-01$ & $1.0e+00$ & 0.1138 \\
      Orthogonal & SLL & 121 & 60 & 61 & 0 & 0.4959 & -0.0000 & 3382 & $4.3e-01$ & $8.5e-01$ & $1.0e+00$ & 0.0724 \\
      LDLT-R & SLL & 121 & 58 & 63 & 0 & 0.4793 & -0.0010 & 3627 & $8.7e-01$ & $8.7e-01$ & $1.0e+00$ & 0.0148 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}
%
\begin{table*}[t]
  \centering
  \begin{threeparttable}
    \caption[Mean Certified Accuracy (36/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (36/255); $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_cert_acc_36}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & LDLT-R & 121 & 3 & 118 & 0 & 0.0248 & -0.2903 & 53 & $5.1e-21^{***}$ & $7.6e-20^{***}$ & $3.6e-19^{***}$ & 0.8552 \\
      AOL & SLL & 121 & 4 & 117 & 0 & 0.0331 & -0.2718 & 115 & $2.3e-20^{***}$ & $3.2e-19^{***}$ & $1.5e-18^{***}$ & 0.8406 \\
      AOL & Sandwich & 121 & 9 & 112 & 0 & 0.0744 & -0.3414 & 135 & $3.7e-20^{***}$ & $4.9e-19^{***}$ & $2.4e-18^{***}$ & 0.8359 \\
      AOL & Orthogonal & 121 & 8 & 113 & 0 & 0.0661 & -0.2982 & 140 & $4.2e-20^{***}$ & $5.1e-19^{***}$ & $2.7e-18^{***}$ & 0.8348 \\
      LDLT-L & Sandwich & 121 & 22 & 99 & 0 & 0.1818 & -0.0761 & 770 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6866 \\
      AOL & LDLT-L & 121 & 22 & 95 & 4 & 0.1983 & -0.1112 & 872 & $0^{***}$ & $0^{***}$ & $1.0e-10^{***}$ & 0.6485 \\
      LDLT-L & LDLT-R & 121 & 34 & 87 & 0 & 0.2810 & -0.0613 & 1073 & $0^{***}$ & $1.0e-10^{***}$ & $5.0e-10^{***}$ & 0.6154 \\
      LDLT-L & SLL & 121 & 38 & 83 & 0 & 0.3140 & -0.0545 & 1275 & $4.0e-10^{***}$ & $3.4e-09^{***}$ & $1.4e-08^{***}$ & 0.5679 \\
      LDLT-L & Orthogonal & 121 & 40 & 81 & 0 & 0.3306 & -0.0581 & 1346 & $1.3e-09^{***}$ & $9.4e-09^{***}$ & $4.3e-08^{***}$ & 0.5512 \\
      Sandwich & SLL & 121 & 89 & 32 & 0 & 0.7355 & 0.0236 & 1459 & $7.9e-09^{***}$ & $4.7e-08^{***}$ & $2.4e-07^{***}$ & 0.5246 \\
      Orthogonal & Sandwich & 121 & 33 & 87 & 1 & 0.2769 & -0.0164 & 1846 & $3.0e-06^{***}$ & $1.5e-05^{***}$ & $6.4e-05^{***}$ & 0.4264 \\
      LDLT-R & SLL & 121 & 81 & 40 & 0 & 0.6694 & 0.0100 & 2305 & $3.4e-04^{***}$ & $1.4e-03^{**}$ & $5.4e-03^{**}$ & 0.3257 \\
      LDLT-R & Sandwich & 121 & 50 & 71 & 0 & 0.4132 & -0.0094 & 2753 & $1.5e-02^{*}$ & $4.6e-02^{*}$ & $1.8e-01$ & 0.2203 \\
      Orthogonal & SLL & 121 & 65 & 56 & 0 & 0.5372 & 0.0014 & 2942 & $5.3e-02$ & $1.1e-01$ & $3.9e-01$ & 0.1759 \\
      LDLT-R & Orthogonal & 121 & 75 & 46 & 0 & 0.6198 & 0.0065 & 3172 & $1.8e-01$ & $1.8e-01$ & $1.0e+00$ & 0.1218 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}
%
\begin{table*}[t]
  \centering
  \begin{threeparttable}
    \caption[Mean Certified Accuracy (72/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (72/255); $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_cert_acc_72}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & SLL & 121 & 0 & 121 & 0 & 0.0000 & -0.2418 & 0 & $1.4e-21^{***}$ & $2.1e-20^{***}$ & $1.0e-19^{***}$ & 0.8677 \\
      AOL & LDLT-R & 121 & 1 & 120 & 0 & 0.0083 & -0.2825 & 25 & $2.5e-21^{***}$ & $3.6e-20^{***}$ & $1.9e-19^{***}$ & 0.8618 \\
      AOL & Orthogonal & 121 & 4 & 117 & 0 & 0.0331 & -0.2682 & 45 & $4.2e-21^{***}$ & $5.4e-20^{***}$ & $3.0e-19^{***}$ & 0.8571 \\
      AOL & Sandwich & 121 & 6 & 115 & 0 & 0.0496 & -0.3329 & 80 & $9.9e-21^{***}$ & $1.2e-19^{***}$ & $6.8e-19^{***}$ & 0.8489 \\
      AOL & LDLT-L & 121 & 10 & 93 & 18 & 0.1570 & -0.0849 & 304 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7694 \\
      LDLT-L & Sandwich & 121 & 16 & 105 & 0 & 0.1322 & -0.0864 & 509 & $1.9e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7480 \\
      LDLT-L & LDLT-R & 121 & 30 & 91 & 0 & 0.2479 & -0.0765 & 873 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6624 \\
      Orthogonal & Sandwich & 121 & 22 & 98 & 1 & 0.1860 & -0.0318 & 1154 & $1.0e-10^{***}$ & $6.0e-10^{***}$ & $3.5e-09^{***}$ & 0.5918 \\
      Sandwich & SLL & 121 & 95 & 26 & 0 & 0.7851 & 0.0391 & 1169 & $1.0e-10^{***}$ & $6.0e-10^{***}$ & $2.8e-09^{***}$ & 0.5928 \\
      LDLT-L & SLL & 121 & 34 & 87 & 0 & 0.2810 & -0.0437 & 1219 & $2.0e-10^{***}$ & $1.0e-09^{***}$ & $6.2e-09^{***}$ & 0.5810 \\
      LDLT-L & Orthogonal & 121 & 36 & 85 & 0 & 0.2975 & -0.0452 & 1256 & $3.0e-10^{***}$ & $1.5e-09^{***}$ & $1.1e-08^{***}$ & 0.5723 \\
      LDLT-R & SLL & 121 & 89 & 32 & 0 & 0.7355 & 0.0202 & 1852 & $2.0e-06^{***}$ & $8.0e-06^{***}$ & $5.0e-05^{***}$ & 0.4322 \\
      LDLT-R & Sandwich & 121 & 49 & 72 & 0 & 0.4050 & -0.0133 & 2656 & $7.5e-03^{**}$ & $2.2e-02^{*}$ & $9.7e-02$ & 0.2431 \\
      Orthogonal & SLL & 121 & 67 & 54 & 0 & 0.5537 & 0.0046 & 2784 & $1.9e-02^{*}$ & $3.8e-02^{*}$ & $2.1e-01$ & 0.2130 \\
      LDLT-R & Orthogonal & 121 & 74 & 47 & 0 & 0.6116 & 0.0089 & 2855 & $3.1e-02^{*}$ & $3.8e-02^{*}$ & $3.1e-01$ & 0.1963 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}
%
\begin{table*}[t]
  \centering
  \begin{threeparttable}
    \caption[Mean Certified Accuracy (108/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (108/255); $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_cert_acc_108}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & SLL & 121 & 1 & 116 & 4 & 0.0248 & -0.1721 & 34 & $1.5e-20^{***}$ & $1.8e-19^{***}$ & $1.0e-18^{***}$ & 0.8592 \\
      AOL & LDLT-R & 121 & 1 & 120 & 0 & 0.0083 & -0.2318 & 45 & $4.2e-21^{***}$ & $6.3e-20^{***}$ & $3.0e-19^{***}$ & 0.8571 \\
      AOL & Orthogonal & 121 & 3 & 117 & 1 & 0.0289 & -0.2099 & 60 & $8.9e-21^{***}$ & $1.2e-19^{***}$ & $6.2e-19^{***}$ & 0.8534 \\
      AOL & Sandwich & 121 & 5 & 116 & 0 & 0.0413 & -0.2735 & 82 & $1.0e-20^{***}$ & $1.3e-19^{***}$ & $7.0e-19^{***}$ & 0.8484 \\
      AOL & LDLT-L & 121 & 6 & 90 & 25 & 0.1529 & -0.0672 & 113 & $5.8e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.8259 \\
      LDLT-L & Sandwich & 121 & 14 & 107 & 0 & 0.1157 & -0.0819 & 450 & $5.3e-17^{***}$ & $5.8e-16^{***}$ & $0^{***}$ & 0.7619 \\
      LDLT-L & LDLT-R & 121 & 25 & 96 & 0 & 0.2066 & -0.0715 & 733 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6953 \\
      Orthogonal & Sandwich & 121 & 18 & 102 & 1 & 0.1529 & -0.0376 & 945 & $0^{***}$ & $0^{***}$ & $1.0e-10^{***}$ & 0.6418 \\
      Sandwich & SLL & 121 & 93 & 28 & 0 & 0.7686 & 0.0435 & 995 & $0^{***}$ & $0^{***}$ & $1.0e-10^{***}$ & 0.6337 \\
      LDLT-L & Orthogonal & 121 & 32 & 88 & 1 & 0.2686 & -0.0352 & 1203 & $2.0e-10^{***}$ & $1.3e-09^{***}$ & $7.7e-09^{***}$ & 0.5801 \\
      LDLT-L & SLL & 121 & 35 & 82 & 4 & 0.3058 & -0.0294 & 1335 & $8.7e-09^{***}$ & $4.3e-08^{***}$ & $2.6e-07^{***}$ & 0.5321 \\
      LDLT-R & SLL & 121 & 89 & 32 & 0 & 0.7355 & 0.0233 & 1603 & $6.7e-08^{***}$ & $2.7e-07^{***}$ & $1.9e-06^{***}$ & 0.4907 \\
      LDLT-R & Orthogonal & 121 & 81 & 40 & 0 & 0.6694 & 0.0182 & 2277 & $2.6e-04^{***}$ & $7.7e-04^{***}$ & $4.6e-03^{**}$ & 0.3323 \\
      LDLT-R & Sandwich & 121 & 54 & 67 & 0 & 0.4463 & -0.0097 & 2867 & $3.3e-02^{*}$ & $6.7e-02$ & $3.1e-01$ & 0.1935 \\
      Orthogonal & SLL & 121 & 67 & 54 & 0 & 0.5537 & 0.0061 & 2930 & $4.9e-02^{*}$ & $6.7e-02$ & $3.9e-01$ & 0.1787 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}
%
\begin{table*}[t]
  \centering
  \begin{threeparttable}
    \caption[Mean Certified Accuracy (255/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (255/255); $p$-values with Holm FWER corrections within-metric and global.}
    \label{tab:wilcoxon:mean_cert_acc_255}
    \begingroup
    \setlength{\tabcolsep}{4pt}
    \begin{tabular}{ll r r r r r r r r r r r}
      \toprule
      \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\
      \cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
      Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
      \midrule
      AOL & LDLT-R & 121 & 0 & 110 & 11 & 0.0455 & -0.0717 & 0 & $8.9e-20^{***}$ & $1.3e-18^{***}$ & $5.6e-18^{***}$ & 0.8678 \\
      AOL & SLL & 121 & 2 & 101 & 18 & 0.0909 & -0.0429 & 22 & $2.4e-18^{***}$ & $3.1e-17^{***}$ & $1.5e-16^{***}$ & 0.8608 \\
      AOL & LDLT-L & 121 & 3 & 84 & 34 & 0.1653 & -0.0172 & 48 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.8465 \\
      AOL & Orthogonal & 121 & 2 & 103 & 16 & 0.0826 & -0.0488 & 71 & $4.5e-18^{***}$ & $5.3e-17^{***}$ & $2.7e-16^{***}$ & 0.8458 \\
      AOL & Sandwich & 121 & 2 & 112 & 7 & 0.0455 & -0.0886 & 74 & $1.4e-19^{***}$ & $1.9e-18^{***}$ & $8.4e-18^{***}$ & 0.8482 \\
      LDLT-L & Sandwich & 121 & 10 & 104 & 7 & 0.1116 & -0.0351 & 415 & $5.9e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7579 \\
      Orthogonal & Sandwich & 121 & 17 & 97 & 7 & 0.1694 & -0.0273 & 465 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7446 \\
      LDLT-L & LDLT-R & 121 & 20 & 90 & 11 & 0.2107 & -0.0296 & 685 & $0^{***}$ & $0^{***}$ & $1.0e-10^{***}$ & 0.6731 \\
      Sandwich & SLL & 121 & 84 & 30 & 7 & 0.7231 & 0.0164 & 1043 & $3.0e-10^{***}$ & $1.9e-09^{***}$ & $9.6e-09^{***}$ & 0.5916 \\
      LDLT-L & SLL & 121 & 27 & 76 & 18 & 0.2975 & -0.0086 & 1234 & $2.0e-06^{***}$ & $1.0e-05^{***}$ & $5.0e-05^{***}$ & 0.4679 \\
      LDLT-L & Orthogonal & 121 & 30 & 74 & 17 & 0.3182 & -0.0039 & 1287 & $2.9e-06^{***}$ & $1.0e-05^{***}$ & $6.4e-05^{***}$ & 0.4587 \\
      LDLT-R & SLL & 121 & 80 & 31 & 10 & 0.7025 & 0.0147 & 1338 & $1.9e-07^{***}$ & $1.2e-06^{***}$ & $5.2e-06^{***}$ & 0.4942 \\
      LDLT-R & Orthogonal & 121 & 79 & 33 & 9 & 0.6901 & 0.0149 & 1541 & $2.5e-06^{***}$ & $1.0e-05^{***}$ & $5.7e-05^{***}$ & 0.4451 \\
      LDLT-R & Sandwich & 121 & 45 & 70 & 6 & 0.3967 & -0.0068 & 2292 & $3.6e-03^{**}$ & $7.2e-03^{**}$ & $5.1e-02$ & 0.2713 \\
      Orthogonal & SLL & 121 & 51 & 56 & 14 & 0.4793 & 0.0000 & 2810 & $8.1e-01$ & $8.1e-01$ & $1.0e+00$ & 0.0236 \\
      \bottomrule
    \end{tabular}
    \begin{tablenotes}
      \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
    \end{tablenotes}
    \endgroup
  \end{threeparttable}
\end{table*}