SuperComputer committed on
Commit
a1efe59
·
verified ·
1 Parent(s): 4fc6159

Add files using upload-large-folder tool

Browse files
Files changed (50) hide show
  1. UCI_N4/aol/summary.json +0 -0
  2. UCI_N4/jmlr_tables.tex +469 -0
  3. UCI_N4/ldlt-resnet/summary.json +0 -0
  4. UCI_N4/ldlt/summary.json +0 -0
  5. UCI_N4/ortho/summary.json +0 -0
  6. UCI_N4/sandwich/summary.json +0 -0
  7. UCI_N4/sdp/runs/abalone/fold_0/result.json +46 -0
  8. UCI_N4/sdp/runs/abalone/fold_1/result.json +46 -0
  9. UCI_N4/sdp/runs/abalone/fold_2/result.json +46 -0
  10. UCI_N4/sdp/runs/abalone/fold_3/result.json +46 -0
  11. UCI_N4/sdp/runs/acute-inflammation/fold_0/result.json +42 -0
  12. UCI_N4/sdp/runs/acute-inflammation/fold_1/result.json +42 -0
  13. UCI_N4/sdp/runs/acute-inflammation/fold_2/result.json +42 -0
  14. UCI_N4/sdp/runs/acute-inflammation/fold_3/result.json +42 -0
  15. UCI_N4/sdp/runs/acute-nephritis/fold_0/result.json +42 -0
  16. UCI_N4/sdp/runs/acute-nephritis/fold_1/result.json +42 -0
  17. UCI_N4/sdp/runs/acute-nephritis/fold_2/result.json +42 -0
  18. UCI_N4/sdp/runs/acute-nephritis/fold_3/result.json +42 -0
  19. UCI_N4/sdp/runs/adult/fold_0/result.json +58 -0
  20. UCI_N4/sdp/runs/adult/fold_1/result.json +58 -0
  21. UCI_N4/sdp/runs/adult/fold_2/result.json +58 -0
  22. UCI_N4/sdp/runs/adult/fold_3/result.json +58 -0
  23. UCI_N4/sdp/runs/annealing/fold_0/result.json +92 -0
  24. UCI_N4/sdp/runs/annealing/fold_1/result.json +92 -0
  25. UCI_N4/sdp/runs/annealing/fold_2/result.json +92 -0
  26. UCI_N4/sdp/runs/annealing/fold_3/result.json +92 -0
  27. UCI_N4/sdp/runs/arrhythmia/fold_0/result.json +554 -0
  28. UCI_N4/sdp/runs/arrhythmia/fold_1/result.json +554 -0
  29. UCI_N4/sdp/runs/arrhythmia/fold_2/result.json +554 -0
  30. UCI_N4/sdp/runs/arrhythmia/fold_3/result.json +554 -0
  31. UCI_N4/sdp/runs/audiology-std/fold_0/result.json +148 -0
  32. UCI_N4/sdp/runs/audiology-std/fold_1/result.json +148 -0
  33. UCI_N4/sdp/runs/audiology-std/fold_2/result.json +148 -0
  34. UCI_N4/sdp/runs/audiology-std/fold_3/result.json +148 -0
  35. UCI_N4/sdp/runs/balance-scale/fold_0/result.json +38 -0
  36. UCI_N4/sdp/runs/balance-scale/fold_1/result.json +38 -0
  37. UCI_N4/sdp/runs/balance-scale/fold_2/result.json +38 -0
  38. UCI_N4/sdp/runs/balance-scale/fold_3/result.json +38 -0
  39. UCI_N4/sdp/runs/balloons/fold_0/result.json +38 -0
  40. UCI_N4/sdp/runs/balloons/fold_1/result.json +38 -0
  41. UCI_N4/sdp/runs/bank/fold_1/result.json +62 -0
  42. UCI_N4/sdp/runs/bank/fold_3/result.json +62 -0
  43. UCI_N4/sdp/summary.json +0 -0
  44. UCI_N4/wilcoxon_pairwise_all.csv +76 -0
  45. UCI_N4/wilcoxon_pairwise_all.json +1427 -0
  46. UCI_N4/wilcoxon_prep_all.json +0 -0
  47. UCI_N6/jmlr_tables.tex +469 -0
  48. UCI_N6/wilcoxon_pairwise_all.csv +76 -0
  49. UCI_N6/wilcoxon_pairwise_all.json +1427 -0
  50. UCI_N6/wilcoxon_prep_all.json +0 -0
UCI_N4/aol/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/jmlr_tables.tex ADDED
@@ -0,0 +1,469 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ % JMLR-ready tables for two-column papers
2
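+ % Required packages (no siunitx; the tables also need amsmath for \text, amssymb for \blacktriangle/\blacktriangledown, and xcolor for \textcolor):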
3
+ % \usepackage{booktabs}
4
+ % \usepackage{threeparttable}
5
+ % \usepackage{threeparttablex} % for TableNotes + longtable
6
+ % \usepackage{longtable}
7
+ % Optional for landscape: \usepackage{pdflscape}
8
+
9
+ \begin{table*}[t]
10
+ \centering
11
+ \begin{threeparttable}
12
+ \caption{Model dimension ranges (min--max across all datasets and folds). Input and output dimensions follow each dataset's feature and label spaces, respectively.}
13
+ \label{tab:model-ranges}
14
+ \begin{tabular}{l r r r r r r}
15
+ \toprule
16
+ Algorithm & Width & Depth & Parameters & Padding & Input dim & Output dim \\
17
+ \midrule
18
+ AOL & 32--512 & 4--4 & 282--694837 & 10--524 & 3--262 & 2--100 \\
19
+ Orthogonal & 32--512 & 4--4 & 285--694840 & 10--524 & 3--262 & 2--100 \\
20
+ Sandwich & 32--512 & 4--4 & 615--1520140 & 10--524 & 3--262 & 2--100 \\
21
+ SLL & 32--512 & 4--4 & 1558--1084073 & 10--524 & 3--262 & 2--100 \\
22
+ LDLT-L & 32--512 & 4--4 & 3366--929297 & 10--524 & 3--262 & 2--100 \\
23
+ LDLT-R & 32--512 & 4--4 & 3463--1063442 & 10--524 & 3--262 & 2--100 \\
24
+ \bottomrule
25
+ \end{tabular}
26
+ \end{threeparttable}
27
+ \end{table*}
28
+
29
+ \begin{table*}[t]
30
+ \centering
31
+ \begin{threeparttable}
32
+ \caption{Sorted mean$\pm$std across $N$ datasets for each algorithm. Bold marks the best mean in each column.}
33
+ \label{tab:metric_summary}
34
+ \begin{tabular}{l r lllll}
35
+ \toprule
36
+ & & & \multicolumn{4}{c}{Certified Accuracy} \\
37
+ \cmidrule(lr){4-7}
38
+ Algorithm & $N$ & Accuracy & 36/255 & 72/255 & 108/255 & 255/255 \\
39
+ \midrule
40
+ AOL & 121 & 0.6295\,\tiny$\pm$0.2278 & 0.3669\,\tiny$\pm$0.2895 & 0.2660\,\tiny$\pm$0.2953 & 0.2076\,\tiny$\pm$0.2819 & 0.0999\,\tiny$\pm$0.1875 \\
41
+ Orthogonal & 121 & 0.6969\,\tiny$\pm$0.1938 & 0.5973\,\tiny$\pm$0.2386 & 0.5073\,\tiny$\pm$0.2617 & 0.4300\,\tiny$\pm$0.2702 & 0.1970\,\tiny$\pm$0.2288 \\
42
+ Sandwich & 121 & 0.7215\,\tiny$\pm$0.1871 & \textbf{0.6375\,\tiny$\pm$0.2305} & \textbf{0.5593\,\tiny$\pm$0.2503} & \textbf{0.4836\,\tiny$\pm$0.2659} & \textbf{0.2496\,\tiny$\pm$0.2471} \\
43
+ SLL & 121 & 0.6978\,\tiny$\pm$0.1998 & 0.5885\,\tiny$\pm$0.2451 & 0.4975\,\tiny$\pm$0.2649 & 0.4146\,\tiny$\pm$0.2715 & 0.1918\,\tiny$\pm$0.2222 \\
44
+ \midrule
45
+ LDLT-L & 121 & \textbf{0.7223\,\tiny$\pm$0.1868} & 0.5301\,\tiny$\pm$0.2920 & 0.4293\,\tiny$\pm$0.3049 & 0.3535\,\tiny$\pm$0.3003 & 0.1652\,\tiny$\pm$0.2281 \\
46
+ LDLT-R & 121 & 0.7022\,\tiny$\pm$0.1944 & 0.6107\,\tiny$\pm$0.2314 & 0.5292\,\tiny$\pm$0.2525 & 0.4492\,\tiny$\pm$0.2655 & 0.2172\,\tiny$\pm$0.2312 \\
47
+ \bottomrule
48
+ \end{tabular}
49
+ \end{threeparttable}
50
+ \end{table*}
51
+
52
+ \begin{table}[t]
53
+ \centering
54
+ \begin{threeparttable}
55
+ {\small
56
+ \caption{Overall comparison on Mean Accuracy: average rank (lower is better) with Iman--Davenport $F=44.33$ (df$=(5, 600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
57
+ \label{tab:overall:mean_test_acc}
58
+ \setlength{\tabcolsep}{4pt}
59
+ \begin{tabular}{@{}l r r r r r r@{}}
60
+ \toprule
61
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
62
+ \midrule
63
+ LDLT-L & 2.434 & 4 & 0 & 4 & 0.800 & 0.577 \\
64
+ Sandwich & 2.566 & 4 & 0 & 4 & 0.800 & 0.517 \\
65
+ LDLT-R & 3.438 & 1 & 2 & -1 & 0.200 & 0.629 \\
66
+ SLL & 3.624 & 1 & 2 & -1 & 0.200 & 0.678 \\
67
+ Orthogonal & 3.831 & 1 & 2 & -1 & 0.200 & 0.639 \\
68
+ AOL & 5.107 & 0 & 5 & -5 & 0.000 & 0.000 \\
69
+ \bottomrule
70
+ \end{tabular}
71
+ }
72
+ \end{threeparttable}
73
+ \end{table}
74
+
75
+ \begin{table}[t]
76
+ \centering
77
+ \begin{threeparttable}
78
+ {\small
79
+ \caption{Overall comparison on Mean Certified Accuracy (36/255): average rank (lower is better) with Iman--Davenport $F=89.22$ (df$=(5, 600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
80
+ \label{tab:overall:mean_cert_acc_36}
81
+ \setlength{\tabcolsep}{4pt}
82
+ \begin{tabular}{@{}l r r r r r r@{}}
83
+ \toprule
84
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
85
+ \midrule
86
+ Sandwich & 2.021 & 5 & 0 & 5 & 1.000 & 0.626 \\
87
+ LDLT-R & 2.715 & 4 & 1 & 3 & 0.800 & 0.514 \\
88
+ Orthogonal & 3.417 & 2 & 2 & 0 & 0.400 & 0.627 \\
89
+ SLL & 3.426 & 2 & 2 & 0 & 0.400 & 0.602 \\
90
+ LDLT-L & 3.785 & 1 & 4 & -3 & 0.200 & 0.732 \\
91
+ AOL & 5.636 & 0 & 5 & -5 & 0.000 & 0.000 \\
92
+ \bottomrule
93
+ \end{tabular}
94
+ }
95
+ \end{threeparttable}
96
+ \end{table}
97
+
98
+ \begin{table}[t]
99
+ \centering
100
+ \begin{threeparttable}
101
+ {\small
102
+ \caption{Overall comparison on Mean Certified Accuracy (72/255): average rank (lower is better) with Iman--Davenport $F=101.00$ (df$=(5, 600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
103
+ \label{tab:overall:mean_cert_acc_72}
104
+ \setlength{\tabcolsep}{4pt}
105
+ \begin{tabular}{@{}l r r r r r r@{}}
106
+ \toprule
107
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
108
+ \midrule
109
+ Sandwich & 1.926 & 5 & 0 & 5 & 1.000 & 0.670 \\
110
+ LDLT-R & 2.628 & 4 & 1 & 3 & 0.800 & 0.557 \\
111
+ Orthogonal & 3.376 & 2 & 2 & 0 & 0.400 & 0.643 \\
112
+ SLL & 3.409 & 2 & 2 & 0 & 0.400 & 0.640 \\
113
+ LDLT-L & 4.058 & 1 & 4 & -3 & 0.200 & 0.732 \\
114
+ AOL & 5.603 & 0 & 5 & -5 & 0.000 & 0.000 \\
115
+ \bottomrule
116
+ \end{tabular}
117
+ }
118
+ \end{threeparttable}
119
+ \end{table}
120
+
121
+ \begin{table}[t]
122
+ \centering
123
+ \begin{threeparttable}
124
+ {\small
125
+ \caption{Overall comparison on Mean Certified Accuracy (108/255): average rank (lower is better) with Iman--Davenport $F=125.70$ (df$=(5, 600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
126
+ \label{tab:overall:mean_cert_acc_108}
127
+ \setlength{\tabcolsep}{4pt}
128
+ \begin{tabular}{@{}l r r r r r r@{}}
129
+ \toprule
130
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
131
+ \midrule
132
+ Sandwich & 1.868 & 5 & 0 & 5 & 1.000 & 0.675 \\
133
+ LDLT-R & 2.562 & 4 & 1 & 3 & 0.800 & 0.548 \\
134
+ Orthogonal & 3.347 & 2 & 2 & 0 & 0.400 & 0.674 \\
135
+ SLL & 3.360 & 2 & 2 & 0 & 0.400 & 0.660 \\
136
+ LDLT-L & 4.136 & 1 & 4 & -3 & 0.200 & 0.801 \\
137
+ AOL & 5.727 & 0 & 5 & -5 & 0.000 & 0.000 \\
138
+ \bottomrule
139
+ \end{tabular}
140
+ }
141
+ \end{threeparttable}
142
+ \end{table}
143
+
144
+ \begin{table}[t]
145
+ \centering
146
+ \begin{threeparttable}
147
+ {\small
148
+ \caption{Overall comparison on Mean Certified Accuracy (255/255): average rank (lower is better) with Iman--Davenport $F=105.79$ (df$=(5, 600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
149
+ \label{tab:overall:mean_cert_acc_255}
150
+ \setlength{\tabcolsep}{4pt}
151
+ \begin{tabular}{@{}l r r r r r r@{}}
152
+ \toprule
153
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
154
+ \midrule
155
+ Sandwich & 1.909 & 5 & 0 & 5 & 1.000 & 0.671 \\
156
+ LDLT-R & 2.550 & 4 & 1 & 3 & 0.800 & 0.575 \\
157
+ SLL & 3.310 & 2 & 2 & 0 & 0.400 & 0.662 \\
158
+ Orthogonal & 3.471 & 2 & 2 & 0 & 0.400 & 0.607 \\
159
+ LDLT-L & 4.202 & 1 & 4 & -3 & 0.200 & 0.796 \\
160
+ AOL & 5.558 & 0 & 5 & -5 & 0.000 & 0.000 \\
161
+ \bottomrule
162
+ \end{tabular}
163
+ }
164
+ \end{threeparttable}
165
+ \end{table}
166
+
167
+ \begin{table}[t]
168
+ \centering
169
+ \begin{threeparttable}
170
+ {
171
+ \caption{Pairwise Wilcoxon outcomes for Mean Accuracy (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ no significant difference).}
172
+ \label{tab:signif:mean_test_acc}
173
+ \setlength{\tabcolsep}{3pt}
174
+ \begin{tabular}{@{}l c c c c c c @{}}
175
+ \toprule
176
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
177
+ \midrule
178
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
179
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
180
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
181
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
182
+ Sandwich & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
183
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
184
+ \bottomrule
185
+ \end{tabular}
186
+ }
187
+ \end{threeparttable}
188
+ \end{table}
189
+
190
+ \begin{table}[t]
191
+ \centering
192
+ \begin{threeparttable}
193
+ {
194
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (36/255) (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ no significant difference).}
195
+ \label{tab:signif:mean_cert_acc_36}
196
+ \setlength{\tabcolsep}{3pt}
197
+ \begin{tabular}{@{}l c c c c c c @{}}
198
+ \toprule
199
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
200
+ \midrule
201
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
202
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
203
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
204
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
205
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
206
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
207
+ \bottomrule
208
+ \end{tabular}
209
+ }
210
+ \end{threeparttable}
211
+ \end{table}
212
+
213
+ \begin{table}[t]
214
+ \centering
215
+ \begin{threeparttable}
216
+ {
217
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (72/255) (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ no significant difference).}
218
+ \label{tab:signif:mean_cert_acc_72}
219
+ \setlength{\tabcolsep}{3pt}
220
+ \begin{tabular}{@{}l c c c c c c @{}}
221
+ \toprule
222
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
223
+ \midrule
224
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
225
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
226
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
227
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
228
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
229
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
230
+ \bottomrule
231
+ \end{tabular}
232
+ }
233
+ \end{threeparttable}
234
+ \end{table}
235
+
236
+ \begin{table}[t]
237
+ \centering
238
+ \begin{threeparttable}
239
+ {
240
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (108/255) (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ no significant difference).}
241
+ \label{tab:signif:mean_cert_acc_108}
242
+ \setlength{\tabcolsep}{3pt}
243
+ \begin{tabular}{@{}l c c c c c c @{}}
244
+ \toprule
245
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
246
+ \midrule
247
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
248
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
249
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
250
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
251
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
252
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
253
+ \bottomrule
254
+ \end{tabular}
255
+ }
256
+ \end{threeparttable}
257
+ \end{table}
258
+
259
+ \begin{table}[t]
260
+ \centering
261
+ \begin{threeparttable}
262
+ {
263
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (255/255) (Holm within-metric at $\alpha=0.05$): row vs.\ column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ no significant difference).}
264
+ \label{tab:signif:mean_cert_acc_255}
265
+ \setlength{\tabcolsep}{3pt}
266
+ \begin{tabular}{@{}l c c c c c c @{}}
267
+ \toprule
268
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
269
+ \midrule
270
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
271
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
272
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
273
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
274
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
275
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
276
+ \bottomrule
277
+ \end{tabular}
278
+ }
279
+ \end{threeparttable}
280
+ \end{table}
281
+
282
+
283
+ \begin{table*}[t]
284
+ \centering
285
+ \begin{threeparttable}
286
+ \caption[Mean Accuracy]{Wilcoxon signed-rank tests (two-sided) for Mean Accuracy; $p$-values with Holm FWER corrections within-metric and global.}
287
+ \label{tab:wilcoxon:mean_test_acc}
288
+ \begingroup
289
+ \setlength{\tabcolsep}{4pt}
290
+ \begin{tabular}{ll r r r r r r r r r r r}
291
+ \toprule
292
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
293
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
294
+ \midrule
295
+ AOL & LDLT-L & 121 & 16 & 105 & 0 & 0.1322 & -0.0568 & 412 & $2.3e-17^{***}$ & $3.4e-16^{***}$ & $0^{***}$ & 0.7708 \\
296
+ AOL & Sandwich & 121 & 18 & 103 & 0 & 0.1488 & -0.0595 & 518 & $2.3e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7459 \\
297
+ AOL & SLL & 121 & 22 & 99 & 0 & 0.1818 & -0.0351 & 806 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6782 \\
298
+ AOL & Orthogonal & 121 & 27 & 94 & 0 & 0.2231 & -0.0265 & 971 & $0^{***}$ & $0^{***}$ & $1.0e-10^{***}$ & 0.6394 \\
299
+ AOL & LDLT-R & 121 & 25 & 96 & 0 & 0.2066 & -0.0313 & 1013 & $0^{***}$ & $0^{***}$ & $2.0e-10^{***}$ & 0.6295 \\
300
+ Orthogonal & Sandwich & 121 & 31 & 89 & 1 & 0.2603 & -0.0126 & 1269 & $6.0e-10^{***}$ & $6.3e-09^{***}$ & $2.2e-08^{***}$ & 0.5643 \\
301
+ LDLT-L & Orthogonal & 121 & 94 & 27 & 0 & 0.7769 & 0.0139 & 1309 & $7.0e-10^{***}$ & $6.6e-09^{***}$ & $2.5e-08^{***}$ & 0.5599 \\
302
+ LDLT-L & SLL & 121 & 86 & 35 & 0 & 0.7107 & 0.0111 & 1503 & $1.5e-08^{***}$ & $1.2e-07^{***}$ & $4.9e-07^{***}$ & 0.5143 \\
303
+ LDLT-L & LDLT-R & 121 & 87 & 33 & 1 & 0.7231 & 0.0108 & 1689 & $3.7e-07^{***}$ & $2.6e-06^{***}$ & $1.1e-05^{***}$ & 0.4639 \\
304
+ Sandwich & SLL & 121 & 83 & 38 & 0 & 0.6860 & 0.0090 & 1789 & $8.8e-07^{***}$ & $5.3e-06^{***}$ & $2.3e-05^{***}$ & 0.4470 \\
305
+ LDLT-R & Sandwich & 121 & 43 & 78 & 0 & 0.3554 & -0.0068 & 2364 & $6.0e-04^{***}$ & $3.0e-03^{**}$ & $7.2e-03^{**}$ & 0.3118 \\
306
+ LDLT-R & SLL & 121 & 66 & 54 & 1 & 0.5496 & 0.0019 & 3070 & $1.4e-01$ & $5.7e-01$ & $8.7e-01$ & 0.1338 \\
307
+ LDLT-R & Orthogonal & 121 & 71 & 50 & 0 & 0.5868 & 0.0025 & 3138 & $1.5e-01$ & $5.7e-01$ & $8.7e-01$ & 0.1298 \\
308
+ Orthogonal & SLL & 121 & 60 & 61 & 0 & 0.4959 & -0.0004 & 3623 & $8.6e-01$ & $1.0e+00$ & $1.0e+00$ & 0.0158 \\
309
+ LDLT-L & Sandwich & 121 & 59 & 62 & 0 & 0.4876 & -0.0002 & 3624 & $8.6e-01$ & $1.0e+00$ & $1.0e+00$ & 0.0155 \\
310
+ \bottomrule
311
+ \end{tabular}
312
+ \begin{tablenotes}
313
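+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$). Entries printed as $0$ are positive $p$-values rounded to zero by the number formatting; a Holm-adjusted $p$-value is never smaller than its raw $p$-value.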
314
+ \end{tablenotes}
315
+ \endgroup
316
+ \end{threeparttable}
317
+ \end{table*}
318
+
319
+
320
+
321
+ \begin{table*}[t]
322
+ \centering
323
+ \begin{threeparttable}
324
+ \caption[Mean Certified Accuracy (36/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (36/255); $p$-values with Holm FWER corrections within-metric and global.}
325
+ \label{tab:wilcoxon:mean_cert_acc_36}
326
+ \begingroup
327
+ \setlength{\tabcolsep}{4pt}
328
+ \begin{tabular}{ll r r r r r r r r r r r}
329
+ \toprule
330
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
331
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
332
+ \midrule
333
+ AOL & LDLT-R & 121 & 6 & 115 & 0 & 0.0496 & -0.2319 & 84 & $1.1e-20^{***}$ & $1.6e-19^{***}$ & $7.7e-19^{***}$ & 0.8479 \\
334
+ AOL & Sandwich & 121 & 6 & 115 & 0 & 0.0496 & -0.2436 & 88 & $1.2e-20^{***}$ & $1.7e-19^{***}$ & $8.4e-19^{***}$ & 0.8470 \\
335
+ AOL & SLL & 121 & 6 & 115 & 0 & 0.0496 & -0.1912 & 145 & $4.8e-20^{***}$ & $6.2e-19^{***}$ & $3.2e-18^{***}$ & 0.8336 \\
336
+ AOL & Orthogonal & 121 & 10 & 111 & 0 & 0.0826 & -0.2187 & 196 & $1.6e-19^{***}$ & $1.9e-18^{***}$ & $1.0e-17^{***}$ & 0.8216 \\
337
+ AOL & LDLT-L & 121 & 16 & 105 & 0 & 0.1322 & -0.1218 & 579 & $8.5e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7315 \\
338
+ LDLT-L & Sandwich & 121 & 28 & 93 & 0 & 0.2314 & -0.0511 & 884 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6598 \\
339
+ Orthogonal & Sandwich & 121 & 24 & 96 & 1 & 0.2025 & -0.0275 & 1002 & $0^{***}$ & $0^{***}$ & $2.0e-10^{***}$ & 0.6282 \\
340
+ Sandwich & SLL & 121 & 97 & 24 & 0 & 0.8017 & 0.0199 & 1005 & $0^{***}$ & $0^{***}$ & $2.0e-10^{***}$ & 0.6314 \\
341
+ LDLT-L & LDLT-R & 121 & 39 & 82 & 0 & 0.3223 & -0.0372 & 1356 & $1.6e-09^{***}$ & $1.1e-08^{***}$ & $5.2e-08^{***}$ & 0.5488 \\
342
+ LDLT-L & Orthogonal & 121 & 47 & 74 & 0 & 0.3884 & -0.0190 & 1855 & $2.1e-06^{***}$ & $1.2e-05^{***}$ & $4.8e-05^{***}$ & 0.4315 \\
343
+ LDLT-R & SLL & 121 & 81 & 39 & 1 & 0.6736 & 0.0118 & 2104 & $6.5e-05^{***}$ & $2.5e-04^{***}$ & $1.0e-03^{**}$ & 0.3647 \\
344
+ LDLT-L & SLL & 121 & 49 & 72 & 0 & 0.4050 & -0.0075 & 2119 & $4.8e-05^{***}$ & $2.4e-04^{***}$ & $9.2e-04^{***}$ & 0.3694 \\
345
+ LDLT-R & Sandwich & 121 & 41 & 80 & 0 & 0.3388 & -0.0168 & 2142 & $6.2e-05^{***}$ & $2.5e-04^{***}$ & $1.0e-03^{**}$ & 0.3640 \\
346
+ LDLT-R & Orthogonal & 121 & 78 & 43 & 0 & 0.6446 & 0.0126 & 2429 & $1.1e-03^{**}$ & $2.2e-03^{**}$ & $1.1e-02^{*}$ & 0.2965 \\
347
+ Orthogonal & SLL & 121 & 60 & 61 & 0 & 0.4959 & -0.0004 & 3076 & $1.1e-01$ & $1.1e-01$ & $8.7e-01$ & 0.1444 \\
348
+ \bottomrule
349
+ \end{tabular}
350
+ \begin{tablenotes}
351
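+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$). Entries printed as $0$ are positive $p$-values rounded to zero by the number formatting; a Holm-adjusted $p$-value is never smaller than its raw $p$-value.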
352
+ \end{tablenotes}
353
+ \endgroup
354
+ \end{threeparttable}
355
+ \end{table*}
356
+
357
+
358
+
359
+ \begin{table*}[t]
360
+ \centering
361
+ \begin{threeparttable}
362
+ \caption[Mean Certified Accuracy (72/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (72/255); $p$-values with Holm FWER corrections within-metric and global.}
363
+ \label{tab:wilcoxon:mean_cert_acc_72}
364
+ \begingroup
365
+ \setlength{\tabcolsep}{4pt}
366
+ \begin{tabular}{ll r r r r r r r r r r r}
367
+ \toprule
368
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
369
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
370
+ \midrule
371
+ AOL & Sandwich & 121 & 7 & 114 & 0 & 0.0579 & -0.2614 & 107 & $1.9e-20^{***}$ & $2.9e-19^{***}$ & $1.3e-18^{***}$ & 0.8425 \\
372
+ AOL & LDLT-R & 121 & 5 & 116 & 0 & 0.0413 & -0.2327 & 116 & $2.4e-20^{***}$ & $3.3e-19^{***}$ & $1.6e-18^{***}$ & 0.8404 \\
373
+ AOL & SLL & 121 & 5 & 116 & 0 & 0.0413 & -0.1928 & 162 & $7.1e-20^{***}$ & $9.3e-19^{***}$ & $4.6e-18^{***}$ & 0.8296 \\
374
+ AOL & Orthogonal & 121 & 11 & 110 & 0 & 0.0909 & -0.2064 & 214 & $2.4e-19^{***}$ & $2.9e-18^{***}$ & $1.5e-17^{***}$ & 0.8174 \\
375
+ AOL & LDLT-L & 121 & 19 & 100 & 2 & 0.1653 & -0.1250 & 557 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7323 \\
376
+ Orthogonal & Sandwich & 121 & 19 & 101 & 1 & 0.1612 & -0.0346 & 601 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7240 \\
377
+ LDLT-L & Sandwich & 121 & 20 & 101 & 0 & 0.1653 & -0.0772 & 607 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7250 \\
378
+ Sandwich & SLL & 121 & 95 & 25 & 1 & 0.7893 & 0.0393 & 801 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6762 \\
379
+ LDLT-L & LDLT-R & 121 & 30 & 91 & 0 & 0.2479 & -0.0627 & 930 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6490 \\
380
+ LDLT-L & Orthogonal & 121 & 42 & 79 & 0 & 0.3471 & -0.0210 & 1696 & $2.5e-07^{***}$ & $1.5e-06^{***}$ & $7.5e-06^{***}$ & 0.4689 \\
381
+ LDLT-L & SLL & 121 & 42 & 79 & 0 & 0.3471 & -0.0213 & 1776 & $7.4e-07^{***}$ & $3.7e-06^{***}$ & $2.0e-05^{***}$ & 0.4501 \\
382
+ LDLT-R & SLL & 121 & 83 & 38 & 0 & 0.6860 & 0.0192 & 1938 & $5.9e-06^{***}$ & $2.3e-05^{***}$ & $1.3e-04^{***}$ & 0.4120 \\
383
+ LDLT-R & Sandwich & 121 & 40 & 81 & 0 & 0.3306 & -0.0197 & 2062 & $2.5e-05^{***}$ & $7.6e-05^{***}$ & $5.2e-04^{***}$ & 0.3828 \\
384
+ LDLT-R & Orthogonal & 121 & 78 & 43 & 0 & 0.6446 & 0.0178 & 2306 & $3.4e-04^{***}$ & $6.9e-04^{***}$ & $4.5e-03^{**}$ & 0.3254 \\
385
+ Orthogonal & SLL & 121 & 66 & 55 & 0 & 0.5455 & 0.0041 & 3178 & $1.9e-01$ & $1.9e-01$ & $8.7e-01$ & 0.1204 \\
386
+ \bottomrule
387
+ \end{tabular}
388
+ \begin{tablenotes}
389
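+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$). Entries printed as $0$ are positive $p$-values rounded to zero by the number formatting; a Holm-adjusted $p$-value is never smaller than its raw $p$-value.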
390
+ \end{tablenotes}
391
+ \endgroup
392
+ \end{threeparttable}
393
+ \end{table*}
394
+
395
+
396
+
397
+ \begin{table*}[t]
398
+ \centering
399
+ \begin{threeparttable}
400
+ \caption[Mean Certified Accuracy (108/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (108/255); $p$-values with Holm FWER corrections within-metric and global.}
401
+ \label{tab:wilcoxon:mean_cert_acc_108}
402
+ \begingroup
403
+ \setlength{\tabcolsep}{4pt}
404
+ \begin{tabular}{ll r r r r r r r r r r r}
405
+ \toprule
406
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
407
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
408
+ \midrule
409
+ AOL & LDLT-R & 121 & 1 & 120 & 0 & 0.0083 & -0.2229 & 11 & $1.8e-21^{***}$ & $2.7e-20^{***}$ & $1.3e-19^{***}$ & 0.8651 \\
410
+ AOL & SLL & 121 & 4 & 117 & 0 & 0.0331 & -0.1616 & 33 & $3.1e-21^{***}$ & $4.3e-20^{***}$ & $2.3e-19^{***}$ & 0.8599 \\
411
+ AOL & Orthogonal & 121 & 6 & 115 & 0 & 0.0496 & -0.1829 & 54 & $5.2e-21^{***}$ & $6.8e-20^{***}$ & $3.8e-19^{***}$ & 0.8550 \\
412
+ AOL & Sandwich & 121 & 5 & 116 & 0 & 0.0413 & -0.2530 & 63 & $6.5e-21^{***}$ & $7.8e-20^{***}$ & $4.7e-19^{***}$ & 0.8529 \\
413
+ AOL & LDLT-L & 121 & 15 & 102 & 4 & 0.1405 & -0.0795 & 265 & $4.5e-18^{***}$ & $5.0e-17^{***}$ & $2.7e-16^{***}$ & 0.8011 \\
414
+ LDLT-L & Sandwich & 121 & 16 & 104 & 1 & 0.1364 & -0.0911 & 469 & $1.3e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7556 \\
415
+ Orthogonal & Sandwich & 121 & 15 & 106 & 0 & 0.1240 & -0.0411 & 634 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7186 \\
416
+ Sandwich & SLL & 121 & 95 & 25 & 1 & 0.7893 & 0.0391 & 769 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6839 \\
417
+ LDLT-L & LDLT-R & 121 & 28 & 93 & 0 & 0.2314 & -0.0559 & 854 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6669 \\
418
+ LDLT-L & Orthogonal & 121 & 39 & 82 & 0 & 0.3223 & -0.0289 & 1595 & $6.0e-08^{***}$ & $3.6e-07^{***}$ & $1.9e-06^{***}$ & 0.4926 \\
419
+ LDLT-L & SLL & 121 & 37 & 82 & 2 & 0.3140 & -0.0231 & 1675 & $5.1e-07^{***}$ & $2.5e-06^{***}$ & $1.4e-05^{***}$ & 0.4605 \\
420
+ LDLT-R & SLL & 121 & 83 & 38 & 0 & 0.6860 & 0.0187 & 2059 & $2.5e-05^{***}$ & $9.8e-05^{***}$ & $5.2e-04^{***}$ & 0.3835 \\
421
+ LDLT-R & Sandwich & 121 & 43 & 78 & 0 & 0.3554 & -0.0213 & 2138 & $6.0e-05^{***}$ & $1.8e-04^{***}$ & $1.0e-03^{**}$ & 0.3649 \\
422
+ LDLT-R & Orthogonal & 121 & 77 & 44 & 0 & 0.6364 & 0.0182 & 2506 & $2.2e-03^{**}$ & $4.4e-03^{**}$ & $2.0e-02^{*}$ & 0.2784 \\
423
+ Orthogonal & SLL & 121 & 65 & 56 & 0 & 0.5372 & 0.0038 & 3069 & $1.1e-01$ & $1.1e-01$ & $8.7e-01$ & 0.1460 \\
424
+ \bottomrule
425
+ \end{tabular}
426
+ \begin{tablenotes}
427
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
428
+ \end{tablenotes}
429
+ \endgroup
430
+ \end{threeparttable}
431
+ \end{table*}
432
+
433
+
434
+
435
+ \begin{table*}[t]
436
+ \centering
437
+ \begin{threeparttable}
438
+ \caption[Mean Certified Accuracy (255/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (255/255); $p$-values with Holm FWER corrections within-metric and global.}
439
+ \label{tab:wilcoxon:mean_cert_acc_255}
440
+ \begingroup
441
+ \setlength{\tabcolsep}{4pt}
442
+ \begin{tabular}{ll r r r r r r r r r r r}
443
+ \toprule
444
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
445
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
446
+ \midrule
447
+ AOL & LDLT-R & 121 & 1 & 111 & 9 & 0.0455 & -0.0570 & 10 & $5.4e-20^{***}$ & $8.2e-19^{***}$ & $3.6e-18^{***}$ & 0.8651 \\
448
+ AOL & SLL & 121 & 3 & 104 & 14 & 0.0826 & -0.0476 & 23 & $5.3e-19^{***}$ & $6.9e-18^{***}$ & $3.2e-17^{***}$ & 0.8610 \\
449
+ AOL & Sandwich & 121 & 2 & 112 & 7 & 0.0455 & -0.0803 & 62 & $9.9e-20^{***}$ & $1.4e-18^{***}$ & $6.3e-18^{***}$ & 0.8514 \\
450
+ AOL & Orthogonal & 121 & 5 & 105 & 11 & 0.0868 & -0.0363 & 122 & $2.4e-18^{***}$ & $2.8e-17^{***}$ & $1.4e-16^{***}$ & 0.8331 \\
451
+ AOL & LDLT-L & 121 & 8 & 85 & 28 & 0.1818 & -0.0160 & 182 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7958 \\
452
+ Orthogonal & Sandwich & 121 & 11 & 103 & 7 & 0.1198 & -0.0313 & 258 & $1.4e-17^{***}$ & $1.5e-16^{***}$ & $8.1e-16^{***}$ & 0.7995 \\
453
+ LDLT-L & Sandwich & 121 & 12 & 102 & 7 & 0.1281 & -0.0397 & 342 & $1.1e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7772 \\
454
+ LDLT-L & LDLT-R & 121 & 23 & 89 & 9 & 0.2273 & -0.0242 & 927 & $1.0e-10^{***}$ & $6.0e-10^{***}$ & $3.0e-09^{***}$ & 0.6135 \\
455
+ Sandwich & SLL & 121 & 90 & 25 & 6 & 0.7686 & 0.0240 & 977 & $0^{***}$ & $4.0e-10^{***}$ & $1.7e-09^{***}$ & 0.6135 \\
456
+ LDLT-L & SLL & 121 & 27 & 79 & 15 & 0.2851 & -0.0091 & 1323 & $1.9e-06^{***}$ & $9.4e-06^{***}$ & $4.5e-05^{***}$ & 0.4629 \\
457
+ LDLT-R & SLL & 121 & 80 & 35 & 6 & 0.6860 & 0.0175 & 1603 & $1.4e-06^{***}$ & $8.1e-06^{***}$ & $3.4e-05^{***}$ & 0.4506 \\
458
+ LDLT-L & Orthogonal & 121 & 36 & 75 & 10 & 0.3388 & -0.0085 & 1741 & $5.8e-05^{***}$ & $2.3e-04^{***}$ & $1.0e-03^{**}$ & 0.3816 \\
459
+ LDLT-R & Orthogonal & 121 & 77 & 40 & 4 & 0.6529 & 0.0132 & 1982 & $6.5e-05^{***}$ & $2.3e-04^{***}$ & $1.0e-03^{**}$ & 0.3694 \\
460
+ LDLT-R & Sandwich & 121 & 45 & 73 & 3 & 0.3843 & -0.0078 & 2234 & $6.1e-04^{***}$ & $1.2e-03^{**}$ & $7.2e-03^{**}$ & 0.3154 \\
461
+ Orthogonal & SLL & 121 & 55 & 58 & 8 & 0.4876 & 0.0000 & 3068 & $6.6e-01$ & $6.6e-01$ & $1.0e+00$ & 0.0410 \\
462
+ \bottomrule
463
+ \end{tabular}
464
+ \begin{tablenotes}
465
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
466
+ \end{tablenotes}
467
+ \endgroup
468
+ \end{threeparttable}
469
+ \end{table*}
UCI_N4/ldlt-resnet/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/ldlt/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/ortho/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/sandwich/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/sdp/runs/abalone/fold_0/result.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 52,
3
+ "best_val_acc": 0.6253968253968254,
4
+ "test_acc": 0.6360367558929285,
5
+ "train_size": 1044,
6
+ "val_size": 630,
7
+ "test_size": 2503,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.03759131666666678,
12
+ -0.0067216787931033565,
13
+ -0.00504821235632188,
14
+ -0.010079406034482869,
15
+ 0.0077948497126437005,
16
+ -0.0035954527720305413,
17
+ 0.011847337255747069,
18
+ 0.020808682452107305
19
+ ]
20
+ ],
21
+ "std": [
22
+ [
23
+ 0.9932562075552053,
24
+ 1.0067465043023525,
25
+ 0.9980809038500921,
26
+ 0.9297052233036605,
27
+ 1.0141436995589543,
28
+ 0.9931430828536596,
29
+ 1.017739933100054,
30
+ 1.0318462596531948
31
+ ]
32
+ ]
33
+ },
34
+ "width": 32,
35
+ "in_features": 8,
36
+ "out_features": 3,
37
+ "depth": 4,
38
+ "padding": 16,
39
+ "parameters": 2355,
40
+ "cert_evals": {
41
+ "36": 0.5201757550239563,
42
+ "72": 0.3999200761318207,
43
+ "108": 0.3156212568283081,
44
+ "255": 0.17578904330730438
45
+ }
46
+ }
UCI_N4/sdp/runs/abalone/fold_1/result.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 38,
3
+ "best_val_acc": 0.6735668789808917,
4
+ "test_acc": 0.6463073852295409,
5
+ "train_size": 1044,
6
+ "val_size": 628,
7
+ "test_size": 2505,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.005192849233716447,
12
+ -0.0023747756321838803,
13
+ -0.004999904980842867,
14
+ -0.01065197068965531,
15
+ -0.001757506036398443,
16
+ -0.0004581268045977247,
17
+ -0.008801511695402298,
18
+ -0.0025385303256705034
19
+ ]
20
+ ],
21
+ "std": [
22
+ [
23
+ 0.9921988752896624,
24
+ 1.0113577078934743,
25
+ 1.0108378611135136,
26
+ 0.93746968476643,
27
+ 1.0135082046349184,
28
+ 1.0099861173658438,
29
+ 1.0142707677051552,
30
+ 1.019381711286177
31
+ ]
32
+ ]
33
+ },
34
+ "width": 32,
35
+ "in_features": 8,
36
+ "out_features": 3,
37
+ "depth": 4,
38
+ "padding": 16,
39
+ "parameters": 2355,
40
+ "cert_evals": {
41
+ "36": 0.5117764472961426,
42
+ "72": 0.3960079848766327,
43
+ "108": 0.32255488634109497,
44
+ "255": 0.18483033776283264
45
+ }
46
+ }
UCI_N4/sdp/runs/abalone/fold_2/result.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 28,
3
+ "best_val_acc": 0.6888519134775375,
4
+ "test_acc": 0.6291469194312796,
5
+ "train_size": 1044,
6
+ "val_size": 601,
7
+ "test_size": 2532,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.017948929501915466,
12
+ 0.023985624319923418,
13
+ 0.023087170114942556,
14
+ 0.018317038026819783,
15
+ 0.02778346245977014,
16
+ 0.025539904827586328,
17
+ 0.018261344003831434,
18
+ 0.034770174578544095
19
+ ]
20
+ ],
21
+ "std": [
22
+ [
23
+ 0.9978233519534647,
24
+ 1.0049712832060378,
25
+ 1.0100440980049294,
26
+ 0.9634042347353897,
27
+ 1.0033357823934823,
28
+ 1.0054816988393045,
29
+ 0.9890488354165379,
30
+ 1.0152622279378631
31
+ ]
32
+ ]
33
+ },
34
+ "width": 32,
35
+ "in_features": 8,
36
+ "out_features": 3,
37
+ "depth": 4,
38
+ "padding": 16,
39
+ "parameters": 2355,
40
+ "cert_evals": {
41
+ "36": 0.49842023849487305,
42
+ "72": 0.38270142674446106,
43
+ "108": 0.29936808347702026,
44
+ "255": 0.17890995740890503
45
+ }
46
+ }
UCI_N4/sdp/runs/abalone/fold_3/result.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 80,
3
+ "best_val_acc": 0.6523887973640856,
4
+ "test_acc": 0.6361836896278702,
5
+ "train_size": 1044,
6
+ "val_size": 607,
7
+ "test_size": 2526,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.039933615229885006,
12
+ 0.033357397988505864,
13
+ 0.02810616465517236,
14
+ 0.015225409386973148,
15
+ 0.03982630053544057,
16
+ 0.03327093634674338,
17
+ 0.031858401652298855,
18
+ 0.04330609419540234
19
+ ]
20
+ ],
21
+ "std": [
22
+ [
23
+ 1.000898664612302,
24
+ 1.0028361176421674,
25
+ 1.0029617333979737,
26
+ 0.9244955132147792,
27
+ 1.020547570022181,
28
+ 1.016662196023235,
29
+ 1.0053994226175234,
30
+ 1.025123395710352
31
+ ]
32
+ ]
33
+ },
34
+ "width": 32,
35
+ "in_features": 8,
36
+ "out_features": 3,
37
+ "depth": 4,
38
+ "padding": 16,
39
+ "parameters": 2355,
40
+ "cert_evals": {
41
+ "36": 0.5134600400924683,
42
+ "72": 0.3939034044742584,
43
+ "108": 0.3155186176300049,
44
+ "255": 0.17893902957439423
45
+ }
46
+ }
UCI_N4/sdp/runs/acute-inflammation/fold_0/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 6,
3
+ "best_val_acc": 0.75,
4
+ "test_acc": 0.5945945945945946,
5
+ "train_size": 30,
6
+ "val_size": 16,
7
+ "test_size": 74,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.029776199999999933,
12
+ 0.05815319999999998,
13
+ 0.03366299999999992,
14
+ -0.07041613333333337,
15
+ 0.0829954666666666,
16
+ 0.3029878333333334
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 1.046299339147563,
22
+ 1.028676385077134,
23
+ 0.9895473157792913,
24
+ 1.0179845925601472,
25
+ 0.9937462864656396,
26
+ 1.0009348864350793
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.1621621698141098,
38
+ "72": 0.0,
39
+ "108": 0.0,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-inflammation/fold_1/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 4,
3
+ "best_val_acc": 0.7222222222222222,
4
+ "test_acc": 0.6805555555555556,
5
+ "train_size": 30,
6
+ "val_size": 18,
7
+ "test_size": 72,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.2066000000000002,
12
+ 0.2132320000000001,
13
+ 0.16832333333333327,
14
+ -6.666666666858371e-07,
15
+ 0.08299546666666664,
16
+ -0.033663
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 1.073465583913181,
22
+ 1.0965727109827237,
23
+ 0.9521923485684088,
24
+ 0.9958250796083059,
25
+ 0.9937462864656397,
26
+ 0.9895473157792911
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.5138888955116272,
38
+ "72": 0.2638888955116272,
39
+ "108": 0.0694444477558136,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-inflammation/fold_2/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 29,
3
+ "best_val_acc": 0.75,
4
+ "test_acc": 0.9142857142857143,
5
+ "train_size": 30,
6
+ "val_size": 20,
7
+ "test_size": 70,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.06825569999999999,
12
+ -0.09692560000000008,
13
+ 0.10099316666666662,
14
+ 0.07041479999999994,
15
+ -0.11619693333333347,
16
+ 0.16832750000000007
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 0.9390286569686838,
22
+ 0.9304728,
23
+ 0.9733809278809981,
24
+ 0.9680526182869189,
25
+ 0.9870693041144554,
26
+ 1.0099525000000003
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.699999988079071,
38
+ "72": 0.6714285612106323,
39
+ "108": 0.5714285969734192,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-inflammation/fold_3/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 22,
3
+ "best_val_acc": 0.9523809523809523,
4
+ "test_acc": 0.8985507246376812,
5
+ "train_size": 30,
6
+ "val_size": 21,
7
+ "test_size": 69,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.061842666666666594,
12
+ -0.01938619999999999,
13
+ -0.03366716666666666,
14
+ -0.14083160000000008,
15
+ -0.049799466666666695,
16
+ -0.3029836666666666
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 0.9526045937382531,
22
+ 0.9838646893399317,
23
+ 1.000934886435079,
24
+ 1.0348917799997448,
25
+ 0.9937462864656396,
26
+ 0.8932355996217098
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.6811594367027283,
38
+ "72": 0.2753623127937317,
39
+ "108": 0.14492753148078918,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-nephritis/fold_0/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 20,
3
+ "best_val_acc": 1.0,
4
+ "test_acc": 0.8767123287671232,
5
+ "train_size": 30,
6
+ "val_size": 17,
7
+ "test_size": 73,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.1415510333333333,
12
+ 0.21323200000000003,
13
+ -0.03366716666666671,
14
+ -6.666666667154431e-07,
15
+ 0.2821878666666666,
16
+ -0.1683233333333333
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 1.0909027516263303,
22
+ 1.0965727109827237,
23
+ 1.0009348864350789,
24
+ 0.9958250796083059,
25
+ 0.9598970403996372,
26
+ 0.9521923485684088
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.6849315166473389,
38
+ "72": 0.42465752363204956,
39
+ "108": 0.232876718044281,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-nephritis/fold_1/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 29,
3
+ "best_val_acc": 0.9285714285714286,
4
+ "test_acc": 0.881578947368421,
5
+ "train_size": 30,
6
+ "val_size": 14,
7
+ "test_size": 76,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.012368109999999948,
12
+ -0.0969256,
13
+ 0.10099316666666665,
14
+ -0.21124706666666673,
15
+ -0.11619693333333339,
16
+ -0.033662999999999985
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 0.9970611705313925,
22
+ 0.9304727999999999,
23
+ 0.9733809278809981,
24
+ 1.0468011683411809,
25
+ 0.9870693041144555,
26
+ 0.9895473157792911
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.5394737124443054,
38
+ "72": 0.44736841320991516,
39
+ "108": 0.10526315867900848,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-nephritis/fold_2/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 12,
3
+ "best_val_acc": 1.0,
4
+ "test_acc": 1.0,
5
+ "train_size": 30,
6
+ "val_size": 11,
7
+ "test_size": 79,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.03252466666666676,
12
+ 0.05815320000000001,
13
+ -0.10099733333333338,
14
+ -6.666666667154431e-07,
15
+ 0.1493929333333332,
16
+ -0.033662999999999985
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 0.9744119491152714,
22
+ 1.0286763850771339,
23
+ 1.0077056618442157,
24
+ 0.9958250796083059,
25
+ 0.9870693041144553,
26
+ 0.9895473157792911
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.6962025761604309,
38
+ "72": 0.5316455960273743,
39
+ "108": 0.2278481125831604,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-nephritis/fold_3/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 49,
3
+ "best_val_acc": 0.8421052631578947,
4
+ "test_acc": 0.9295774647887324,
5
+ "train_size": 30,
6
+ "val_size": 19,
7
+ "test_size": 71,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.029776590000000006,
12
+ -0.01938619999999999,
13
+ -0.10099733333333341,
14
+ -6.666666667080416e-07,
15
+ 0.01659799999999996,
16
+ -0.10099316666666663
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 1.0535901730675965,
22
+ 0.9838646893399317,
23
+ 1.0077056618442157,
24
+ 0.9958250796083058,
25
+ 0.995962,
26
+ 0.9733809278809978
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.6478872895240784,
38
+ "72": 0.577464759349823,
39
+ "108": 0.2957746386528015,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/adult/fold_0/result.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 4,
3
+ "best_val_acc": 0.8133191100274306,
4
+ "test_acc": 0.8112619716142928,
5
+ "train_size": 16281,
6
+ "val_size": 6562,
7
+ "test_size": 25999,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 5.755174894932247e-09,
12
+ -1.5212824565593372e-07,
13
+ 1.9344708602300844e-08,
14
+ -5.868804126934776e-07,
15
+ 4.3847429484189405e-07,
16
+ -1.2794054493469234e-07,
17
+ -3.0931760979923667e-08,
18
+ 1.2424912468644162e-06,
19
+ 2.0428720567267194e-07,
20
+ -1.2898470607021481e-06,
21
+ 5.428255022845695e-07,
22
+ 2.9734045846837646e-07,
23
+ 9.031386283659057e-08,
24
+ 2.0421350090431894e-07
25
+ ]
26
+ ],
27
+ "std": [
28
+ [
29
+ 0.999969279768083,
30
+ 0.9999691631254963,
31
+ 0.9999692601356567,
32
+ 0.9999684455490998,
33
+ 0.9999701766278255,
34
+ 0.9999695789931851,
35
+ 0.9999697101647755,
36
+ 0.9999695985584383,
37
+ 0.9999687129297181,
38
+ 0.999967689659048,
39
+ 0.9999708394490064,
40
+ 0.9999690163307019,
41
+ 0.9999694763882633,
42
+ 0.9999692067843523
43
+ ]
44
+ ]
45
+ },
46
+ "width": 64,
47
+ "in_features": 14,
48
+ "out_features": 2,
49
+ "depth": 4,
50
+ "padding": 28,
51
+ "parameters": 7738,
52
+ "cert_evals": {
53
+ "36": 0.7494903802871704,
54
+ "72": 0.6914111971855164,
55
+ "108": 0.6325628161430359,
56
+ "255": 0.38409170508384705
57
+ }
58
+ }
UCI_N4/sdp/runs/adult/fold_1/result.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 3,
3
+ "best_val_acc": 0.8076100244498777,
4
+ "test_acc": 0.8065880001537457,
5
+ "train_size": 16281,
6
+ "val_size": 6544,
7
+ "test_size": 26017,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 5.755174894932247e-09,
12
+ -1.5212824565593372e-07,
13
+ 1.9344708602300844e-08,
14
+ -5.868804126934776e-07,
15
+ 4.3847429484189405e-07,
16
+ -1.2794054493469234e-07,
17
+ -3.0931760979923667e-08,
18
+ 1.2424912468644162e-06,
19
+ 2.0428720567267194e-07,
20
+ -1.2898470607021481e-06,
21
+ 5.428255022845695e-07,
22
+ 2.9734045846837646e-07,
23
+ 9.031386283659057e-08,
24
+ 2.0421350090431894e-07
25
+ ]
26
+ ],
27
+ "std": [
28
+ [
29
+ 0.999969279768083,
30
+ 0.9999691631254963,
31
+ 0.9999692601356567,
32
+ 0.9999684455490998,
33
+ 0.9999701766278255,
34
+ 0.9999695789931851,
35
+ 0.9999697101647755,
36
+ 0.9999695985584383,
37
+ 0.9999687129297181,
38
+ 0.999967689659048,
39
+ 0.9999708394490064,
40
+ 0.9999690163307019,
41
+ 0.9999694763882633,
42
+ 0.9999692067843523
43
+ ]
44
+ ]
45
+ },
46
+ "width": 64,
47
+ "in_features": 14,
48
+ "out_features": 2,
49
+ "depth": 4,
50
+ "padding": 28,
51
+ "parameters": 7738,
52
+ "cert_evals": {
53
+ "36": 0.7445900440216064,
54
+ "72": 0.6839374303817749,
55
+ "108": 0.6224391460418701,
56
+ "255": 0.36464619636535645
57
+ }
58
+ }
UCI_N4/sdp/runs/adult/fold_2/result.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 2,
3
+ "best_val_acc": 0.804847923421337,
4
+ "test_acc": 0.8083116086489802,
5
+ "train_size": 16281,
6
+ "val_size": 6477,
7
+ "test_size": 26084,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 5.755174894932247e-09,
12
+ -1.5212824565593372e-07,
13
+ 1.9344708602300844e-08,
14
+ -5.868804126934776e-07,
15
+ 4.3847429484189405e-07,
16
+ -1.2794054493469234e-07,
17
+ -3.0931760979923667e-08,
18
+ 1.2424912468644162e-06,
19
+ 2.0428720567267194e-07,
20
+ -1.2898470607021481e-06,
21
+ 5.428255022845695e-07,
22
+ 2.9734045846837646e-07,
23
+ 9.031386283659057e-08,
24
+ 2.0421350090431894e-07
25
+ ]
26
+ ],
27
+ "std": [
28
+ [
29
+ 0.999969279768083,
30
+ 0.9999691631254963,
31
+ 0.9999692601356567,
32
+ 0.9999684455490998,
33
+ 0.9999701766278255,
34
+ 0.9999695789931851,
35
+ 0.9999697101647755,
36
+ 0.9999695985584383,
37
+ 0.9999687129297181,
38
+ 0.999967689659048,
39
+ 0.9999708394490064,
40
+ 0.9999690163307019,
41
+ 0.9999694763882633,
42
+ 0.9999692067843523
43
+ ]
44
+ ]
45
+ },
46
+ "width": 64,
47
+ "in_features": 14,
48
+ "out_features": 2,
49
+ "depth": 4,
50
+ "padding": 28,
51
+ "parameters": 7738,
52
+ "cert_evals": {
53
+ "36": 0.7493482828140259,
54
+ "72": 0.6899248957633972,
55
+ "108": 0.6268210411071777,
56
+ "255": 0.36359456181526184
57
+ }
58
+ }
UCI_N4/sdp/runs/adult/fold_3/result.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 7,
3
+ "best_val_acc": 0.8011200242167398,
4
+ "test_acc": 0.8089311859443631,
5
+ "train_size": 16281,
6
+ "val_size": 6607,
7
+ "test_size": 25954,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 5.755174894932247e-09,
12
+ -1.5212824565593372e-07,
13
+ 1.9344708602300844e-08,
14
+ -5.868804126934776e-07,
15
+ 4.3847429484189405e-07,
16
+ -1.2794054493469234e-07,
17
+ -3.0931760979923667e-08,
18
+ 1.2424912468644162e-06,
19
+ 2.0428720567267194e-07,
20
+ -1.2898470607021481e-06,
21
+ 5.428255022845695e-07,
22
+ 2.9734045846837646e-07,
23
+ 9.031386283659057e-08,
24
+ 2.0421350090431894e-07
25
+ ]
26
+ ],
27
+ "std": [
28
+ [
29
+ 0.999969279768083,
30
+ 0.9999691631254963,
31
+ 0.9999692601356567,
32
+ 0.9999684455490998,
33
+ 0.9999701766278255,
34
+ 0.9999695789931851,
35
+ 0.9999697101647755,
36
+ 0.9999695985584383,
37
+ 0.9999687129297181,
38
+ 0.999967689659048,
39
+ 0.9999708394490064,
40
+ 0.9999690163307019,
41
+ 0.9999694763882633,
42
+ 0.9999692067843523
43
+ ]
44
+ ]
45
+ },
46
+ "width": 64,
47
+ "in_features": 14,
48
+ "out_features": 2,
49
+ "depth": 4,
50
+ "padding": 28,
51
+ "parameters": 7738,
52
+ "cert_evals": {
53
+ "36": 0.7547969222068787,
54
+ "72": 0.6956538558006287,
55
+ "108": 0.6332356929779053,
56
+ "255": 0.38209909200668335
57
+ }
58
+ }
UCI_N4/sdp/runs/annealing/fold_0/result.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 39,
3
+ "best_val_acc": 0.8154761904761905,
4
+ "test_acc": 0.7746031746031746,
5
+ "train_size": 100,
6
+ "val_size": 168,
7
+ "test_size": 630,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.07222222999999978,
12
+ -0.345,
13
+ 4.33,
14
+ 12.0,
15
+ 0.14,
16
+ -0.17333315999999985,
17
+ -0.07800000000000064,
18
+ 29.2,
19
+ 0.09999999999999996,
20
+ -0.010000000000000224,
21
+ 0.3,
22
+ -0.010000000000000111,
23
+ -4.132729999999996e-16,
24
+ -0.11000000000000007,
25
+ -0.11999999999999993,
26
+ -0.12999999999999998,
27
+ -0.13,
28
+ -0.029999999999999773,
29
+ -1.847940000000002e-16,
30
+ -0.05999999999999975,
31
+ -1.626729999999999e-16,
32
+ -0.03999999999999998,
33
+ -0.010000000000000222,
34
+ -0.06000000000000002,
35
+ 0.1,
36
+ 1.3318299999999998,
37
+ 771.9469999999998,
38
+ 1183.75,
39
+ 0.009999999999999986,
40
+ -0.9466666699999999,
41
+ -1.5582099999999978e-17
42
+ ]
43
+ ],
44
+ "std": [
45
+ [
46
+ 0.27504207913753365,
47
+ 0.41800119617053744,
48
+ 14.650634798533474,
49
+ 25.758493744782516,
50
+ 0.34698703145794935,
51
+ 0.2133331200000003,
52
+ 0.2543933961407015,
53
+ 110.08796482813175,
54
+ 0.29999999999999993,
55
+ 0.09949874371066192,
56
+ 0.47958315233127174,
57
+ 0.06557438524301994,
58
+ 1.0,
59
+ 0.31288975694324034,
60
+ 0.32496153618543855,
61
+ 0.3363034344160047,
62
+ 0.3363034344160045,
63
+ 0.17058722109231966,
64
+ 1.0,
65
+ 0.23748684174075815,
66
+ 1.0,
67
+ 0.19595917942265428,
68
+ 0.09949874371066192,
69
+ 0.2374868417407582,
70
+ 0.9949874371066199,
71
+ 0.9335979547428329,
72
+ 410.1759096911958,
73
+ 1742.0412703205398,
74
+ 0.09949874371066196,
75
+ 0.2436755226844934,
76
+ 1.0
77
+ ]
78
+ ]
79
+ },
80
+ "width": 128,
81
+ "in_features": 31,
82
+ "out_features": 5,
83
+ "depth": 4,
84
+ "padding": 62,
85
+ "parameters": 33083,
86
+ "cert_evals": {
87
+ "36": 0.7571428418159485,
88
+ "72": 0.7428571581840515,
89
+ "108": 0.699999988079071,
90
+ "255": 0.5873016119003296
91
+ }
92
+ }
UCI_N4/sdp/runs/annealing/fold_1/result.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 58,
3
+ "best_val_acc": 0.8136645962732919,
4
+ "test_acc": 0.7551020408163265,
5
+ "train_size": 100,
6
+ "val_size": 161,
7
+ "test_size": 637,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.07222222999999978,
12
+ -0.345,
13
+ 4.33,
14
+ 12.0,
15
+ 0.14,
16
+ -0.17333315999999985,
17
+ -0.07800000000000064,
18
+ 29.2,
19
+ 0.09999999999999996,
20
+ -0.010000000000000224,
21
+ 0.3,
22
+ -0.010000000000000111,
23
+ -4.132729999999996e-16,
24
+ -0.11000000000000007,
25
+ -0.11999999999999993,
26
+ -0.12999999999999998,
27
+ -0.13,
28
+ -0.029999999999999773,
29
+ -1.847940000000002e-16,
30
+ -0.05999999999999975,
31
+ -1.626729999999999e-16,
32
+ -0.03999999999999998,
33
+ -0.010000000000000222,
34
+ -0.06000000000000002,
35
+ 0.1,
36
+ 1.3318299999999998,
37
+ 771.9469999999998,
38
+ 1183.75,
39
+ 0.009999999999999986,
40
+ -0.9466666699999999,
41
+ -1.5582099999999978e-17
42
+ ]
43
+ ],
44
+ "std": [
45
+ [
46
+ 0.27504207913753365,
47
+ 0.41800119617053744,
48
+ 14.650634798533474,
49
+ 25.758493744782516,
50
+ 0.34698703145794935,
51
+ 0.2133331200000003,
52
+ 0.2543933961407015,
53
+ 110.08796482813175,
54
+ 0.29999999999999993,
55
+ 0.09949874371066192,
56
+ 0.47958315233127174,
57
+ 0.06557438524301994,
58
+ 1.0,
59
+ 0.31288975694324034,
60
+ 0.32496153618543855,
61
+ 0.3363034344160047,
62
+ 0.3363034344160045,
63
+ 0.17058722109231966,
64
+ 1.0,
65
+ 0.23748684174075815,
66
+ 1.0,
67
+ 0.19595917942265428,
68
+ 0.09949874371066192,
69
+ 0.2374868417407582,
70
+ 0.9949874371066199,
71
+ 0.9335979547428329,
72
+ 410.1759096911958,
73
+ 1742.0412703205398,
74
+ 0.09949874371066196,
75
+ 0.2436755226844934,
76
+ 1.0
77
+ ]
78
+ ]
79
+ },
80
+ "width": 128,
81
+ "in_features": 31,
82
+ "out_features": 5,
83
+ "depth": 4,
84
+ "padding": 62,
85
+ "parameters": 33083,
86
+ "cert_evals": {
87
+ "36": 0.6954474449157715,
88
+ "72": 0.6734694242477417,
89
+ "108": 0.6389325261116028,
90
+ "255": 0.5196232199668884
91
+ }
92
+ }
UCI_N4/sdp/runs/annealing/fold_2/result.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 62,
3
+ "best_val_acc": 0.7309941520467836,
4
+ "test_acc": 0.7400318979266348,
5
+ "train_size": 100,
6
+ "val_size": 171,
7
+ "test_size": 627,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.07222222999999978,
12
+ -0.345,
13
+ 4.33,
14
+ 12.0,
15
+ 0.14,
16
+ -0.17333315999999985,
17
+ -0.07800000000000064,
18
+ 29.2,
19
+ 0.09999999999999996,
20
+ -0.010000000000000224,
21
+ 0.3,
22
+ -0.010000000000000111,
23
+ -4.132729999999996e-16,
24
+ -0.11000000000000007,
25
+ -0.11999999999999993,
26
+ -0.12999999999999998,
27
+ -0.13,
28
+ -0.029999999999999773,
29
+ -1.847940000000002e-16,
30
+ -0.05999999999999975,
31
+ -1.626729999999999e-16,
32
+ -0.03999999999999998,
33
+ -0.010000000000000222,
34
+ -0.06000000000000002,
35
+ 0.1,
36
+ 1.3318299999999998,
37
+ 771.9469999999998,
38
+ 1183.75,
39
+ 0.009999999999999986,
40
+ -0.9466666699999999,
41
+ -1.5582099999999978e-17
42
+ ]
43
+ ],
44
+ "std": [
45
+ [
46
+ 0.27504207913753365,
47
+ 0.41800119617053744,
48
+ 14.650634798533474,
49
+ 25.758493744782516,
50
+ 0.34698703145794935,
51
+ 0.2133331200000003,
52
+ 0.2543933961407015,
53
+ 110.08796482813175,
54
+ 0.29999999999999993,
55
+ 0.09949874371066192,
56
+ 0.47958315233127174,
57
+ 0.06557438524301994,
58
+ 1.0,
59
+ 0.31288975694324034,
60
+ 0.32496153618543855,
61
+ 0.3363034344160047,
62
+ 0.3363034344160045,
63
+ 0.17058722109231966,
64
+ 1.0,
65
+ 0.23748684174075815,
66
+ 1.0,
67
+ 0.19595917942265428,
68
+ 0.09949874371066192,
69
+ 0.2374868417407582,
70
+ 0.9949874371066199,
71
+ 0.9335979547428329,
72
+ 410.1759096911958,
73
+ 1742.0412703205398,
74
+ 0.09949874371066196,
75
+ 0.2436755226844934,
76
+ 1.0
77
+ ]
78
+ ]
79
+ },
80
+ "width": 128,
81
+ "in_features": 31,
82
+ "out_features": 5,
83
+ "depth": 4,
84
+ "padding": 62,
85
+ "parameters": 33083,
86
+ "cert_evals": {
87
+ "36": 0.6762360334396362,
88
+ "72": 0.6539074778556824,
89
+ "108": 0.6299840211868286,
90
+ "255": 0.5390749573707581
91
+ }
92
+ }
UCI_N4/sdp/runs/annealing/fold_3/result.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 58,
3
+ "best_val_acc": 0.7245508982035929,
4
+ "test_acc": 0.7321711568938193,
5
+ "train_size": 100,
6
+ "val_size": 167,
7
+ "test_size": 631,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.07222222999999978,
12
+ -0.345,
13
+ 4.33,
14
+ 12.0,
15
+ 0.14,
16
+ -0.17333315999999985,
17
+ -0.07800000000000064,
18
+ 29.2,
19
+ 0.09999999999999996,
20
+ -0.010000000000000224,
21
+ 0.3,
22
+ -0.010000000000000111,
23
+ -4.132729999999996e-16,
24
+ -0.11000000000000007,
25
+ -0.11999999999999993,
26
+ -0.12999999999999998,
27
+ -0.13,
28
+ -0.029999999999999773,
29
+ -1.847940000000002e-16,
30
+ -0.05999999999999975,
31
+ -1.626729999999999e-16,
32
+ -0.03999999999999998,
33
+ -0.010000000000000222,
34
+ -0.06000000000000002,
35
+ 0.1,
36
+ 1.3318299999999998,
37
+ 771.9469999999998,
38
+ 1183.75,
39
+ 0.009999999999999986,
40
+ -0.9466666699999999,
41
+ -1.5582099999999978e-17
42
+ ]
43
+ ],
44
+ "std": [
45
+ [
46
+ 0.27504207913753365,
47
+ 0.41800119617053744,
48
+ 14.650634798533474,
49
+ 25.758493744782516,
50
+ 0.34698703145794935,
51
+ 0.2133331200000003,
52
+ 0.2543933961407015,
53
+ 110.08796482813175,
54
+ 0.29999999999999993,
55
+ 0.09949874371066192,
56
+ 0.47958315233127174,
57
+ 0.06557438524301994,
58
+ 1.0,
59
+ 0.31288975694324034,
60
+ 0.32496153618543855,
61
+ 0.3363034344160047,
62
+ 0.3363034344160045,
63
+ 0.17058722109231966,
64
+ 1.0,
65
+ 0.23748684174075815,
66
+ 1.0,
67
+ 0.19595917942265428,
68
+ 0.09949874371066192,
69
+ 0.2374868417407582,
70
+ 0.9949874371066199,
71
+ 0.9335979547428329,
72
+ 410.1759096911958,
73
+ 1742.0412703205398,
74
+ 0.09949874371066196,
75
+ 0.2436755226844934,
76
+ 1.0
77
+ ]
78
+ ]
79
+ },
80
+ "width": 128,
81
+ "in_features": 31,
82
+ "out_features": 5,
83
+ "depth": 4,
84
+ "padding": 62,
85
+ "parameters": 33083,
86
+ "cert_evals": {
87
+ "36": 0.7115689516067505,
88
+ "72": 0.673534095287323,
89
+ "108": 0.6402536034584045,
90
+ "255": 0.5182250738143921
91
+ }
92
+ }
UCI_N4/sdp/runs/arrhythmia/fold_0/result.json ADDED
@@ -0,0 +1,554 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 25,
3
+ "best_val_acc": 0.5949367088607594,
4
+ "test_acc": 0.5538461538461539,
5
+ "train_size": 113,
6
+ "val_size": 79,
7
+ "test_size": 260,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.05548900442477873,
12
+ 0.17327679646017674,
13
+ -0.09933938283185836,
14
+ -0.022536060176991165,
15
+ -0.05529378318584072,
16
+ -0.02827017327433631,
17
+ -0.005964132743362813,
18
+ 0.04588333831858407,
19
+ -0.06835887191150443,
20
+ -0.01879734327433625,
21
+ 0.08708691123893805,
22
+ -0.010227719469026567,
23
+ -0.05324860619469024,
24
+ 0.03857876283185871,
25
+ -0.0029412946902654486,
26
+ -0.14624673451327397,
27
+ 0.0106677238938053,
28
+ -0.09994685221238946,
29
+ -2.2654867242673962e-07,
30
+ -0.10041930088495568,
31
+ 0.14110856637168184,
32
+ -0.02112876106194691,
33
+ -0.021128761061946916,
34
+ -0.06659289999999989,
35
+ -0.06659289999999989,
36
+ -0.09438650000000005,
37
+ -0.024449619469026587,
38
+ -0.006156723893805307,
39
+ -0.03655609734513271,
40
+ -0.06008078761061956,
41
+ -0.05587280000000011,
42
+ -0.1535461769911505,
43
+ -2.9203539835147346e-07,
44
+ 0.1454482212389377,
45
+ -0.04703600000000003,
46
+ -0.06659289999999989,
47
+ 0.0665928778761063,
48
+ -0.053692424778761245,
49
+ 0.10382045292035355,
50
+ -0.045959752212389356,
51
+ -0.039423744247787586,
52
+ -0.042264867256637376,
53
+ -0.0339906548672566,
54
+ -0.10218601769911498,
55
+ -0.04703600000000003,
56
+ 0.04783872566371683,
57
+ 0.14110856637168165,
58
+ -2.920353982139237e-07,
59
+ -0.1056450000000003,
60
+ -0.06659289999999989,
61
+ 0.039230692920353964,
62
+ -0.048857433628318604,
63
+ -0.0949235044247789,
64
+ -0.0951867699115044,
65
+ -0.04703600000000003,
66
+ -0.07884043362831854,
67
+ -0.021128761061946947,
68
+ 0.0665928778761063,
69
+ 0.0665928778761063,
70
+ 0.06659287787610634,
71
+ 0.0665928778761063,
72
+ 1.0619469034296467e-07,
73
+ -0.14459542477876128,
74
+ 0.10166875221238943,
75
+ -0.0007696849557522316,
76
+ 0.08089214159292042,
77
+ 0.024555884070796462,
78
+ -0.06704164601769926,
79
+ -0.04703600000000003,
80
+ 0.1411085663716821,
81
+ 0.02721671504424786,
82
+ -0.04703600000000003,
83
+ 0.008643274336283235,
84
+ -0.03328283893805306,
85
+ -0.08280126353982296,
86
+ -0.04353061946902624,
87
+ 0.022193132743362702,
88
+ -0.07879264601769921,
89
+ 0.06659287787610634,
90
+ 0.07170867256637195,
91
+ 0.1411085663716824,
92
+ -0.04703600000000003,
93
+ 0.14110856637168173,
94
+ -0.05805589380530971,
95
+ 0.08516874884955755,
96
+ 0.043014315044247776,
97
+ -0.002110141592920556,
98
+ -0.07482919999999994,
99
+ 0.027698871681415955,
100
+ -0.08165009999999992,
101
+ -0.0536924247787612,
102
+ 1.0619469030955972e-07,
103
+ -0.09438650000000005,
104
+ 0.06338747787610613,
105
+ -0.0901489026548673,
106
+ -0.04849817699115047,
107
+ 0.07722033628318585,
108
+ 0.026260424778761074,
109
+ 0.0738569911504426,
110
+ 0.04712901946902665,
111
+ 0.16431531858407084,
112
+ 0.09438671238938037,
113
+ 0.09438671238938054,
114
+ -0.0386190796460177,
115
+ -0.09438650000000005,
116
+ 1.0619469029580476e-07,
117
+ 0.06704106194690244,
118
+ 0.00271023008849546,
119
+ 0.04821953097345133,
120
+ -0.022629159292035374,
121
+ 0.24075912389380558,
122
+ 0.19588278672566428,
123
+ 0.10636762831858415,
124
+ 0.07170867256637167,
125
+ 0.0665928778761063,
126
+ -0.08165009999999992,
127
+ 1.0619469029580476e-07,
128
+ 0.24495034513274322,
129
+ -0.02112876106194717,
130
+ -0.03837423008849555,
131
+ 0.0792644690265486,
132
+ -0.010963192920353986,
133
+ -0.13985853097345086,
134
+ -0.06118739999999991,
135
+ -0.05918213274336283,
136
+ -0.06659289999999989,
137
+ 0.19309768141592948,
138
+ 0.0665928778761063,
139
+ -2.920353984064934e-07,
140
+ -0.08791879646017699,
141
+ -0.009588667256637163,
142
+ 0.039876742477876134,
143
+ -0.04371391504424787,
144
+ -0.09472733274336269,
145
+ -0.08165009999999992,
146
+ -0.04703600000000003,
147
+ -0.08165009999999992,
148
+ -0.059833336283185844,
149
+ -0.07838458407079653,
150
+ -0.015475274336283125,
151
+ -0.0805356,
152
+ -0.13698139380530983,
153
+ 0.14110856637168137,
154
+ -0.04703600000000003,
155
+ 0.0665928778761063,
156
+ -0.021128761061947016,
157
+ 0.017010241592920368,
158
+ 0.09822180530973434,
159
+ 0.005761375398230098,
160
+ 0.0322361946902655,
161
+ -0.034939104424778704,
162
+ 0.06566965486725665,
163
+ 0.061632838053097376,
164
+ 0.0004023300884955741,
165
+ 0.07045262681415927,
166
+ 0.028733457522123865,
167
+ 0.02147898230088495,
168
+ -0.05026543539823011,
169
+ 0.060225181415929224,
170
+ -0.07029714159292026,
171
+ 0.06618380000000008,
172
+ 0.011594984955752213,
173
+ 0.040387401769911555,
174
+ -0.0058615916814159065,
175
+ 0.04742410654867257,
176
+ -0.015766054867256643,
177
+ -0.062290848053097175,
178
+ -0.05214830601769914,
179
+ 0.04644970973451337,
180
+ -0.05739616814159293,
181
+ 0.05439313274336291,
182
+ -0.0036409858407079588,
183
+ -0.009598277876106183,
184
+ -0.011235967256637188,
185
+ -0.002634908849557516,
186
+ -0.005508535398230053,
187
+ -0.05590965752212387,
188
+ -0.06772527787610619,
189
+ 0.08251315044247781,
190
+ -0.08976234513274321,
191
+ 0.04703600000000003,
192
+ -0.04274165486725669,
193
+ -0.05909215752212393,
194
+ 0.027935999115044265,
195
+ -0.036451818017699096,
196
+ 0.03197787610619467,
197
+ 0.1596792035398229,
198
+ 0.0024668168141592844,
199
+ -0.015842806194690306,
200
+ 0.07878208849557493,
201
+ 0.006463776548672604,
202
+ 0.06462291946902653,
203
+ 0.025483634513274327,
204
+ 0.06707996637168136,
205
+ -0.07861038619469025,
206
+ -0.0949829097345134,
207
+ -0.08679084778761066,
208
+ 0.09411216159292037,
209
+ -0.061483929203539976,
210
+ -0.03750280353982299,
211
+ 0.024982454867256657,
212
+ 0.010920844247787605,
213
+ -0.036973680442477924,
214
+ -0.00325765690265486,
215
+ -0.06706977168141595,
216
+ 0.054682415929203546,
217
+ 0.07233616902654867,
218
+ 0.024967183185840673,
219
+ 0.0201886814159292,
220
+ 0.0625599000000001,
221
+ 0.016163015929203547,
222
+ -0.19404511061946894,
223
+ 0.1314095771681416,
224
+ -0.02607840336283184,
225
+ -0.07232390353982299,
226
+ 0.06542182300884967,
227
+ 0.09097714132743363,
228
+ -0.0490932584955752,
229
+ 0.17395115044247766,
230
+ -0.08915754336283198,
231
+ 0.005843493805309704,
232
+ -0.1311985026548673,
233
+ 0.0822022767256637,
234
+ -0.0316962311504425,
235
+ -0.15503262123893807,
236
+ 0.050416203539823005,
237
+ 0.012278147787610633,
238
+ 0.0764223432743363,
239
+ 0.20117684424778776,
240
+ -0.15312840973451328,
241
+ -0.006850403539823016,
242
+ -0.22191862300884949,
243
+ 0.1207021007964602,
244
+ -0.08917110283185833,
245
+ -0.07690047646017703,
246
+ 0.030319972566371638,
247
+ -0.1126870734513274,
248
+ 0.06241866831858403,
249
+ -0.1273596991150443,
250
+ 0.06213639999999999,
251
+ -0.07254762831858405,
252
+ -0.08504349999999997,
253
+ 0.034207636283185856,
254
+ -0.02238689532743362,
255
+ 0.10946240796460185,
256
+ 0.021622823008849552,
257
+ -0.1487953611504425,
258
+ 0.02685327893805308,
259
+ -0.04490421946902649,
260
+ -0.04955592035398229,
261
+ 0.06734868938053096,
262
+ -0.08363668734513273,
263
+ 0.022693176017699095,
264
+ 0.09933861353982294,
265
+ -0.00604589380530972,
266
+ -0.10963647433628322,
267
+ 0.03259297079646029,
268
+ -0.07945840000000003,
269
+ -0.007002541592920362,
270
+ 0.10658185398230094,
271
+ -0.0866022876106194,
272
+ 0.06365430106194689
273
+ ]
274
+ ],
275
+ "std": [
276
+ [
277
+ 0.9732374444872444,
278
+ 0.9655808459932996,
279
+ 0.2507734231833244,
280
+ 0.85756632700396,
281
+ 0.9152499916483915,
282
+ 0.9319460220789437,
283
+ 0.9577523305438101,
284
+ 1.1527478213503135,
285
+ 0.9576681124104236,
286
+ 1.0097636409421697,
287
+ 0.9939501739346246,
288
+ 0.8077223719814682,
289
+ 0.9956881527950738,
290
+ 1.065832253077651,
291
+ 0.8648866626310105,
292
+ 0.7884428876814543,
293
+ 0.8846283104978594,
294
+ 1.0392968702844574,
295
+ 0.9547571784517959,
296
+ 0.830419971626617,
297
+ 1.9911349325902201,
298
+ 0.8944357999064113,
299
+ 0.8944357999064099,
300
+ 1.0,
301
+ 1.0,
302
+ 1.0,
303
+ 1.0288388455432311,
304
+ 1.0366372636701484,
305
+ 1.0104922342254585,
306
+ 0.6029602666961917,
307
+ 1.0,
308
+ 0.9119059418676891,
309
+ 0.9988936769842922,
310
+ 1.3401171108416883,
311
+ 1.0,
312
+ 1.0,
313
+ 1.409505785723462,
314
+ 0.7576328500006007,
315
+ 1.1142082921935355,
316
+ 1.100915710823559,
317
+ 0.9521761840451372,
318
+ 0.8352521125885086,
319
+ 0.7194469320515606,
320
+ 0.9886952789548065,
321
+ 1.0,
322
+ 1.111662684055426,
323
+ 1.9911349325902201,
324
+ 0.9988936769842919,
325
+ 1.0,
326
+ 1.0,
327
+ 0.9092993788613446,
328
+ 1.061138924056677,
329
+ 0.8860454459362529,
330
+ 0.77869888137794,
331
+ 1.0,
332
+ 0.9971658374137916,
333
+ 0.8944357999064098,
334
+ 1.4095057857234619,
335
+ 1.409505785723463,
336
+ 1.4095057857234636,
337
+ 1.4095057857234625,
338
+ 0.9988939483461562,
339
+ 0.8359429042688657,
340
+ 0.9455652546275832,
341
+ 1.047159553008427,
342
+ 1.2373317065584502,
343
+ 0.9367499049873408,
344
+ 0.7094990007768702,
345
+ 1.0,
346
+ 1.9911349325902201,
347
+ 1.152138074538977,
348
+ 1.0,
349
+ 1.076296523650441,
350
+ 1.0790204523971971,
351
+ 0.9278040585020654,
352
+ 0.6623289850929874,
353
+ 1.0736843273720698,
354
+ 1.059187675645061,
355
+ 1.4095057857234636,
356
+ 1.1978616378928757,
357
+ 1.9911349325902201,
358
+ 1.0,
359
+ 1.9911349325902201,
360
+ 0.9142231440920847,
361
+ 1.3486308966826843,
362
+ 0.9779239267203217,
363
+ 1.072217573812213,
364
+ 1.0,
365
+ 1.0670736267417575,
366
+ 1.0,
367
+ 0.7576328500006009,
368
+ 0.9988939483461562,
369
+ 1.0,
370
+ 1.2592635987036094,
371
+ 0.6360290623787335,
372
+ 0.8549033709264361,
373
+ 1.300841714365119,
374
+ 0.979322007928904,
375
+ 1.2296324368044147,
376
+ 1.3300447893255654,
377
+ 1.2339107860310472,
378
+ 1.4063287585864288,
379
+ 1.4063287585864277,
380
+ 0.817419899167048,
381
+ 1.0,
382
+ 0.9988939483461566,
383
+ 1.2178666747421332,
384
+ 0.9179155627028488,
385
+ 1.1674686384124506,
386
+ 0.937597875841375,
387
+ 1.9128860722576218,
388
+ 1.9849443701676805,
389
+ 1.2128492302504466,
390
+ 1.1978616378928766,
391
+ 1.409505785723462,
392
+ 1.0,
393
+ 0.9988939483461566,
394
+ 1.9776639067090993,
395
+ 0.8944357999064088,
396
+ 0.9089427774812973,
397
+ 1.1565813541259533,
398
+ 0.9312031818896745,
399
+ 0.37790291497240225,
400
+ 1.0,
401
+ 1.0103067336455187,
402
+ 1.0,
403
+ 1.612796005825811,
404
+ 1.4095057857234625,
405
+ 0.9988936769842919,
406
+ 0.9869575017654069,
407
+ 1.0625408223089012,
408
+ 0.8572543250334869,
409
+ 0.4626232154331089,
410
+ 0.8399894436428749,
411
+ 1.0,
412
+ 1.0,
413
+ 1.0,
414
+ 0.9949165069017805,
415
+ 0.9763809111647539,
416
+ 0.9886383527662114,
417
+ 1.0,
418
+ 0.8853802248708618,
419
+ 1.9911349325902201,
420
+ 1.0,
421
+ 1.4095057857234612,
422
+ 0.8944357999064094,
423
+ 0.8545082434186259,
424
+ 0.8796291945635648,
425
+ 0.9389113833926183,
426
+ 0.8861374760427413,
427
+ 0.39441056751713705,
428
+ 0.8648668783726172,
429
+ 0.9862191391833568,
430
+ 0.8481954658017612,
431
+ 0.9206020572467216,
432
+ 0.886517128434336,
433
+ 1.0192902215038742,
434
+ 0.956622629021229,
435
+ 0.8523688961466389,
436
+ 0.2992587051477164,
437
+ 1.0,
438
+ 0.8898404778961094,
439
+ 1.0071877733497892,
440
+ 0.950155747946548,
441
+ 1.0050918229648342,
442
+ 0.7815635141616576,
443
+ 0.9972744785704897,
444
+ 0.9594844360499902,
445
+ 0.9255046483391078,
446
+ 0.4876909595587591,
447
+ 0.5036861467715275,
448
+ 0.8566188861170654,
449
+ 0.7638467720219689,
450
+ 1.0032544884403838,
451
+ 1.0560420525550518,
452
+ 0.8986819691295396,
453
+ 0.9372189161919664,
454
+ 0.8101867430665612,
455
+ 0.8950623205358443,
456
+ 0.7725356624236849,
457
+ 1.0,
458
+ 0.872460731649835,
459
+ 1.045597205130584,
460
+ 0.881115812189619,
461
+ 0.9553256168269835,
462
+ 0.8848742890899297,
463
+ 0.5907365616618244,
464
+ 0.9525692591339604,
465
+ 0.9761188977078773,
466
+ 1.2163938242844157,
467
+ 0.9319895550002153,
468
+ 0.8335462617896103,
469
+ 0.9176414735582966,
470
+ 0.9775951517497435,
471
+ 0.8425042883529639,
472
+ 1.2598848541968266,
473
+ 0.949252647471748,
474
+ 0.838972165335258,
475
+ 0.23456841787874302,
476
+ 1.1642248030770597,
477
+ 0.8628119131177865,
478
+ 0.8751618803772816,
479
+ 0.9228296916565395,
480
+ 0.9809394578124714,
481
+ 0.5915262659968897,
482
+ 0.8563703331027254,
483
+ 1.223677024967222,
484
+ 0.9284798655045788,
485
+ 1.2965375076317172,
486
+ 1.0,
487
+ 0.9389878405072626,
488
+ 0.8540110671890598,
489
+ 1.316521539927867,
490
+ 1.4340416104694482,
491
+ 0.8735072262525767,
492
+ 0.676363014728904,
493
+ 1.1134658692256694,
494
+ 1.0134545560863548,
495
+ 1.7552329970203224,
496
+ 1.7155564074285294,
497
+ 0.873049365917997,
498
+ 1.030474558081803,
499
+ 1.0170344415415917,
500
+ 1.0766146909852692,
501
+ 0.7111765255105056,
502
+ 0.6923440560955865,
503
+ 1.0058025631570486,
504
+ 0.9240158601820535,
505
+ 1.9435205267323648,
506
+ 1.9899491083438348,
507
+ 0.8387690283436754,
508
+ 0.9708565551581373,
509
+ 0.8493149601758292,
510
+ 0.985055690803851,
511
+ 0.8279931417986857,
512
+ 0.9098729896957297,
513
+ 0.9370725829078755,
514
+ 0.8393620512490872,
515
+ 0.28080206241297245,
516
+ 1.0,
517
+ 0.8220194136548338,
518
+ 0.9761698379739507,
519
+ 0.7917031329595748,
520
+ 0.9270879739715543,
521
+ 0.847139011361557,
522
+ 1.0122054789755355,
523
+ 0.9745187015121873,
524
+ 0.8548335912371546,
525
+ 0.16972156566241,
526
+ 0.8245729285934237,
527
+ 1.06901211839648,
528
+ 0.8750748380574906,
529
+ 1.0605384058291198,
530
+ 0.814622435544981,
531
+ 1.1662691506968674,
532
+ 1.0027045465050628,
533
+ 0.707221379699125,
534
+ 1.0,
535
+ 0.8738904193642293,
536
+ 1.0307627522011051,
537
+ 0.9112504790758761,
538
+ 1.0340966211802813
539
+ ]
540
+ ]
541
+ },
542
+ "width": 512,
543
+ "in_features": 262,
544
+ "out_features": 13,
545
+ "depth": 4,
546
+ "padding": 524,
547
+ "parameters": 1084073,
548
+ "cert_evals": {
549
+ "36": 0.4923076927661896,
550
+ "72": 0.4384615421295166,
551
+ "108": 0.3769230842590332,
552
+ "255": 0.2153846174478531
553
+ }
554
+ }
UCI_N4/sdp/runs/arrhythmia/fold_1/result.json ADDED
@@ -0,0 +1,554 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 13,
3
+ "best_val_acc": 0.5263157894736842,
4
+ "test_acc": 0.4858156028368794,
5
+ "train_size": 113,
6
+ "val_size": 57,
7
+ "test_size": 282,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.08236052831858409,
12
+ 0.04887446902654869,
13
+ 0.0825547600000001,
14
+ 0.07080902389380533,
15
+ 0.06969351327433632,
16
+ -0.02017880672566372,
17
+ 0.0033134920353982203,
18
+ -0.0904622607964602,
19
+ 0.0008566455575221136,
20
+ 0.05502761778761062,
21
+ 0.0029605046017698983,
22
+ 0.16618478141592918,
23
+ 0.10348846991150445,
24
+ -0.12880789292035386,
25
+ 0.001393306194690269,
26
+ -0.009972053097345045,
27
+ -0.13480514867256632,
28
+ 0.15853807787610613,
29
+ -0.022554120353982243,
30
+ -0.17088875221238942,
31
+ -0.04703600000000003,
32
+ -0.02112876106194702,
33
+ 0.14790371681415893,
34
+ 0.0665928778761063,
35
+ 0.0665928778761063,
36
+ 0.09438671238938028,
37
+ -0.033913831858407135,
38
+ -0.05746374070796462,
39
+ 0.020589044247787618,
40
+ -0.08296883185840712,
41
+ -0.016433217699115002,
42
+ -0.02482472566371683,
43
+ -0.13408300000000029,
44
+ -0.0661125929203539,
45
+ 0.14110856637168206,
46
+ 0.19977865575221251,
47
+ 0.06659287787610634,
48
+ 0.16107630088495584,
49
+ -0.04968823575221234,
50
+ 0.16085886725663703,
51
+ -0.040819525663716834,
52
+ -0.04226484955752222,
53
+ 0.03399069026548677,
54
+ 0.08868894690265484,
55
+ 0.14110856637168143,
56
+ 0.1435154159292037,
57
+ -0.04703600000000003,
58
+ -2.920353984457933e-07,
59
+ -0.02112876106194691,
60
+ 0.1997786557522125,
61
+ -0.14194291681415921,
62
+ 0.11196102831858407,
63
+ 0.0592675752212388,
64
+ 0.09347194690265491,
65
+ -0.04703600000000003,
66
+ 0.13773737168141595,
67
+ -0.1056450000000003,
68
+ -0.06659289999999989,
69
+ 0.0665928778761063,
70
+ -0.06659289999999989,
71
+ 0.0665928778761063,
72
+ 0.09438671238938029,
73
+ -0.09931298230088502,
74
+ -0.11574543716814155,
75
+ 0.19007244637168158,
76
+ 0.006741415929203616,
77
+ -0.17417296814159283,
78
+ -2.920353982846636e-07,
79
+ -0.04703600000000003,
80
+ -0.04703600000000003,
81
+ 0.027216715044247736,
82
+ 0.14110856637168231,
83
+ -0.00288054867256639,
84
+ 0.04904841858407081,
85
+ 0.02098572858407086,
86
+ -0.1192364601769909,
87
+ -0.0031704955752213143,
88
+ 0.01358514159292034,
89
+ -0.06659289999999989,
90
+ 0.014341504424779012,
91
+ -0.04703600000000003,
92
+ -0.04703600000000003,
93
+ -0.04703600000000003,
94
+ 0.07784732743362836,
95
+ 0.10888657327433629,
96
+ -0.1186584123893806,
97
+ -0.02180679646017706,
98
+ -0.07482919999999994,
99
+ 0.08863622212389385,
100
+ 0.13608353008849555,
101
+ 0.08948672566371674,
102
+ 1.0619469028597977e-07,
103
+ -0.09438650000000005,
104
+ -0.02112876106194696,
105
+ 0.09014838938053121,
106
+ -0.048498132743362864,
107
+ 0.05329288938053096,
108
+ 0.07878135752212394,
109
+ 0.006330884955752202,
110
+ 0.04712901946902665,
111
+ 0.11292442477876118,
112
+ -0.09438650000000005,
113
+ 0.09438671238938054,
114
+ -0.03861907964601756,
115
+ 1.0619469029580476e-07,
116
+ -0.09438650000000005,
117
+ 0.06704106194690229,
118
+ -0.07101396460177,
119
+ 0.11338092035398238,
120
+ 0.022629575221239016,
121
+ 0.15994504424778788,
122
+ 0.039176644247788044,
123
+ 0.11334270796460184,
124
+ -0.100392831858407,
125
+ 0.0665928778761063,
126
+ -0.08165009999999992,
127
+ 1.0619469028597977e-07,
128
+ 0.027216715044247736,
129
+ -0.0211287610619469,
130
+ 0.007675044247787407,
131
+ 0.017898353982300903,
132
+ 0.022447520353982425,
133
+ -0.10415006194690236,
134
+ -0.06118739999999991,
135
+ -0.031867106194690256,
136
+ 0.0665928778761063,
137
+ 0.0386198407079645,
138
+ -0.06659289999999989,
139
+ 0.06704106194690229,
140
+ 0.03697516814159319,
141
+ -0.044993100884955714,
142
+ -0.005112693362831841,
143
+ -0.08742769999999993,
144
+ -0.04059785840707965,
145
+ 0.027216715044247736,
146
+ 0.1411085663716819,
147
+ 0.13608353008849491,
148
+ 0.03589945132743362,
149
+ -0.0453806460176991,
150
+ 0.003572176991150533,
151
+ 0.05211161769911493,
152
+ -0.012922732743362846,
153
+ 0.1411085663716814,
154
+ -0.04703600000000003,
155
+ 0.1997786557522125,
156
+ 0.14790371681415954,
157
+ 0.14316932831858414,
158
+ 0.03571657522123903,
159
+ -0.10441322884955753,
160
+ -0.23222040176991168,
161
+ -0.03493910442477871,
162
+ 0.05546864601769913,
163
+ 0.12581869469026555,
164
+ -0.18030577079646018,
165
+ -0.07161228646017702,
166
+ -0.03718444513274338,
167
+ 0.013523787610619589,
168
+ 0.10059417451327425,
169
+ 0.01624747876106193,
170
+ 0.05021323893805318,
171
+ -0.05147623362831883,
172
+ 0.1827229362831858,
173
+ 0.0034618557522124397,
174
+ 0.05241511327433623,
175
+ 0.030558143362831823,
176
+ -0.19202160176991148,
177
+ 0.11133997495575228,
178
+ 0.12129543628318586,
179
+ 0.060097776106194795,
180
+ 0.11579815929203502,
181
+ -0.027196398230088462,
182
+ 0.17599128230088495,
183
+ -0.1195051539823009,
184
+ 0.18247482389380532,
185
+ 0.06219380353982303,
186
+ -0.09025506017699113,
187
+ 0.08350311504424779,
188
+ 0.1271729522123894,
189
+ -0.0951591353982304,
190
+ 0.10388311504424796,
191
+ 0.04703600000000003,
192
+ -0.14397143362831855,
193
+ -0.056712807079646044,
194
+ 0.11911974769911506,
195
+ 0.07255731355752211,
196
+ 0.17956833628318594,
197
+ 0.03657456283185836,
198
+ -0.12767188938053103,
199
+ -0.21526490619469008,
200
+ 0.019409734513274046,
201
+ -0.20038580796460184,
202
+ 0.13453505858407078,
203
+ -0.20150050008849554,
204
+ -0.10956924336283183,
205
+ -0.1755137388495575,
206
+ 0.07771356637168146,
207
+ 0.1258815132743363,
208
+ 0.05789021663716825,
209
+ 0.059674265486725525,
210
+ 0.04250356814159293,
211
+ 0.18101372743362842,
212
+ -0.08988732212389382,
213
+ 0.148077411681416,
214
+ 0.041530495575221225,
215
+ -0.07796867964601775,
216
+ -0.08606286725663721,
217
+ 0.216610610619469,
218
+ 0.09511035132743359,
219
+ -0.05938040707964593,
220
+ 0.0625599000000001,
221
+ -0.09312924070796465,
222
+ -0.07196051769911511,
223
+ 0.13021555911504423,
224
+ 0.10358608645132746,
225
+ -0.0039450442477876055,
226
+ 0.015811640707964647,
227
+ 0.042050546725663725,
228
+ -0.11399942584070796,
229
+ 0.01275024778761036,
230
+ -0.012157897345132696,
231
+ -0.07146561415929208,
232
+ -0.03644905008849562,
233
+ -0.0460240963716814,
234
+ -0.04567296300884947,
235
+ -0.0159320159292035,
236
+ -0.020865886725663647,
237
+ 0.006243656991150445,
238
+ -0.04104453495575228,
239
+ 0.04250217699115046,
240
+ 0.034307366371681414,
241
+ -0.11968876460176998,
242
+ -0.0937977030973451,
243
+ -0.007898124601769923,
244
+ -0.06254813724778759,
245
+ 0.027666705132743385,
246
+ -0.0678103380530974,
247
+ 0.0033648314159292177,
248
+ 0.014861656991150381,
249
+ -0.08490639823008855,
250
+ 0.06213639999999999,
251
+ 0.10985744247787621,
252
+ -0.1141806185840708,
253
+ -0.0051085477876106,
254
+ -0.07652198922123891,
255
+ 0.1186390026548673,
256
+ -0.006018964601769793,
257
+ -0.03378361716814159,
258
+ 0.011641800000000063,
259
+ -0.06094139999999994,
260
+ 0.1415026725663717,
261
+ -0.08340849911504429,
262
+ -0.021807159292035423,
263
+ -0.08355237141592924,
264
+ 0.10080485079646004,
265
+ -0.0028213893805309528,
266
+ -0.039560768141592914,
267
+ -0.03811751592920355,
268
+ 0.06180052389380527,
269
+ 0.08721472743362838,
270
+ -0.045456217699115044,
271
+ -0.04452998026548677,
272
+ -0.08741183716814158
273
+ ]
274
+ ],
275
+ "std": [
276
+ [
277
+ 1.0288523625377175,
278
+ 0.9926765498781311,
279
+ 1.5821926864265932,
280
+ 1.2345480341843558,
281
+ 1.0919259987637373,
282
+ 0.8553411989728208,
283
+ 0.9770372253740158,
284
+ 1.0941619685910755,
285
+ 0.9070109264400832,
286
+ 1.1660151450666374,
287
+ 0.82811358045681,
288
+ 0.8585451804478106,
289
+ 0.9271539318095082,
290
+ 0.826139795075132,
291
+ 0.9407871254954377,
292
+ 1.1098127265333941,
293
+ 0.9673996715099642,
294
+ 1.0170784936919917,
295
+ 0.7160692020317576,
296
+ 0.8881539469849713,
297
+ 1.0,
298
+ 0.8944357999064094,
299
+ 1.5353137244867066,
300
+ 1.409505785723462,
301
+ 1.4095057857234625,
302
+ 1.4063287585864295,
303
+ 0.8810006273224485,
304
+ 0.9386543902953636,
305
+ 0.9544080465249254,
306
+ 0.605561339519823,
307
+ 0.41738930632162535,
308
+ 0.9435148318250272,
309
+ 1.0,
310
+ 0.7880462841530468,
311
+ 1.9911349325902201,
312
+ 1.9844233966366362,
313
+ 1.4095057857234636,
314
+ 1.494834216304884,
315
+ 0.8945327921343991,
316
+ 1.0465252306595956,
317
+ 0.9657902518204129,
318
+ 0.8818849232826983,
319
+ 1.01289922968906,
320
+ 0.9542609489006632,
321
+ 1.9911349325902201,
322
+ 1.303101066939662,
323
+ 1.0,
324
+ 0.9988936769842933,
325
+ 0.8944357999064099,
326
+ 1.9844233966366385,
327
+ 0.9721978598866062,
328
+ 0.9751070654641969,
329
+ 1.053405494669145,
330
+ 1.2277188687789828,
331
+ 1.0,
332
+ 0.9710532649972081,
333
+ 1.0,
334
+ 1.0,
335
+ 1.4095057857234625,
336
+ 1.0,
337
+ 1.409505785723463,
338
+ 1.4063287585864295,
339
+ 0.9944538524514821,
340
+ 1.0084398738408038,
341
+ 1.096956593110858,
342
+ 0.9848747659663566,
343
+ 1.0176485758563296,
344
+ 0.9988936769842915,
345
+ 1.0,
346
+ 1.0,
347
+ 1.1521380745389784,
348
+ 1.9911349325902201,
349
+ 0.8886796764360778,
350
+ 1.0626176220464763,
351
+ 0.9820129092696263,
352
+ 0.48071756015968203,
353
+ 0.8052609158630751,
354
+ 0.9014845427415126,
355
+ 1.0,
356
+ 1.0421263616247836,
357
+ 1.0,
358
+ 1.0,
359
+ 1.0,
360
+ 1.0603166366167238,
361
+ 1.3948018100222412,
362
+ 1.0002378777841179,
363
+ 1.0521891063258038,
364
+ 1.0,
365
+ 1.170667828978199,
366
+ 1.6220790112596297,
367
+ 1.3004892166096398,
368
+ 0.9988939483461562,
369
+ 1.0,
370
+ 0.8944357999064098,
371
+ 1.2549059943840741,
372
+ 0.9010506624821365,
373
+ 1.2640911636544077,
374
+ 0.947031285603356,
375
+ 0.991260918816901,
376
+ 1.3300447893255651,
377
+ 1.1497030038124454,
378
+ 1.0,
379
+ 1.4063287585864277,
380
+ 0.8174198991670485,
381
+ 0.9988939483461566,
382
+ 1.0,
383
+ 1.217866674742133,
384
+ 0.8282680988206665,
385
+ 1.073085103116072,
386
+ 0.9693454139903576,
387
+ 1.7234040703162494,
388
+ 1.1056144342459158,
389
+ 1.074119172644369,
390
+ 0.6071170412907283,
391
+ 1.409505785723462,
392
+ 1.0,
393
+ 0.9988939483461562,
394
+ 1.1521380745389787,
395
+ 0.8944357999064119,
396
+ 1.058370875443875,
397
+ 1.0846522644237848,
398
+ 1.0598613115637294,
399
+ 0.5613288969768316,
400
+ 1.0,
401
+ 1.077530223972941,
402
+ 1.4095057857234625,
403
+ 1.15083399388167,
404
+ 1.0,
405
+ 1.2178666747421318,
406
+ 1.0966395583377115,
407
+ 1.0389053330759344,
408
+ 1.0429545495698374,
409
+ 1.0,
410
+ 1.0244696199828591,
411
+ 1.152138074538978,
412
+ 1.9911349325902201,
413
+ 1.6220790112596353,
414
+ 1.1329428844818097,
415
+ 1.0304640926757396,
416
+ 1.0027828154445004,
417
+ 1.4038062005460157,
418
+ 1.0648539403871593,
419
+ 1.9911349325902201,
420
+ 1.0,
421
+ 1.9844233966366391,
422
+ 1.5353137244867094,
423
+ 0.6866407429573802,
424
+ 0.9470876233472572,
425
+ 0.8928451459276403,
426
+ 1.3503062413436946,
427
+ 0.39441056751713693,
428
+ 1.0739060999830787,
429
+ 0.8074286630470415,
430
+ 0.8622816943277237,
431
+ 0.9235511168325403,
432
+ 0.8884646840941383,
433
+ 0.9253177369109523,
434
+ 1.0067482855890655,
435
+ 0.8717444615689396,
436
+ 1.7004798113300974,
437
+ 1.2451967529281143,
438
+ 1.0189016467998342,
439
+ 0.9159576992318523,
440
+ 0.9716842292520014,
441
+ 0.8537203439878127,
442
+ 0.6934639134127168,
443
+ 0.6814900866218891,
444
+ 1.08628728041417,
445
+ 0.8695100152450093,
446
+ 1.7244969164094923,
447
+ 0.9957413253735008,
448
+ 0.886998298843266,
449
+ 1.0086098935045376,
450
+ 0.9474117590718318,
451
+ 0.9527864599550645,
452
+ 0.8622024829086022,
453
+ 0.928715896349544,
454
+ 1.165972778898159,
455
+ 1.1444020655792773,
456
+ 1.249832703644339,
457
+ 1.0,
458
+ 1.04414181114218,
459
+ 0.7888691092407913,
460
+ 0.8896110919230731,
461
+ 0.8385172959457787,
462
+ 0.6963004767756463,
463
+ 1.0524770129026086,
464
+ 0.8728215158868736,
465
+ 1.2422671085343606,
466
+ 1.0395955941659785,
467
+ 0.9729248895409327,
468
+ 0.942112878700215,
469
+ 0.9029124312015971,
470
+ 0.9945356002953412,
471
+ 0.9067257721352653,
472
+ 0.6559269963983796,
473
+ 1.0530222495928638,
474
+ 0.7742650861348659,
475
+ 1.7415209866320729,
476
+ 0.31751695199855035,
477
+ 0.9401556411866103,
478
+ 0.9925662855482592,
479
+ 0.9703437391049544,
480
+ 0.9315271035229352,
481
+ 0.76726349356305,
482
+ 1.113451820498087,
483
+ 1.5950728246019172,
484
+ 0.9108834606609704,
485
+ 0.6187680270209445,
486
+ 1.0,
487
+ 1.026218169309107,
488
+ 0.9226908311101232,
489
+ 1.3695879042350074,
490
+ 1.390915117042367,
491
+ 0.9165066682832561,
492
+ 1.0788295714407763,
493
+ 0.8648263176100378,
494
+ 0.9635758583333331,
495
+ 0.8878642706591297,
496
+ 0.9006687498171835,
497
+ 0.8634669309414519,
498
+ 1.0263681887473621,
499
+ 1.1035216758671196,
500
+ 0.9668823371087334,
501
+ 0.9093839574625667,
502
+ 1.2537251227686863,
503
+ 0.925393016008483,
504
+ 0.9198488449490679,
505
+ 0.9988290268424753,
506
+ 0.1771101235529094,
507
+ 1.05614751420039,
508
+ 0.9497863099739803,
509
+ 1.0994839009481026,
510
+ 0.92792429034674,
511
+ 0.9973731985207415,
512
+ 1.4008749618490997,
513
+ 0.9833759189369512,
514
+ 0.7900467121392818,
515
+ 0.5512800744398914,
516
+ 1.0,
517
+ 1.160435495736531,
518
+ 0.840523823247663,
519
+ 1.0569742675732663,
520
+ 0.8576934466322704,
521
+ 0.9349861286126709,
522
+ 0.8587290535040432,
523
+ 0.9574488028099564,
524
+ 0.8825111948837125,
525
+ 1.0,
526
+ 0.9946462418130932,
527
+ 0.8401625258336195,
528
+ 1.0609041780534152,
529
+ 0.8625411201961046,
530
+ 0.8578849236354916,
531
+ 0.9245113485505083,
532
+ 0.9397104471617286,
533
+ 0.949988633400937,
534
+ 1.4949439323664353,
535
+ 1.0752730715733643,
536
+ 0.854508526946672,
537
+ 1.0304209489391347,
538
+ 0.9286338973772724
539
+ ]
540
+ ]
541
+ },
542
+ "width": 512,
543
+ "in_features": 262,
544
+ "out_features": 13,
545
+ "depth": 4,
546
+ "padding": 524,
547
+ "parameters": 1084073,
548
+ "cert_evals": {
549
+ "36": 0.42198580503463745,
550
+ "72": 0.3333333134651184,
551
+ "108": 0.27304962277412415,
552
+ "255": 0.09219858050346375
553
+ }
554
+ }
UCI_N4/sdp/runs/arrhythmia/fold_2/result.json ADDED
@@ -0,0 +1,554 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 60,
3
+ "best_val_acc": 0.5538461538461539,
4
+ "test_acc": 0.6496350364963503,
5
+ "train_size": 113,
6
+ "val_size": 65,
7
+ "test_size": 274,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.003089986725663709,
12
+ -0.004440814159291977,
13
+ 0.06255539469026555,
14
+ 0.0030673203539822954,
15
+ 0.001728016814159293,
16
+ 0.11026861433628313,
17
+ 0.017892446017699123,
18
+ -0.06960080176991157,
19
+ 0.039233834283185866,
20
+ 0.15144875398230093,
21
+ 0.006497817787610628,
22
+ -0.01399969203539821,
23
+ 0.12535314601769912,
24
+ 0.032636741592920446,
25
+ -0.04566848761061949,
26
+ -0.12298024778761062,
27
+ -0.000969959292035392,
28
+ 0.11890371504424775,
29
+ -0.09021629999999985,
30
+ -0.11451322123893802,
31
+ -0.04703600000000003,
32
+ 0.06338747787610569,
33
+ -0.1056450000000003,
34
+ -0.06659289999999989,
35
+ 0.0665928778761063,
36
+ -0.09438650000000005,
37
+ -0.04968765486725668,
38
+ 0.10877121769911505,
39
+ -0.018068128318584065,
40
+ -0.08296883185840709,
41
+ -0.05587280000000011,
42
+ -0.06895776106194693,
43
+ -2.920353983278935e-07,
44
+ -0.013222389380530894,
45
+ -0.04703600000000003,
46
+ 0.06659287787610632,
47
+ -0.06659289999999989,
48
+ -0.1252820000000002,
49
+ 0.010099320973451271,
50
+ 0.07353538053097344,
51
+ -0.007326469911504469,
52
+ -0.07684545132743385,
53
+ -0.0339906548672566,
54
+ 0.05784047787610613,
55
+ 0.14110856637168143,
56
+ 3.805309734868323e-07,
57
+ -0.04703600000000003,
58
+ -0.06704164601769919,
59
+ -0.02112876106194691,
60
+ -0.06659289999999989,
61
+ 0.15620863893805323,
62
+ -0.03053643008849556,
63
+ -0.18165605309734498,
64
+ -0.11233752212389378,
65
+ -0.04703600000000003,
66
+ -0.016779973451327427,
67
+ -0.021128761061946985,
68
+ -0.06659289999999989,
69
+ 0.0665928778761063,
70
+ -0.06659289999999989,
71
+ -0.06659289999999989,
72
+ -0.09438650000000005,
73
+ -0.00463133628318579,
74
+ -0.07507774690265485,
75
+ -0.0007694676106195044,
76
+ -0.08089127433628311,
77
+ -0.10792991415929203,
78
+ -2.9203539847723323e-07,
79
+ -0.04703600000000003,
80
+ -0.04703600000000003,
81
+ 0.027216715044247893,
82
+ -0.04703600000000003,
83
+ -0.02592799999999999,
84
+ 0.08057962389380531,
85
+ 0.024038425752212503,
86
+ -0.16465999999999992,
87
+ -0.07926050000000014,
88
+ -0.09237758407079648,
89
+ -0.06659289999999989,
90
+ -0.043025663716814114,
91
+ 0.14110856637168245,
92
+ 0.1411085663716826,
93
+ -0.04703600000000003,
94
+ -0.023750336283185847,
95
+ 0.03126479168141594,
96
+ 0.008899934513274312,
97
+ -0.02743449557522126,
98
+ 0.06331698053097352,
99
+ 0.05539779646017699,
100
+ 0.027216715044247736,
101
+ 0.017897150442477798,
102
+ 1.0619469029187476e-07,
103
+ 1.061946903233147e-07,
104
+ -0.02112876106194691,
105
+ -0.1502479999999999,
106
+ -0.016447008849557545,
107
+ -0.0054378495575221125,
108
+ 0.07474130442477876,
109
+ -0.07807693805309734,
110
+ -0.07854839999999999,
111
+ -0.008790955752212368,
112
+ 1.0619469031152472e-07,
113
+ 1.0619469029973474e-07,
114
+ 0.038619840707964564,
115
+ 1.061946903233147e-07,
116
+ 1.0619469035868464e-07,
117
+ -2.920353983829134e-07,
118
+ -0.06884565486725683,
119
+ -0.043006230088495565,
120
+ 0.13900964601769922,
121
+ -0.06902842477876096,
122
+ -0.06529410000000001,
123
+ -0.07149334513274326,
124
+ -0.043025663716814044,
125
+ -0.06659289999999989,
126
+ 0.02721671504424799,
127
+ 1.0619469029187476e-07,
128
+ -0.08165009999999992,
129
+ -0.1056450000000003,
130
+ -0.0844234336283186,
131
+ 0.045172380530973465,
132
+ 0.08091592477876108,
133
+ -0.08034439823008824,
134
+ -0.06118739999999991,
135
+ 0.009105318584070807,
136
+ 0.0665928778761063,
137
+ 0.03861984070796471,
138
+ -0.06659289999999989,
139
+ -2.920353983475435e-07,
140
+ -0.01561157522123892,
141
+ 0.034667146902654884,
142
+ 0.04805644646017698,
143
+ 0.07649909380531038,
144
+ 0.0778107902654868,
145
+ -0.08165009999999992,
146
+ -0.04703600000000003,
147
+ 0.027216715044247736,
148
+ 0.003988389380530976,
149
+ 0.07484829203539822,
150
+ 0.06071553097345137,
151
+ 0.014212502654867237,
152
+ 0.06978295752212389,
153
+ -0.04703600000000003,
154
+ -0.04703600000000003,
155
+ -0.06659289999999989,
156
+ -0.1056450000000003,
157
+ -0.05670110707964598,
158
+ 0.09375696460176995,
159
+ -0.16628776973451334,
160
+ -0.004178826548672555,
161
+ -0.07220739999999994,
162
+ -0.06694404424778763,
163
+ -0.06819787345132745,
164
+ -0.049705195575221274,
165
+ -0.11667001238938055,
166
+ -0.12676487345132748,
167
+ 0.06602797345132745,
168
+ 0.0027255099115044237,
169
+ 0.08367987168141594,
170
+ -0.07531826548672561,
171
+ 0.06618380000000008,
172
+ -0.05077870088495575,
173
+ -0.03939802035398229,
174
+ 0.0725209725663717,
175
+ 0.018818907079646008,
176
+ -0.0012129309734513318,
177
+ 0.08232463584070795,
178
+ 0.06279675221238941,
179
+ 0.05451436991150446,
180
+ -0.09364632743362859,
181
+ -0.013597840707964663,
182
+ -0.02791582300884959,
183
+ 0.02277181946902653,
184
+ 0.09624579256637165,
185
+ 0.10685669557522126,
186
+ 0.05720445840707966,
187
+ -0.11690305221238939,
188
+ -0.07600262831858408,
189
+ 0.20486032743362856,
190
+ -0.11598514159292016,
191
+ 0.04703600000000003,
192
+ 0.12372530088495573,
193
+ 0.07733639557522128,
194
+ 0.009731815840707961,
195
+ 0.06515634630088495,
196
+ -0.004099914159292028,
197
+ -0.062444362831858426,
198
+ -0.14432490088495575,
199
+ 0.010303688495575204,
200
+ -0.03996258407079658,
201
+ -0.01723771946902648,
202
+ -0.03748595911504427,
203
+ -0.09338390796460176,
204
+ -0.12455748761061945,
205
+ -0.07069998663716814,
206
+ 0.09306433097345132,
207
+ 0.05574491150442479,
208
+ 0.05271592371681417,
209
+ -0.10488400000000016,
210
+ 0.0725061,
211
+ -0.06092212743362833,
212
+ -0.021001579646017662,
213
+ 0.08582514876106195,
214
+ 0.05783091212389381,
215
+ 0.07796875840707959,
216
+ -0.0484065486725664,
217
+ -0.06359218141592915,
218
+ 0.12465353274336273,
219
+ -0.03740971681415926,
220
+ -0.006256027433628239,
221
+ 0.02847770973451326,
222
+ 0.03523589380530972,
223
+ -0.007258076106194675,
224
+ 0.029468245840707955,
225
+ 0.07720809823008848,
226
+ -0.029801646017699017,
227
+ -0.07590199938053097,
228
+ -0.0023667877876106243,
229
+ -0.06193052212389384,
230
+ 0.0729473,
231
+ -0.08944441592920359,
232
+ -0.008905622654867247,
233
+ -0.09599750318584069,
234
+ -0.11731536725663715,
235
+ 0.03799221946902657,
236
+ 0.04264000707964609,
237
+ -0.05476776486725663,
238
+ -0.08099349336283189,
239
+ -0.06403644955752204,
240
+ 0.0510427,
241
+ -0.1728837920353984,
242
+ 0.04379192212389381,
243
+ -0.08503633221238939,
244
+ -0.04843164778761059,
245
+ -0.013288855929203541,
246
+ 0.05900416725663712,
247
+ 0.01502987168141596,
248
+ -0.028499033982300897,
249
+ -0.06898648672566376,
250
+ 0.06213639999999999,
251
+ -0.020727761061946872,
252
+ 0.056635334513274314,
253
+ -0.009026141592920364,
254
+ 0.03156841769911506,
255
+ -0.12126076106194686,
256
+ 0.06353122123893817,
257
+ 0.031937667522123854,
258
+ 0.029336698938053133,
259
+ 0.12508993982300817,
260
+ -0.07582650442477877,
261
+ 0.006734969026548675,
262
+ 0.06509837044247789,
263
+ 0.03657155663716816,
264
+ -0.13086254787610632,
265
+ -0.01249529203539823,
266
+ 0.041217141592920364,
267
+ 0.050712616814159305,
268
+ 0.008828665486725618,
269
+ -0.04774530973451326,
270
+ -0.06531424955752214,
271
+ 0.08627439557522125,
272
+ 0.019008834867256633
273
+ ]
274
+ ],
275
+ "std": [
276
+ [
277
+ 0.9244692810470073,
278
+ 0.9993356910018533,
279
+ 1.1547522998507793,
280
+ 0.9432810092169331,
281
+ 1.03584004279498,
282
+ 0.8753158130277445,
283
+ 1.0465755215467378,
284
+ 0.9102607240673849,
285
+ 1.023778543447583,
286
+ 0.9297280045159075,
287
+ 1.0069835198754635,
288
+ 0.9525566546794436,
289
+ 0.9399759480360307,
290
+ 0.9978150756585966,
291
+ 0.9862811329995884,
292
+ 0.9613244275752023,
293
+ 1.111865207612389,
294
+ 0.9715796850385696,
295
+ 1.0,
296
+ 1.0813226579822182,
297
+ 1.0,
298
+ 1.2592635987036094,
299
+ 1.0,
300
+ 1.0,
301
+ 1.4095057857234625,
302
+ 1.0,
303
+ 1.010538238524329,
304
+ 1.0722512669094082,
305
+ 1.0593646908068974,
306
+ 0.605561339519823,
307
+ 1.0,
308
+ 0.9556792785074675,
309
+ 0.9988936769842924,
310
+ 0.9607982608538026,
311
+ 1.0,
312
+ 1.4095057857234632,
313
+ 1.0,
314
+ 1.0,
315
+ 0.972373648410722,
316
+ 1.0584533172538098,
317
+ 1.0284056325027326,
318
+ 0.8751294762374062,
319
+ 0.7194469320515607,
320
+ 0.9753483226530357,
321
+ 1.9911349325902201,
322
+ 0.99889397212978,
323
+ 1.0,
324
+ 0.7094990007768706,
325
+ 0.8944357999064104,
326
+ 1.0,
327
+ 0.9004941973725803,
328
+ 1.0121581074927941,
329
+ 0.761525664661198,
330
+ 0.6638398438080123,
331
+ 1.0,
332
+ 1.0084273596642825,
333
+ 0.8944357999064123,
334
+ 1.0,
335
+ 1.4095057857234632,
336
+ 1.0,
337
+ 1.0,
338
+ 1.0,
339
+ 1.0674172345021198,
340
+ 1.0415595393603108,
341
+ 0.9952640371583976,
342
+ 0.7847375185646767,
343
+ 1.0253922671299165,
344
+ 0.9988936769842935,
345
+ 1.0,
346
+ 1.0,
347
+ 1.1521380745389769,
348
+ 1.0,
349
+ 0.9380600926852771,
350
+ 0.9688329579782285,
351
+ 1.0699750013871834,
352
+ 1.0,
353
+ 1.0,
354
+ 0.9022130416875166,
355
+ 1.0,
356
+ 0.8547515543653855,
357
+ 1.9911349325902201,
358
+ 1.9911349325902201,
359
+ 1.0,
360
+ 0.9833161542151768,
361
+ 0.9113836368578456,
362
+ 1.0154070458101938,
363
+ 0.8175726795277899,
364
+ 1.0291658658053822,
365
+ 1.0023879541161114,
366
+ 1.1521380745389784,
367
+ 1.0666606471785436,
368
+ 0.9988939483461562,
369
+ 0.9988939483461564,
370
+ 0.8944357999064111,
371
+ 1.0,
372
+ 1.0194849042181624,
373
+ 0.9377289254070391,
374
+ 0.9868393622488469,
375
+ 0.7115324821514019,
376
+ 1.0,
377
+ 0.9291878599599749,
378
+ 0.9988939483461571,
379
+ 0.9988939483461564,
380
+ 1.150833993881672,
381
+ 0.9988939483461564,
382
+ 0.9988939483461563,
383
+ 0.9988936769842928,
384
+ 0.8446756150368765,
385
+ 0.8840822390425243,
386
+ 0.879273891482901,
387
+ 0.356357040154056,
388
+ 1.0,
389
+ 0.8575361470050674,
390
+ 0.8547515543653872,
391
+ 1.0,
392
+ 1.1521380745389762,
393
+ 0.9988939483461562,
394
+ 1.0,
395
+ 1.0,
396
+ 0.7707096318942795,
397
+ 0.9479029615796615,
398
+ 0.8861435214681488,
399
+ 0.709392406059319,
400
+ 1.0,
401
+ 0.9648083778490988,
402
+ 1.4095057857234619,
403
+ 1.1508339938816696,
404
+ 1.0,
405
+ 0.9988936769842918,
406
+ 0.8265732991714976,
407
+ 1.0190844405952648,
408
+ 0.9459831021380053,
409
+ 1.7348381185160544,
410
+ 1.1517740759366022,
411
+ 1.0,
412
+ 1.0,
413
+ 1.152138074538978,
414
+ 0.912843060712004,
415
+ 1.1388119070973806,
416
+ 0.9915799039109703,
417
+ 1.002719667279991,
418
+ 1.085125621845705,
419
+ 1.0,
420
+ 1.0,
421
+ 1.0,
422
+ 1.0,
423
+ 1.5001714286910226,
424
+ 0.9966194693620798,
425
+ 0.9443805992812078,
426
+ 0.8655175815339226,
427
+ 1.0,
428
+ 0.7897012658620092,
429
+ 1.1164175335449071,
430
+ 1.264530190302258,
431
+ 0.8921583865445091,
432
+ 1.0648052330194941,
433
+ 0.8695758038727032,
434
+ 0.8660581580725691,
435
+ 0.8367831000825393,
436
+ 0.37197924168302665,
437
+ 1.0,
438
+ 0.9262178979224102,
439
+ 0.9242646117464632,
440
+ 0.973591105652927,
441
+ 0.9951600891998066,
442
+ 1.1111862475284577,
443
+ 0.6670563380647561,
444
+ 0.9442962334551489,
445
+ 0.990332316811185,
446
+ 0.480719441273429,
447
+ 1.223234975369157,
448
+ 0.940394811395897,
449
+ 0.9089632031900003,
450
+ 1.0458338698053655,
451
+ 0.9721165818563446,
452
+ 1.374767108546496,
453
+ 0.8594004341053223,
454
+ 0.7653673558229712,
455
+ 0.6670525311692612,
456
+ 0.645642563256581,
457
+ 1.0,
458
+ 0.891254315503885,
459
+ 1.0775980834755503,
460
+ 1.007431548670928,
461
+ 0.9530753484316439,
462
+ 1.4811962251096449,
463
+ 1.2176806384389702,
464
+ 0.9602107117788192,
465
+ 0.8795846242039457,
466
+ 1.1116750216535782,
467
+ 0.9501349187678776,
468
+ 1.0821885258200035,
469
+ 1.1407026156836266,
470
+ 0.9231893015164008,
471
+ 0.8990327480493145,
472
+ 0.6422405879838027,
473
+ 0.9092214790537131,
474
+ 0.9351958368508632,
475
+ 1.0,
476
+ 1.0,
477
+ 0.9288775753611616,
478
+ 0.8531876075690629,
479
+ 1.034017858801366,
480
+ 1.0285706599327553,
481
+ 1.5382840820664052,
482
+ 1.0793433921827003,
483
+ 0.7014984131399681,
484
+ 0.9478974831267535,
485
+ 0.8121083950620509,
486
+ 0.5317226069000799,
487
+ 0.877495299738119,
488
+ 1.105656776922663,
489
+ 0.9679617815757274,
490
+ 0.7155463726091819,
491
+ 1.108302722756925,
492
+ 1.0944778308312668,
493
+ 0.7749616919771513,
494
+ 0.8850563716056123,
495
+ 0.5693811287198752,
496
+ 1.0,
497
+ 0.9220528856937216,
498
+ 0.8553127512283658,
499
+ 0.9975197765961968,
500
+ 0.8796722204092665,
501
+ 1.1740947078133768,
502
+ 0.9516756586234943,
503
+ 0.9063555755946218,
504
+ 0.9537956983823893,
505
+ 0.21590336552059824,
506
+ 1.0,
507
+ 1.1291952185180558,
508
+ 1.0007499385498189,
509
+ 1.0111383561599954,
510
+ 0.9704983147288865,
511
+ 1.1385710361021162,
512
+ 0.7564588026775311,
513
+ 1.0046465692486821,
514
+ 0.9312841189336238,
515
+ 0.6375502285227569,
516
+ 1.0,
517
+ 0.829387189699574,
518
+ 1.0544363475675953,
519
+ 0.9771879250820691,
520
+ 1.0137760206245479,
521
+ 1.0423498864484522,
522
+ 0.43681029699877133,
523
+ 0.8991224001063718,
524
+ 0.8257144621838688,
525
+ 1.968770644943309,
526
+ 0.8856828178067617,
527
+ 1.0398871114616712,
528
+ 0.8345338516516961,
529
+ 0.9722595951185294,
530
+ 1.285772740124495,
531
+ 0.8915167876690523,
532
+ 0.8875667705363124,
533
+ 0.6453390579256484,
534
+ 0.9343424770462008,
535
+ 0.8887305596443167,
536
+ 1.0443061214405034,
537
+ 1.027608228431771,
538
+ 0.9189390661089004
539
+ ]
540
+ ]
541
+ },
542
+ "width": 512,
543
+ "in_features": 262,
544
+ "out_features": 13,
545
+ "depth": 4,
546
+ "padding": 524,
547
+ "parameters": 1084073,
548
+ "cert_evals": {
549
+ "36": 0.6021897792816162,
550
+ "72": 0.5583941340446472,
551
+ "108": 0.49635034799575806,
552
+ "255": 0.3102189898490906
553
+ }
554
+ }
UCI_N4/sdp/runs/arrhythmia/fold_3/result.json ADDED
@@ -0,0 +1,554 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 28,
3
+ "best_val_acc": 0.5373134328358209,
4
+ "test_acc": 0.5992647058823529,
5
+ "train_size": 113,
6
+ "val_size": 67,
7
+ "test_size": 272,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.04070993805309734,
12
+ 0.11996151327433617,
13
+ -0.07505505699115043,
14
+ -0.053473368141592904,
15
+ -0.0023036168141593112,
16
+ -0.04386066761061949,
17
+ 0.1000648973451327,
18
+ 0.21898467610619468,
19
+ 0.0844638663362832,
20
+ -0.21027526176991146,
21
+ 0.08278053309734511,
22
+ 0.02691175840707965,
23
+ -0.10311968407079651,
24
+ -0.019989650442477833,
25
+ -0.029568291150442447,
26
+ 0.06979861946902657,
27
+ -0.09989179115044242,
28
+ -0.0017227557522123856,
29
+ -2.2654867243656462e-07,
30
+ 0.06518417699115044,
31
+ -0.04703600000000003,
32
+ -0.1056450000000003,
33
+ -0.1056450000000003,
34
+ 0.19977865575221251,
35
+ 0.0665928778761063,
36
+ 0.09438671238938035,
37
+ -0.10331811504424784,
38
+ -0.11287559292035391,
39
+ 0.1063068938053097,
40
+ 0.04291548672566383,
41
+ -0.05587280000000011,
42
+ -0.032180318584070916,
43
+ 0.06704106194690261,
44
+ -0.1718930000000004,
45
+ -0.04703600000000003,
46
+ 0.0665928778761063,
47
+ -0.06659289999999989,
48
+ 0.08948672566371665,
49
+ -0.025450121504424723,
50
+ -0.17311484513274336,
51
+ 0.07640526460176993,
52
+ 0.11526853982300869,
53
+ 0.1133023008849558,
54
+ -0.07326554867256642,
55
+ -0.04703600000000003,
56
+ 0.047838725663716816,
57
+ -0.04703600000000003,
58
+ 0.06704106194690251,
59
+ -0.02112876106194691,
60
+ -0.06659289999999989,
61
+ -0.013552253982300916,
62
+ -0.020357922123893812,
63
+ -0.027464973451327517,
64
+ -0.006002522123893788,
65
+ -0.04703600000000003,
66
+ -0.04337743362831858,
67
+ 0.14790371681415934,
68
+ 0.0665928778761063,
69
+ -0.06659289999999989,
70
+ 0.06659287787610634,
71
+ -0.06659289999999989,
72
+ 1.0619469029580476e-07,
73
+ 0.044767823008849614,
74
+ 0.08289923362831852,
75
+ -0.12235442831858409,
76
+ -0.11459614159292028,
77
+ 0.14790476371681416,
78
+ -2.9203539830824354e-07,
79
+ -0.04703600000000003,
80
+ 0.14110856637168223,
81
+ 0.027216715044247736,
82
+ -0.04703600000000003,
83
+ -0.055889752212389385,
84
+ -0.12962760265486717,
85
+ 0.10187851619469035,
86
+ -0.01324823008849549,
87
+ 0.022193132743362702,
88
+ -0.07879260176991155,
89
+ 0.0665928778761063,
90
+ 0.12907584070796485,
91
+ -0.04703600000000003,
92
+ -0.04703600000000003,
93
+ -0.04703600000000003,
94
+ -0.002639044247787606,
95
+ 0.054982569292035384,
96
+ 0.05932991150442477,
97
+ -0.06964141592920373,
98
+ -0.07482919999999994,
99
+ -0.033238396460177,
100
+ 0.13608353008849555,
101
+ 0.0894867256637167,
102
+ -0.09438650000000005,
103
+ -0.09438650000000005,
104
+ -0.1056450000000003,
105
+ 0.030049292035398203,
106
+ 0.0004219557522123656,
107
+ 0.04024157522123887,
108
+ 0.01212035575221241,
109
+ -0.06541580530973452,
110
+ -0.07854839999999999,
111
+ 0.02907596460176992,
112
+ -0.09438650000000005,
113
+ 0.09438671238938048,
114
+ -0.03861907964601766,
115
+ 1.0619469030366473e-07,
116
+ 1.0619469029580476e-07,
117
+ -0.0670416460176993,
118
+ -0.04499362831858416,
119
+ 0.0430065663716814,
120
+ 0.05495734513274337,
121
+ 0.025254761061947018,
122
+ -0.06529410000000001,
123
+ 0.06800543362831867,
124
+ -0.15775999999999976,
125
+ 0.0665928778761063,
126
+ -0.08165009999999992,
127
+ 1.0619469029580476e-07,
128
+ -0.08165009999999992,
129
+ -0.021128761061946954,
130
+ 0.0199548849557522,
131
+ -0.04005870796460183,
132
+ 0.07256339026548671,
133
+ 0.0029753097345135682,
134
+ 0.008741072566371728,
135
+ -0.12291731858407075,
136
+ 0.0665928778761063,
137
+ -0.03861907964601771,
138
+ 0.0665928778761063,
139
+ -2.9203539835933345e-07,
140
+ -0.15365226548672545,
141
+ -0.02139016460176988,
142
+ 0.03374174115044254,
143
+ -0.03278541946902662,
144
+ -0.16577226814159277,
145
+ 0.027216715044247785,
146
+ 0.14110856637168206,
147
+ -0.08165009999999992,
148
+ -0.17471278761061948,
149
+ -0.05009553982300891,
150
+ 0.10357247787610621,
151
+ 0.01421250265486715,
152
+ -0.16799606460176988,
153
+ 0.1411085663716814,
154
+ -0.04703600000000003,
155
+ 0.1997786557522125,
156
+ -0.02112876106194691,
157
+ 0.10064383539823014,
158
+ -0.09822227433628321,
159
+ 0.010812114336283181,
160
+ -0.0005969424778760985,
161
+ -0.034939104424778704,
162
+ -0.021039132743362887,
163
+ 0.1549942769911504,
164
+ -0.05473569823008849,
165
+ 0.09371048247787614,
166
+ 0.1284547699115043,
167
+ 0.08193819469026561,
168
+ -0.1894623433628318,
169
+ -0.03994628938053097,
170
+ 0.005021592920354035,
171
+ 0.06618380000000008,
172
+ 0.046780255752212445,
173
+ 0.12412912743362833,
174
+ -0.15687404504424782,
175
+ -0.04040450761061948,
176
+ 0.01819149026548674,
177
+ 0.047322232477876085,
178
+ -0.1316860601769911,
179
+ -0.08258592566371675,
180
+ 0.05638880530973452,
181
+ -0.10198681415929205,
182
+ 0.1290602176991152,
183
+ -0.03669845398230087,
184
+ -0.10499076469026546,
185
+ -0.12757559911504432,
186
+ -0.06652606637168137,
187
+ 0.05155422566371681,
188
+ 0.031605256637168136,
189
+ 0.0629123805309736,
190
+ 0.023197380530973564,
191
+ 0.04703600000000003,
192
+ -0.03599286283185842,
193
+ -0.1574473318584071,
194
+ 0.10887992823008849,
195
+ -0.053605181415929175,
196
+ -0.012299078761061958,
197
+ -0.05887616991150452,
198
+ 0.07308711769911504,
199
+ 0.09051549646017694,
200
+ -0.10846913274336303,
201
+ -0.15513741725663718,
202
+ 0.12073644318584073,
203
+ 0.05041307504424779,
204
+ 0.1529646697345132,
205
+ 0.0776218637168141,
206
+ 0.057565741592920404,
207
+ -0.17276489823008853,
208
+ -0.014984845840707986,
209
+ -0.04701723008849572,
210
+ -0.03750280353982299,
211
+ 0.06355189203539817,
212
+ 0.06636549999999998,
213
+ -0.1410115592035399,
214
+ -0.08766313362831851,
215
+ -0.09892783274336285,
216
+ -0.013420267079645989,
217
+ 0.09777304070796461,
218
+ 0.07535415840707965,
219
+ -0.10688448672566354,
220
+ 0.0625599000000001,
221
+ -0.011544922123893811,
222
+ -0.09627820707964604,
223
+ 0.08584640530973452,
224
+ 0.007022314424778771,
225
+ -0.05128431504424778,
226
+ -0.06365885663716808,
227
+ 0.02538907345132746,
228
+ 0.071253879380531,
229
+ -0.032786734513274456,
230
+ 0.0729473,
231
+ 0.04719471592920353,
232
+ 0.014598110265486715,
233
+ 0.026159213575221246,
234
+ 0.059101831504424836,
235
+ -0.07843545663716811,
236
+ 0.0003891433628318023,
237
+ 0.014624393274336253,
238
+ 0.03384382522123893,
239
+ -0.07310352920353969,
240
+ 0.0510427,
241
+ 0.14306325132743355,
242
+ -0.011243908849557487,
243
+ 0.02559352380530976,
244
+ 0.03617407230973455,
245
+ -0.012417333274336301,
246
+ -0.10102372743362834,
247
+ -0.09638603628318594,
248
+ 0.02360371292035396,
249
+ -0.0742930973451328,
250
+ -0.014339143362831862,
251
+ 0.03523714159292039,
252
+ 0.03915302300884953,
253
+ -0.08945827723893807,
254
+ -0.02228378656637163,
255
+ 0.10421852477876106,
256
+ 0.0697730088495576,
257
+ -0.12811908238938052,
258
+ -0.10229047238938055,
259
+ -0.048111653097345074,
260
+ 0.041196920353982314,
261
+ 0.10879424867256633,
262
+ -0.10693692778761064,
263
+ 0.02704163566371678,
264
+ 0.12719723849557518,
265
+ 0.1358370884955751,
266
+ -0.11345866194690264,
267
+ -0.11236356814159291,
268
+ 0.008828665486725625,
269
+ 0.04901849557522122,
270
+ 0.10906433185840712,
271
+ -0.12028646725663718,
272
+ 0.005514894867256633
273
+ ]
274
+ ],
275
+ "std": [
276
+ [
277
+ 1.0502669179700934,
278
+ 0.9792224218294541,
279
+ 0.24305352147883325,
280
+ 1.043042266446498,
281
+ 1.0744571502175468,
282
+ 0.9508826739984755,
283
+ 0.9451555552883207,
284
+ 1.1810283789026603,
285
+ 1.0064552702700122,
286
+ 1.1190882010665817,
287
+ 0.9034793296608571,
288
+ 1.1336521923679663,
289
+ 0.9786491101919341,
290
+ 0.9206985848676537,
291
+ 0.8610889538505271,
292
+ 0.9619675032812017,
293
+ 0.9308084274399617,
294
+ 0.9863758024756076,
295
+ 0.9547571784517959,
296
+ 0.9496800506935921,
297
+ 1.0,
298
+ 1.0,
299
+ 1.0,
300
+ 1.9844233966366367,
301
+ 1.4095057857234627,
302
+ 1.40632875858643,
303
+ 0.892002130496044,
304
+ 1.0129634785032875,
305
+ 0.978487303853688,
306
+ 1.1394715296586964,
307
+ 1.0,
308
+ 1.0267988761241287,
309
+ 1.217866674742132,
310
+ 1.0,
311
+ 1.0,
312
+ 1.4095057857234627,
313
+ 1.0,
314
+ 1.30048921660964,
315
+ 1.101075351501756,
316
+ 0.9423320679555461,
317
+ 0.9745566669040967,
318
+ 1.0784150005489006,
319
+ 1.3072548131334407,
320
+ 1.020520797792866,
321
+ 1.0,
322
+ 1.1116626840554256,
323
+ 1.0,
324
+ 1.2178666747421323,
325
+ 0.8944357999064103,
326
+ 1.0,
327
+ 0.9763859814864452,
328
+ 0.9882312110151381,
329
+ 0.9941548135105892,
330
+ 1.0805382570058093,
331
+ 1.0,
332
+ 0.9455390825539804,
333
+ 1.5353137244867092,
334
+ 1.4095057857234619,
335
+ 1.0,
336
+ 1.4095057857234636,
337
+ 1.0,
338
+ 0.9988939483461567,
339
+ 0.9028116049768871,
340
+ 1.0263167291591377,
341
+ 0.9964436627027657,
342
+ 0.4280387316306564,
343
+ 1.0514551909197751,
344
+ 0.9988936769842915,
345
+ 1.0,
346
+ 1.9911349325902201,
347
+ 1.152138074538978,
348
+ 1.0,
349
+ 0.9644113662850948,
350
+ 0.9806946309645141,
351
+ 0.9930268680075975,
352
+ 0.8905664891946655,
353
+ 1.0736843273720693,
354
+ 1.0058668086951204,
355
+ 1.409505785723462,
356
+ 1.3330925209888196,
357
+ 1.0,
358
+ 1.0,
359
+ 1.0,
360
+ 1.0450036005861865,
361
+ 1.3244456183776097,
362
+ 0.932189980942975,
363
+ 0.9625014477361986,
364
+ 1.0,
365
+ 1.0074707737922228,
366
+ 1.62207901125963,
367
+ 1.3004892166096393,
368
+ 1.0,
369
+ 1.0,
370
+ 1.0,
371
+ 1.0917543201475843,
372
+ 1.0127130749629136,
373
+ 1.2877909824303606,
374
+ 0.9604994075919616,
375
+ 0.8657450013263874,
376
+ 1.0,
377
+ 1.0599660091906427,
378
+ 1.0,
379
+ 1.4063287585864277,
380
+ 0.8174198991670479,
381
+ 0.9988939483461567,
382
+ 0.9988939483461567,
383
+ 0.7094990007768708,
384
+ 0.8740833234525124,
385
+ 1.010657132912493,
386
+ 0.9328151962443406,
387
+ 1.3541564903516528,
388
+ 1.0,
389
+ 1.0437864539647888,
390
+ 1.0,
391
+ 1.409505785723462,
392
+ 1.0,
393
+ 0.9988939483461567,
394
+ 1.0,
395
+ 0.8944357999064098,
396
+ 1.2065791134004533,
397
+ 1.0500123468485083,
398
+ 0.9959504427215604,
399
+ 1.0958354145667224,
400
+ 0.7400533918928887,
401
+ 0.9943642075886404,
402
+ 1.4095057857234627,
403
+ 0.8174198991670482,
404
+ 1.4095057857234627,
405
+ 0.9988936769842922,
406
+ 0.9193790839730072,
407
+ 1.0436031910295362,
408
+ 0.9868834993023391,
409
+ 0.5782795414175284,
410
+ 0.9541173647907301,
411
+ 1.1521380745389775,
412
+ 1.9911349325902201,
413
+ 1.0,
414
+ 0.9325216486314452,
415
+ 1.0303184562115624,
416
+ 0.9698188611354921,
417
+ 1.0027196672799903,
418
+ 1.0327882823860284,
419
+ 1.9911349325902201,
420
+ 1.0,
421
+ 1.9844233966366391,
422
+ 0.8944357999064109,
423
+ 0.7112349595162911,
424
+ 1.0528496975740775,
425
+ 0.9693293962135208,
426
+ 1.098217436491506,
427
+ 0.39441056751713705,
428
+ 1.131185111941341,
429
+ 0.8933013668038887,
430
+ 0.8692841653701331,
431
+ 0.9535583303775852,
432
+ 0.9578421783922644,
433
+ 0.9351032690489206,
434
+ 0.9587912379925385,
435
+ 0.8874155629442673,
436
+ 0.7402206710271984,
437
+ 1.0,
438
+ 1.0688089329251667,
439
+ 0.997681462694144,
440
+ 0.9866601266296527,
441
+ 0.9496581319654654,
442
+ 0.9257831061652533,
443
+ 0.9073562336120353,
444
+ 0.9768579353882867,
445
+ 0.9602672008044747,
446
+ 0.7793988687883875,
447
+ 1.2643817992013762,
448
+ 0.8858997832358527,
449
+ 1.0783739453909889,
450
+ 0.9243425987503827,
451
+ 0.9894525958813807,
452
+ 0.8138319611992417,
453
+ 0.9527697944043735,
454
+ 1.1413505837251008,
455
+ 0.8792523651290115,
456
+ 1.0992317647014969,
457
+ 1.0,
458
+ 1.065433498566479,
459
+ 0.9150528093441637,
460
+ 1.0062463574228966,
461
+ 1.011250604668206,
462
+ 0.7913263564369651,
463
+ 0.9735543146496928,
464
+ 0.9610800849612564,
465
+ 0.9880567372837797,
466
+ 0.3866698577857632,
467
+ 0.9853949011817834,
468
+ 0.990227174214131,
469
+ 0.8869793376043191,
470
+ 1.0049463863071384,
471
+ 0.9992217219580515,
472
+ 0.9135057665522096,
473
+ 0.9794517412025064,
474
+ 0.8334338014885702,
475
+ 0.37518500497353446,
476
+ 1.1642248030770597,
477
+ 0.9506854878365382,
478
+ 1.1083600583283926,
479
+ 0.9361744720072924,
480
+ 1.0051395038183164,
481
+ 0.7234663786843327,
482
+ 1.1371317753211319,
483
+ 1.5356103741191347,
484
+ 0.8479920793399001,
485
+ 0.46656712729960265,
486
+ 1.0,
487
+ 1.0891589322731212,
488
+ 0.8545812844441173,
489
+ 1.3469557389840487,
490
+ 1.3298686360213214,
491
+ 0.8184103746992143,
492
+ 1.2426545134673366,
493
+ 0.9345647421429395,
494
+ 0.8739291157345797,
495
+ 0.7954155323258645,
496
+ 1.0,
497
+ 0.9396031266002715,
498
+ 0.8729340873197525,
499
+ 1.1022147706138496,
500
+ 0.9052007430680863,
501
+ 0.8002297286948205,
502
+ 1.1474637082252046,
503
+ 1.0050624674836923,
504
+ 0.8958786752659496,
505
+ 0.1199464140766847,
506
+ 1.0,
507
+ 0.9484606934407114,
508
+ 0.924743989986394,
509
+ 1.1045533858189263,
510
+ 0.9763355497679247,
511
+ 0.8775711016746042,
512
+ 1.4892483405130004,
513
+ 0.9479162196372228,
514
+ 0.824520740664537,
515
+ 0.48200134691826974,
516
+ 0.8093410764663572,
517
+ 1.0307538015892828,
518
+ 0.8557116942728363,
519
+ 0.9675781578595044,
520
+ 0.9316537658305905,
521
+ 0.961482671503125,
522
+ 0.9499524026348503,
523
+ 1.0156281171297905,
524
+ 0.9533815998673338,
525
+ 0.13577727875330386,
526
+ 1.0944930405696027,
527
+ 0.9984202119037168,
528
+ 1.0610893586418122,
529
+ 1.0416564535479678,
530
+ 0.953141207852886,
531
+ 0.9699518518482332,
532
+ 1.0661304370514315,
533
+ 0.9605383246803934,
534
+ 0.9343424770461999,
535
+ 1.1428421085341074,
536
+ 0.9995106529728873,
537
+ 1.0191031224939573,
538
+ 1.0275583030415119
539
+ ]
540
+ ]
541
+ },
542
+ "width": 512,
543
+ "in_features": 262,
544
+ "out_features": 13,
545
+ "depth": 4,
546
+ "padding": 524,
547
+ "parameters": 1084073,
548
+ "cert_evals": {
549
+ "36": 0.49264705181121826,
550
+ "72": 0.43382352590560913,
551
+ "108": 0.38235294818878174,
552
+ "255": 0.16911764442920685
553
+ }
554
+ }
UCI_N4/sdp/runs/audiology-std/fold_0/result.json ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 5,
3
+ "best_val_acc": 0.1935483870967742,
4
+ "test_acc": 0.1,
5
+ "train_size": 25,
6
+ "val_size": 31,
7
+ "test_size": 140,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -1.7763568394002505e-17,
12
+ -8.399999999486596e-07,
13
+ 7.99999999756551e-08,
14
+ -1.2800000001833566e-06,
15
+ -3.6000000007696543e-07,
16
+ -8.799999999986596e-07,
17
+ 0.0,
18
+ 0.0,
19
+ 0.0,
20
+ 0.0,
21
+ 0.0,
22
+ 0.0,
23
+ 0.0,
24
+ 0.0,
25
+ 0.0,
26
+ 0.0,
27
+ -8.000000002006402e-08,
28
+ 7.99999999756551e-08,
29
+ 0.0,
30
+ 0.0,
31
+ 0.0,
32
+ 0.0,
33
+ 7.99999999756551e-08,
34
+ 0.0,
35
+ -3.199999999159431e-07,
36
+ 0.0,
37
+ 0.0,
38
+ 0.0,
39
+ 0.0,
40
+ 0.0,
41
+ 0.0,
42
+ 0.0,
43
+ -3.3306690738754695e-17,
44
+ -3.999999999981796e-07,
45
+ 0.0,
46
+ 7.99999999756551e-08,
47
+ 0.0,
48
+ 0.0,
49
+ 0.0,
50
+ 0.0,
51
+ 0.0,
52
+ 0.0,
53
+ -8.659739592076221e-17,
54
+ 0.0,
55
+ -8.659739592076221e-17,
56
+ 0.0,
57
+ 0.0,
58
+ 0.0,
59
+ -7.199999999940587e-07,
60
+ -4.800000000759752e-07,
61
+ 2.799999999325564e-07,
62
+ 0.0,
63
+ 2.220446049250313e-18,
64
+ 0.0,
65
+ -1.5999999996907377e-07,
66
+ 0.0,
67
+ -4.0000000006479297e-07,
68
+ 0.0,
69
+ 0.0
70
+ ]
71
+ ],
72
+ "std": [
73
+ [
74
+ 0.9797958971132714,
75
+ 0.979795399156076,
76
+ 0.979796007645425,
77
+ 0.9797944438980055,
78
+ 0.979795825808005,
79
+ 0.9797970293219844,
80
+ 1.0,
81
+ 1.0,
82
+ 1.0,
83
+ 1.0,
84
+ 1.0,
85
+ 1.0,
86
+ 1.0,
87
+ 1.0,
88
+ 0.9797958971132714,
89
+ 1.0,
90
+ 0.9797961795409461,
91
+ 0.979796007645425,
92
+ 1.0,
93
+ 1.0,
94
+ 1.0,
95
+ 1.0,
96
+ 0.9797960076454252,
97
+ 1.0,
98
+ 0.9797960772142222,
99
+ 1.0,
100
+ 1.0,
101
+ 1.0,
102
+ 1.0,
103
+ 1.0,
104
+ 1.0,
105
+ 1.0,
106
+ 0.9797958971132711,
107
+ 0.9797952000000001,
108
+ 1.0,
109
+ 0.9797960076454251,
110
+ 1.0,
111
+ 1.0,
112
+ 1.0,
113
+ 1.0,
114
+ 1.0,
115
+ 1.0,
116
+ 0.9797958971132709,
117
+ 1.0,
118
+ 0.9797958971132709,
119
+ 1.0,
120
+ 1.0,
121
+ 1.0,
122
+ 0.9797942770355633,
123
+ 0.9797949007791427,
124
+ 0.9797958854236333,
125
+ 1.0,
126
+ 0.979795897113271,
127
+ 1.0,
128
+ 0.9797957933341287,
129
+ 1.0,
130
+ 0.9797952,
131
+ 1.0,
132
+ 1.0
133
+ ]
134
+ ]
135
+ },
136
+ "width": 256,
137
+ "in_features": 59,
138
+ "out_features": 18,
139
+ "depth": 4,
140
+ "padding": 118,
141
+ "parameters": 125022,
142
+ "cert_evals": {
143
+ "36": 0.05000000074505806,
144
+ "72": 0.0071428571827709675,
145
+ "108": 0.0,
146
+ "255": 0.0
147
+ }
148
+ }
UCI_N4/sdp/runs/audiology-std/fold_1/result.json ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 31,
3
+ "best_val_acc": 0.5151515151515151,
4
+ "test_acc": 0.3188405797101449,
5
+ "train_size": 25,
6
+ "val_size": 33,
7
+ "test_size": 138,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -1.7763568394002505e-17,
12
+ -8.399999999486596e-07,
13
+ 7.99999999756551e-08,
14
+ -1.2800000001833566e-06,
15
+ -3.6000000007696543e-07,
16
+ -8.799999999986596e-07,
17
+ 0.0,
18
+ 0.0,
19
+ 0.0,
20
+ 0.0,
21
+ 0.0,
22
+ 0.0,
23
+ 0.0,
24
+ 0.0,
25
+ 0.0,
26
+ 0.0,
27
+ -8.000000002006402e-08,
28
+ 7.99999999756551e-08,
29
+ 0.0,
30
+ 0.0,
31
+ 0.0,
32
+ 0.0,
33
+ 7.99999999756551e-08,
34
+ 0.0,
35
+ -3.199999999159431e-07,
36
+ 0.0,
37
+ 0.0,
38
+ 0.0,
39
+ 0.0,
40
+ 0.0,
41
+ 0.0,
42
+ 0.0,
43
+ -3.3306690738754695e-17,
44
+ -3.999999999981796e-07,
45
+ 0.0,
46
+ 7.99999999756551e-08,
47
+ 0.0,
48
+ 0.0,
49
+ 0.0,
50
+ 0.0,
51
+ 0.0,
52
+ 0.0,
53
+ -8.659739592076221e-17,
54
+ 0.0,
55
+ -8.659739592076221e-17,
56
+ 0.0,
57
+ 0.0,
58
+ 0.0,
59
+ -7.199999999940587e-07,
60
+ -4.800000000759752e-07,
61
+ 2.799999999325564e-07,
62
+ 0.0,
63
+ 2.220446049250313e-18,
64
+ 0.0,
65
+ -1.5999999996907377e-07,
66
+ 0.0,
67
+ -4.0000000006479297e-07,
68
+ 0.0,
69
+ 0.0
70
+ ]
71
+ ],
72
+ "std": [
73
+ [
74
+ 0.9797958971132714,
75
+ 0.979795399156076,
76
+ 0.979796007645425,
77
+ 0.9797944438980055,
78
+ 0.979795825808005,
79
+ 0.9797970293219844,
80
+ 1.0,
81
+ 1.0,
82
+ 1.0,
83
+ 1.0,
84
+ 1.0,
85
+ 1.0,
86
+ 1.0,
87
+ 1.0,
88
+ 0.9797958971132714,
89
+ 1.0,
90
+ 0.9797961795409461,
91
+ 0.979796007645425,
92
+ 1.0,
93
+ 1.0,
94
+ 1.0,
95
+ 1.0,
96
+ 0.9797960076454252,
97
+ 1.0,
98
+ 0.9797960772142222,
99
+ 1.0,
100
+ 1.0,
101
+ 1.0,
102
+ 1.0,
103
+ 1.0,
104
+ 1.0,
105
+ 1.0,
106
+ 0.9797958971132711,
107
+ 0.9797952000000001,
108
+ 1.0,
109
+ 0.9797960076454251,
110
+ 1.0,
111
+ 1.0,
112
+ 1.0,
113
+ 1.0,
114
+ 1.0,
115
+ 1.0,
116
+ 0.9797958971132709,
117
+ 1.0,
118
+ 0.9797958971132709,
119
+ 1.0,
120
+ 1.0,
121
+ 1.0,
122
+ 0.9797942770355633,
123
+ 0.9797949007791427,
124
+ 0.9797958854236333,
125
+ 1.0,
126
+ 0.979795897113271,
127
+ 1.0,
128
+ 0.9797957933341287,
129
+ 1.0,
130
+ 0.9797952,
131
+ 1.0,
132
+ 1.0
133
+ ]
134
+ ]
135
+ },
136
+ "width": 256,
137
+ "in_features": 59,
138
+ "out_features": 18,
139
+ "depth": 4,
140
+ "padding": 118,
141
+ "parameters": 125022,
142
+ "cert_evals": {
143
+ "36": 0.26811593770980835,
144
+ "72": 0.239130437374115,
145
+ "108": 0.17391304671764374,
146
+ "255": 0.028985507786273956
147
+ }
148
+ }
UCI_N4/sdp/runs/audiology-std/fold_2/result.json ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 30,
3
+ "best_val_acc": 0.36,
4
+ "test_acc": 0.3561643835616438,
5
+ "train_size": 25,
6
+ "val_size": 25,
7
+ "test_size": 146,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -1.7763568394002505e-17,
12
+ -8.399999999486596e-07,
13
+ 7.99999999756551e-08,
14
+ -1.2800000001833566e-06,
15
+ -3.6000000007696543e-07,
16
+ -8.799999999986596e-07,
17
+ 0.0,
18
+ 0.0,
19
+ 0.0,
20
+ 0.0,
21
+ 0.0,
22
+ 0.0,
23
+ 0.0,
24
+ 0.0,
25
+ 0.0,
26
+ 0.0,
27
+ -8.000000002006402e-08,
28
+ 7.99999999756551e-08,
29
+ 0.0,
30
+ 0.0,
31
+ 0.0,
32
+ 0.0,
33
+ 7.99999999756551e-08,
34
+ 0.0,
35
+ -3.199999999159431e-07,
36
+ 0.0,
37
+ 0.0,
38
+ 0.0,
39
+ 0.0,
40
+ 0.0,
41
+ 0.0,
42
+ 0.0,
43
+ -3.3306690738754695e-17,
44
+ -3.999999999981796e-07,
45
+ 0.0,
46
+ 7.99999999756551e-08,
47
+ 0.0,
48
+ 0.0,
49
+ 0.0,
50
+ 0.0,
51
+ 0.0,
52
+ 0.0,
53
+ -8.659739592076221e-17,
54
+ 0.0,
55
+ -8.659739592076221e-17,
56
+ 0.0,
57
+ 0.0,
58
+ 0.0,
59
+ -7.199999999940587e-07,
60
+ -4.800000000759752e-07,
61
+ 2.799999999325564e-07,
62
+ 0.0,
63
+ 2.220446049250313e-18,
64
+ 0.0,
65
+ -1.5999999996907377e-07,
66
+ 0.0,
67
+ -4.0000000006479297e-07,
68
+ 0.0,
69
+ 0.0
70
+ ]
71
+ ],
72
+ "std": [
73
+ [
74
+ 0.9797958971132714,
75
+ 0.979795399156076,
76
+ 0.979796007645425,
77
+ 0.9797944438980055,
78
+ 0.979795825808005,
79
+ 0.9797970293219844,
80
+ 1.0,
81
+ 1.0,
82
+ 1.0,
83
+ 1.0,
84
+ 1.0,
85
+ 1.0,
86
+ 1.0,
87
+ 1.0,
88
+ 0.9797958971132714,
89
+ 1.0,
90
+ 0.9797961795409461,
91
+ 0.979796007645425,
92
+ 1.0,
93
+ 1.0,
94
+ 1.0,
95
+ 1.0,
96
+ 0.9797960076454252,
97
+ 1.0,
98
+ 0.9797960772142222,
99
+ 1.0,
100
+ 1.0,
101
+ 1.0,
102
+ 1.0,
103
+ 1.0,
104
+ 1.0,
105
+ 1.0,
106
+ 0.9797958971132711,
107
+ 0.9797952000000001,
108
+ 1.0,
109
+ 0.9797960076454251,
110
+ 1.0,
111
+ 1.0,
112
+ 1.0,
113
+ 1.0,
114
+ 1.0,
115
+ 1.0,
116
+ 0.9797958971132709,
117
+ 1.0,
118
+ 0.9797958971132709,
119
+ 1.0,
120
+ 1.0,
121
+ 1.0,
122
+ 0.9797942770355633,
123
+ 0.9797949007791427,
124
+ 0.9797958854236333,
125
+ 1.0,
126
+ 0.979795897113271,
127
+ 1.0,
128
+ 0.9797957933341287,
129
+ 1.0,
130
+ 0.9797952,
131
+ 1.0,
132
+ 1.0
133
+ ]
134
+ ]
135
+ },
136
+ "width": 256,
137
+ "in_features": 59,
138
+ "out_features": 18,
139
+ "depth": 4,
140
+ "padding": 118,
141
+ "parameters": 125022,
142
+ "cert_evals": {
143
+ "36": 0.31506848335266113,
144
+ "72": 0.2602739632129669,
145
+ "108": 0.21232876181602478,
146
+ "255": 0.027397260069847107
147
+ }
148
+ }
UCI_N4/sdp/runs/audiology-std/fold_3/result.json ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 45,
3
+ "best_val_acc": 0.5,
4
+ "test_acc": 0.3546099290780142,
5
+ "train_size": 25,
6
+ "val_size": 30,
7
+ "test_size": 141,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -1.7763568394002505e-17,
12
+ -8.399999999486596e-07,
13
+ 7.99999999756551e-08,
14
+ -1.2800000001833566e-06,
15
+ -3.6000000007696543e-07,
16
+ -8.799999999986596e-07,
17
+ 0.0,
18
+ 0.0,
19
+ 0.0,
20
+ 0.0,
21
+ 0.0,
22
+ 0.0,
23
+ 0.0,
24
+ 0.0,
25
+ 0.0,
26
+ 0.0,
27
+ -8.000000002006402e-08,
28
+ 7.99999999756551e-08,
29
+ 0.0,
30
+ 0.0,
31
+ 0.0,
32
+ 0.0,
33
+ 7.99999999756551e-08,
34
+ 0.0,
35
+ -3.199999999159431e-07,
36
+ 0.0,
37
+ 0.0,
38
+ 0.0,
39
+ 0.0,
40
+ 0.0,
41
+ 0.0,
42
+ 0.0,
43
+ -3.3306690738754695e-17,
44
+ -3.999999999981796e-07,
45
+ 0.0,
46
+ 7.99999999756551e-08,
47
+ 0.0,
48
+ 0.0,
49
+ 0.0,
50
+ 0.0,
51
+ 0.0,
52
+ 0.0,
53
+ -8.659739592076221e-17,
54
+ 0.0,
55
+ -8.659739592076221e-17,
56
+ 0.0,
57
+ 0.0,
58
+ 0.0,
59
+ -7.199999999940587e-07,
60
+ -4.800000000759752e-07,
61
+ 2.799999999325564e-07,
62
+ 0.0,
63
+ 2.220446049250313e-18,
64
+ 0.0,
65
+ -1.5999999996907377e-07,
66
+ 0.0,
67
+ -4.0000000006479297e-07,
68
+ 0.0,
69
+ 0.0
70
+ ]
71
+ ],
72
+ "std": [
73
+ [
74
+ 0.9797958971132714,
75
+ 0.979795399156076,
76
+ 0.979796007645425,
77
+ 0.9797944438980055,
78
+ 0.979795825808005,
79
+ 0.9797970293219844,
80
+ 1.0,
81
+ 1.0,
82
+ 1.0,
83
+ 1.0,
84
+ 1.0,
85
+ 1.0,
86
+ 1.0,
87
+ 1.0,
88
+ 0.9797958971132714,
89
+ 1.0,
90
+ 0.9797961795409461,
91
+ 0.979796007645425,
92
+ 1.0,
93
+ 1.0,
94
+ 1.0,
95
+ 1.0,
96
+ 0.9797960076454252,
97
+ 1.0,
98
+ 0.9797960772142222,
99
+ 1.0,
100
+ 1.0,
101
+ 1.0,
102
+ 1.0,
103
+ 1.0,
104
+ 1.0,
105
+ 1.0,
106
+ 0.9797958971132711,
107
+ 0.9797952000000001,
108
+ 1.0,
109
+ 0.9797960076454251,
110
+ 1.0,
111
+ 1.0,
112
+ 1.0,
113
+ 1.0,
114
+ 1.0,
115
+ 1.0,
116
+ 0.9797958971132709,
117
+ 1.0,
118
+ 0.9797958971132709,
119
+ 1.0,
120
+ 1.0,
121
+ 1.0,
122
+ 0.9797942770355633,
123
+ 0.9797949007791427,
124
+ 0.9797958854236333,
125
+ 1.0,
126
+ 0.979795897113271,
127
+ 1.0,
128
+ 0.9797957933341287,
129
+ 1.0,
130
+ 0.9797952,
131
+ 1.0,
132
+ 1.0
133
+ ]
134
+ ]
135
+ },
136
+ "width": 256,
137
+ "in_features": 59,
138
+ "out_features": 18,
139
+ "depth": 4,
140
+ "padding": 118,
141
+ "parameters": 125022,
142
+ "cert_evals": {
143
+ "36": 0.3191489279270172,
144
+ "72": 0.27659574151039124,
145
+ "108": 0.24822694063186646,
146
+ "255": 0.06382978707551956
147
+ }
148
+ }
UCI_N4/sdp/runs/balance-scale/fold_0/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 40,
3
+ "best_val_acc": 0.7108433734939759,
4
+ "test_acc": 0.694300518134715,
5
+ "train_size": 156,
6
+ "val_size": 83,
7
+ "test_size": 386,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.05887832692307693,
12
+ -2.5641025661690044e-08,
13
+ 0.09964028205128199,
14
+ -0.09058207692307692
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 0.9464310236223092,
20
+ 0.9765235538802873,
21
+ 0.9974316897506468,
22
+ 1.0391308031314608
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 3,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1569,
32
+ "cert_evals": {
33
+ "36": 0.5803108811378479,
34
+ "72": 0.4404144883155823,
35
+ "108": 0.3134714961051941,
36
+ "255": 0.03367875516414642
37
+ }
38
+ }
UCI_N4/sdp/runs/balance-scale/fold_1/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 54,
3
+ "best_val_acc": 0.8556701030927835,
4
+ "test_acc": 0.7688172043010753,
5
+ "train_size": 156,
6
+ "val_size": 97,
7
+ "test_size": 372,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.09511109615384612,
12
+ -3.416070845000482e-17,
13
+ 0.00905823076923074,
14
+ 0.08152388461538454
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 1.0090351712085057,
20
+ 1.0055834762270852,
21
+ 0.9532661180714023,
22
+ 1.002273371607005
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 3,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1569,
32
+ "cert_evals": {
33
+ "36": 0.6236559152603149,
34
+ "72": 0.4865591526031494,
35
+ "108": 0.3870967626571655,
36
+ "255": 0.09139785170555115
37
+ }
38
+ }
UCI_N4/sdp/runs/balance-scale/fold_2/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 70,
3
+ "best_val_acc": 0.7634408602150538,
4
+ "test_acc": 0.7207446808510638,
5
+ "train_size": 156,
6
+ "val_size": 93,
7
+ "test_size": 376,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.00452913461538464,
12
+ 0.06340748717948716,
13
+ -1.2820512825151571e-08,
14
+ 0.09964030769230771
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 0.9879158233594086,
20
+ 0.9907460042778667,
21
+ 1.027617579941566,
22
+ 0.9614936385801037
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 3,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1569,
32
+ "cert_evals": {
33
+ "36": 0.585106372833252,
34
+ "72": 0.4627659320831299,
35
+ "108": 0.3643617033958435,
36
+ "255": 0.07180850952863693
37
+ }
38
+ }
UCI_N4/sdp/runs/balance-scale/fold_3/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 17,
3
+ "best_val_acc": 0.8260869565217391,
4
+ "test_acc": 0.8143236074270557,
5
+ "train_size": 156,
6
+ "val_size": 92,
7
+ "test_size": 377,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.05434929487179499,
12
+ -0.08605298076923085,
13
+ 0.06793655769230768,
14
+ -0.16757685256410257
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 1.0569029867956488,
20
+ 1.0161657906649941,
21
+ 0.9625917447832895,
22
+ 0.9469510608150327
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 3,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1569,
32
+ "cert_evals": {
33
+ "36": 0.6100795865058899,
34
+ "72": 0.3899204134941101,
35
+ "108": 0.24137930572032928,
36
+ "255": 0.03978779911994934
37
+ }
38
+ }
UCI_N4/sdp/runs/balloons/fold_0/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 1,
3
+ "best_val_acc": 0.5,
4
+ "test_acc": 0.5,
5
+ "train_size": 4,
6
+ "val_size": 4,
7
+ "test_size": 8,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.0,
12
+ 0.0,
13
+ -0.968246,
14
+ 0.0
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 0.968246,
20
+ 0.968246,
21
+ 1.0,
22
+ 0.968246
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 2,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1558,
32
+ "cert_evals": {
33
+ "36": 0.5,
34
+ "72": 0.5,
35
+ "108": 0.125,
36
+ "255": 0.0
37
+ }
38
+ }
UCI_N4/sdp/runs/balloons/fold_1/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 1,
3
+ "best_val_acc": 0.0,
4
+ "test_acc": 0.3,
5
+ "train_size": 4,
6
+ "val_size": 2,
7
+ "test_size": 10,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.484123,
12
+ 0.484123,
13
+ 0.0,
14
+ 0.0
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 0.8385256331126676,
20
+ 0.8385256331126676,
21
+ 0.968246,
22
+ 0.968246
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 2,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1558,
32
+ "cert_evals": {
33
+ "36": 0.10000000149011612,
34
+ "72": 0.0,
35
+ "108": 0.0,
36
+ "255": 0.0
37
+ }
38
+ }
UCI_N4/sdp/runs/bank/fold_1/result.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 27,
3
+ "best_val_acc": 0.8402985074626865,
4
+ "test_acc": 0.8357221609702316,
5
+ "train_size": 1130,
6
+ "val_size": 670,
7
+ "test_size": 2721,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.01574801380530978,
12
+ 0.0023927396460177394,
13
+ 0.0021967858407077644,
14
+ -0.01932307256637162,
15
+ 0.006853599999999982,
16
+ -0.03479098039734521,
17
+ 0.0010882398230089275,
18
+ 0.02142298584070794,
19
+ -0.04310824424778776,
20
+ -0.002926514159292115,
21
+ -0.01356536707964567,
22
+ 0.01527978015929205,
23
+ -0.04149083628318521,
24
+ -0.006613960176991296,
25
+ 0.006211176106194516,
26
+ -0.021354536283185895
27
+ ]
28
+ ],
29
+ "std": [
30
+ [
31
+ 0.969300386690253,
32
+ 1.0029838787869998,
33
+ 1.0077378567908635,
34
+ 1.0067270576318987,
35
+ 0.9737641828355684,
36
+ 0.8874066057167844,
37
+ 1.0000362134178429,
38
+ 0.978768086158569,
39
+ 1.0166647522536418,
40
+ 1.0110908544078474,
41
+ 0.9795699211960872,
42
+ 0.988628308543735,
43
+ 0.8468895052095667,
44
+ 1.0088647512260476,
45
+ 1.0744144429583726,
46
+ 0.97024384329565
47
+ ]
48
+ ]
49
+ },
50
+ "width": 64,
51
+ "in_features": 16,
52
+ "out_features": 2,
53
+ "depth": 4,
54
+ "padding": 32,
55
+ "parameters": 8770,
56
+ "cert_evals": {
57
+ "36": 0.781330406665802,
58
+ "72": 0.7023153305053711,
59
+ "108": 0.6159499883651733,
60
+ "255": 0.21977214515209198
61
+ }
62
+ }
UCI_N4/sdp/runs/bank/fold_3/result.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 26,
3
+ "best_val_acc": 0.8491704374057315,
4
+ "test_acc": 0.841275659824047,
5
+ "train_size": 1130,
6
+ "val_size": 663,
7
+ "test_size": 2728,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.0319807638938054,
12
+ 0.00842759592920361,
13
+ 0.0032132584070795264,
14
+ -0.0512567557522122,
15
+ 0.02061919999999998,
16
+ 0.017208951831858395,
17
+ -0.023906728318583995,
18
+ 0.009127680530973464,
19
+ 0.04229537345132683,
20
+ 0.03913422522123883,
21
+ -0.0012866005309730669,
22
+ 0.019049747389380534,
23
+ 0.0011946368141599608,
24
+ -0.01394144424778776,
25
+ -0.01887086017699146,
26
+ -0.012322258407079635
27
+ ]
28
+ ],
29
+ "std": [
30
+ [
31
+ 0.9997012384907139,
32
+ 1.011637351521284,
33
+ 1.0052459246549308,
34
+ 0.9835551200097631,
35
+ 0.9188989108776542,
36
+ 0.975563370252112,
37
+ 0.9964151726496702,
38
+ 0.9910016079646086,
39
+ 0.9876324728734414,
40
+ 0.9709295082923052,
41
+ 1.018649934814902,
42
+ 1.045208416973306,
43
+ 1.0916320113723843,
44
+ 0.971971990527501,
45
+ 0.9802679634858928,
46
+ 0.9883913040231975
47
+ ]
48
+ ]
49
+ },
50
+ "width": 64,
51
+ "in_features": 16,
52
+ "out_features": 2,
53
+ "depth": 4,
54
+ "padding": 32,
55
+ "parameters": 8770,
56
+ "cert_evals": {
57
+ "36": 0.7991202473640442,
58
+ "72": 0.7452346086502075,
59
+ "108": 0.671187698841095,
60
+ "255": 0.2738269865512848
61
+ }
62
+ }
UCI_N4/sdp/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/wilcoxon_pairwise_all.csv ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ metric,alg_a,alg_b,n_common,n_nonzero,wins_a,wins_b,ties,win_rate_a_over_b,mean_diff_a_minus_b,median_diff_a_minus_b,W_stat,p_two_sided,z_equiv,effect_size_r,p_holm_global,p_holm_within_metric
2
+ mean_cert_acc_108,aol,ldlt-resnet,121,121,1,120,0,0.008264462809917356,-0.24158591851735536,-0.22286115070000004,11.0,1.797749072159875e-21,-9.516114773194431,0.8651013430176756,1.348311804119906e-19,2.696623608239812e-20
3
+ mean_cert_acc_108,aol,sdp,121,121,4,117,0,0.03305785123966942,-0.20705215111652892,-0.1616377295,33.0,3.102799787065712e-21,-9.459209493224254,0.8599281357476595,2.296071842428627e-19,4.3439197018919967e-20
4
+ mean_cert_acc_108,aol,ortho,121,121,6,115,0,0.049586776859504134,-0.22247552428264467,-0.1828913777,54.0,5.2084252913700304e-21,-9.404890816889083,0.8549900742626438,3.802150462700122e-19,6.770952878781039e-20
5
+ mean_cert_acc_108,aol,sandwich,121,121,5,116,0,0.04132231404958678,-0.2760772690677686,-0.2530477867,63.0,6.49720575799675e-21,-9.381611384174015,0.8528737621976377,4.67798814575766e-19,7.7966469095961e-20
6
+ mean_cert_acc_108,aol,ldlt,121,117,15,102,4,0.14049586776859505,-0.14590028245619835,-0.0794756578,265.0,4.503316114591703e-18,-8.66529847776026,0.8011071276606325,2.656956507609105e-16,4.953647726050873e-17
7
+ mean_cert_acc_108,ldlt,sandwich,121,120,16,104,1,0.13636363636363635,-0.13017698661157026,-0.0911340416,469.0,1.2638532990605736e-16,-8.27693578933863,0.7555774064737658,6.951193144833155e-15,1.2638532990605736e-15
8
+ mean_cert_acc_108,ortho,sandwich,121,121,15,106,0,0.12396694214876033,-0.053601744785123966,-0.04109544310000002,634.0,2.6866436191638997e-15,-7.904660708584446,0.7186055189622224,1.3164553733903108e-13,2.4179792572475097e-14
9
+ mean_cert_acc_108,sandwich,sdp,121,120,95,25,1,0.7892561983471075,0.0690251179512397,0.03914702120000002,769.0,6.820770278047664e-14,7.491275059453614,0.6838567224230998,3.2057620306824023e-12,5.456616222438131e-13
10
+ mean_cert_acc_108,ldlt,ldlt-resnet,121,121,28,93,0,0.23140495867768596,-0.09568563606115704,-0.05591615720000001,854.0,2.207173194165766e-13,-7.335607908882686,0.6668734462620624,9.71156205432937e-12,1.545021235916036e-12
11
+ mean_cert_acc_108,ldlt,ortho,121,121,39,82,0,0.32231404958677684,-0.0765752418264463,-0.028889218600000002,1595.0,5.995523770828764e-08,-5.418934615341759,0.49263041957652354,1.8586123689569167e-06,3.5973142624972584e-07
12
+ mean_cert_acc_108,ldlt,sdp,121,119,37,82,2,0.3140495867768595,-0.06115186866033058,-0.02308885100000002,1675.0,5.06442347780701e-07,-5.0238559265780784,0.46053611771803965,1.4180385737859628e-05,2.5322117389035047e-06
13
+ mean_cert_acc_108,ldlt-resnet,sdp,121,121,83,38,0,0.6859504132231405,0.03453376740082644,0.018723312800000003,2059.0,2.4565990271643443e-05,4.218750528698047,0.3835227753361861,0.0005158857957045123,9.826396108657377e-05
14
+ mean_cert_acc_108,ldlt-resnet,sandwich,121,121,43,78,0,0.35537190082644626,-0.03449135055041323,-0.02128587660000003,2138.0,5.9594970147687546e-05,-4.014408841532416,0.3649462583211287,0.001044842007824354,0.00017878491044306263
15
+ mean_cert_acc_108,ldlt-resnet,ortho,121,121,77,44,0,0.6363636363636364,0.019110394234710743,0.01817540080000002,2506.0,0.0021946809205803104,3.0625387038494716,0.27841260944086105,0.019752128285222794,0.004389361841160621
16
+ mean_cert_acc_108,ortho,sdp,121,121,65,56,0,0.5371900826446281,0.015423373166115709,0.003775427100000006,3069.0,0.10821221439603135,1.6062808573399678,0.1460255324854516,0.8656977151682508,0.10821221439603135
17
+ mean_cert_acc_255,aol,ldlt-resnet,121,112,1,111,9,0.045454545454545456,-0.11734706390661157,-0.0569680196,10.0,5.435127868923378e-20,-9.155012973058705,0.865067413438693,3.58718439348943e-18,8.152691803385068e-19
18
+ mean_cert_acc_255,aol,sandwich,121,114,2,112,7,0.045454545454545456,-0.14975303244545457,-0.08033088320000001,62.0,9.896991201233032e-20,-9.090075933634997,0.8513636145642759,6.33407436878914e-18,1.3855787681726244e-18
19
+ mean_cert_acc_255,aol,sdp,121,107,3,104,14,0.08264462809917356,-0.09192413907520662,-0.04761767380000004,23.0,5.290354120745356e-19,-8.90600710173059,0.8609762036942776,3.227116013654667e-17,6.877460356968962e-18
20
+ mean_cert_acc_255,aol,ortho,121,110,5,105,11,0.08677685950413223,-0.09715260164132232,-0.03630535300000004,122.0,2.3696816082203004e-18,-8.73814550939856,0.8331494842595897,1.4218089649321803e-16,2.8436179298643605e-17
21
+ mean_cert_acc_255,ortho,sandwich,121,114,11,103,7,0.11983471074380166,-0.05260043080413224,-0.031272400199999995,258.0,1.3906084383345868e-17,-8.535906452144342,0.7994608872067027,8.065528942340604e-16,1.5296692821680454e-16
22
+ mean_cert_acc_255,ldlt,sandwich,121,114,12,102,7,0.128099173553719,-0.08444288477851239,-0.0396959223,342.0,1.0551821198881891e-16,-8.298405245791203,0.7772168611963141,5.909019871373859e-15,1.0551821198881892e-15
23
+ mean_cert_acc_255,aol,ldlt,121,93,8,85,28,0.18181818181818182,-0.06531014766694214,-0.0160309789,182.0,1.6583006315455866e-14,-7.674681580277351,0.7958274071184978,7.959843031418816e-13,1.492470568391028e-13
24
+ mean_cert_acc_255,sandwich,sdp,121,115,90,25,6,0.768595041322314,0.05782889337024793,0.023969374600000037,977.0,4.7297035216832455e-11,6.57920498234637,0.613514028043662,1.7499903030228008e-09,3.7837628173465964e-10
25
+ mean_cert_acc_255,ldlt,ldlt-resnet,121,112,23,89,9,0.22727272727272727,-0.052036916239669426,-0.024182047400000004,927.0,8.423037347976693e-11,-6.49284493871755,0.6135161788982517,3.0322934452716093e-09,5.896126143583686e-10
26
+ mean_cert_acc_255,ldlt-resnet,sdp,121,115,80,35,6,0.6859504132231405,0.02542292483140496,0.0174753755,1603.0,1.3503770074500393e-06,4.832192333799678,0.45060425856101827,3.375942518625098e-05,8.102262044700236e-06
27
+ mean_cert_acc_255,ldlt,sdp,121,106,27,79,15,0.28512396694214875,-0.026613991408264467,-0.0090909088,1323.0,1.8823917821239997e-06,-4.765657080027094,0.46288153466731174,4.517740277097599e-05,9.411958910619998e-06
28
+ mean_cert_acc_255,ldlt,ortho,121,111,36,75,10,0.33884297520661155,-0.03184245397438017,-0.008467743099999994,1741.0,5.8046778212464115e-05,-4.020613482233357,0.3816197434492089,0.001044842007824354,0.00023218711284985646
29
+ mean_cert_acc_255,ldlt-resnet,ortho,121,117,77,40,4,0.6528925619834711,0.020194462265289256,0.0131578948,1982.0,6.4586906071814e-05,3.995393428697371,0.36937425314923705,0.001044842007824354,0.00023218711284985646
30
+ mean_cert_acc_255,ldlt-resnet,sandwich,121,118,45,73,3,0.384297520661157,-0.03240596853884298,-0.007769852899999985,2234.0,0.0006111136089935205,-3.4266333540213187,0.31544716905558257,0.007247342740102473,0.001222227217987041
31
+ mean_cert_acc_255,ortho,sdp,121,113,55,58,8,0.48760330578512395,0.0052284625661157,0.0,3068.0,0.6632312125180395,0.43545635481621653,0.0409642880245867,1.0,0.6632312125180395
32
+ mean_cert_acc_36,aol,ldlt-resnet,121,121,6,115,0,0.049586776859504134,-0.2438353373305785,-0.231873706,84.0,1.0860959640304494e-20,-9.327292707838847,0.8479357007126225,7.711281344616191e-19,1.629143946045674e-19
33
+ mean_cert_acc_36,aol,sandwich,121,121,6,115,0,0.049586776859504134,-0.2706310854,-0.24364745610000005,88.0,1.1973679663363807e-20,-9.316946293298813,0.8469951175726194,8.381575764354665e-19,1.676315152870933e-19
34
+ mean_cert_acc_36,aol,sdp,121,121,6,115,0,0.049586776859504134,-0.22157216573801655,-0.19121596959999998,145.0,4.7517450378286984e-20,-9.169509886103357,0.8335918078275779,3.183669175345228e-18,6.177268549177308e-19
35
+ mean_cert_acc_36,aol,ortho,121,121,10,111,0,0.08264462809917356,-0.23044399081570252,-0.21867529300000002,196.0,1.6015929096147696e-19,-9.037593100717949,0.8215993727925408,1.0090035330573049e-17,1.9219114915377238e-18
36
+ mean_cert_acc_36,aol,ldlt,121,121,16,105,0,0.1322314049586777,-0.16320656559917357,-0.12175737319999999,579.0,8.49009306398396e-16,-8.046923908509886,0.7315385371372624,4.499749323911499e-14,9.339102370382356e-15
37
+ mean_cert_acc_36,ldlt,sandwich,121,121,28,93,0,0.23140495867768596,-0.10742451980082644,-0.05105680230000009,884.0,3.928270999828109e-13,-7.258009799832447,0.6598190727120407,1.689156529926087e-11,3.928270999828109e-12
38
+ mean_cert_acc_36,sandwich,sdp,121,121,97,24,0,0.8016528925619835,0.04905891966198347,0.019867688399999972,1005.0,3.783778704446017e-12,6.94503075999648,0.6313664327269527,1.513511481778407e-10,3.4054008340014156e-11
39
+ mean_cert_acc_36,ortho,sandwich,121,120,24,96,1,0.2024793388429752,-0.04018709458429752,-0.027458041900000008,1002.0,5.9401079860634335e-12,-6.881078559242919,0.6281536578104159,2.2572410347041047e-10,4.752086388850747e-11
40
+ mean_cert_acc_36,ldlt,ldlt-resnet,121,121,39,82,0,0.32231404958677684,-0.08062877173140495,-0.03722838319999999,1356.0,1.5687653359134654e-09,-6.037132884108671,0.5488302621916974,5.176925608514436e-08,1.0981357351394257e-08
41
+ mean_cert_acc_36,ldlt,ortho,121,121,47,74,0,0.3884297520661157,-0.06723742521652892,-0.018995806599999998,1855.0,2.0705094452157784e-06,-4.74641767023968,0.43149251547633455,4.762171723996291e-05,1.242305667129467e-05
42
+ mean_cert_acc_36,ldlt,sdp,121,121,49,72,0,0.4049586776859504,-0.05836560013884298,-0.007477333800000013,2119.0,4.833107021995231e-05,-4.063554310597567,0.36941402823614244,0.0009182903341790939,0.00024165535109976156
43
+ mean_cert_acc_36,ldlt-resnet,sandwich,121,121,41,80,0,0.33884297520661155,-0.026795748069421487,-0.016848057499999958,2142.0,6.226392248691838e-05,-4.004062426992384,0.3640056751811258,0.001044842007824354,0.0002490556899476735
44
+ mean_cert_acc_36,ldlt-resnet,sdp,121,120,81,39,1,0.6735537190082644,0.02226317159256198,0.011815026399999984,2104.0,6.467109790725387e-05,3.9950848114653006,0.36469967839763645,0.001044842007824354,0.0002490556899476735
45
+ mean_cert_acc_36,ldlt-resnet,ortho,121,121,78,43,0,0.6446280991735537,0.013391346514876033,0.012558475099999966,2429.0,0.0011074347250513686,3.2617071837450875,0.29651883488591707,0.011074347250513686,0.002214869450102737
46
+ mean_cert_acc_36,ortho,sdp,121,121,60,61,0,0.49586776859504134,0.008871825077685951,-0.00043843690000000546,3076.0,0.11224685580376029,1.5881746318949113,0.1443795119904465,0.8656977151682508,0.11224685580376029
47
+ mean_cert_acc_72,aol,sandwich,121,121,7,114,0,0.05785123966942149,-0.2932351713214876,-0.2614153504,107.0,1.9002333534012075e-20,-9.26780082423366,0.8425273476576055,1.3111610138468333e-18,2.850350030101811e-19
48
+ mean_cert_acc_72,aol,ldlt-resnet,121,121,5,116,0,0.04132231404958678,-0.2631359925727273,-0.23269398510000006,116.0,2.3629582907707156e-20,-9.244521391518589,0.840411035592599,1.6068116377240865e-18,3.308141607079002e-19
49
+ mean_cert_acc_72,aol,sdp,121,121,5,116,0,0.04132231404958678,-0.23148971349173555,-0.1927602664,162.0,7.138107476697239e-20,-9.12553762430822,0.8295943294825655,4.6397698598532054e-18,9.27953971970641e-19
50
+ mean_cert_acc_72,aol,ortho,121,121,11,110,0,0.09090909090909091,-0.2412404211198347,-0.20635481180000004,214.0,2.4491474386621335e-19,-8.991034235287804,0.8173667486625277,1.5184714119705228e-17,2.93897692639456e-18
51
+ mean_cert_acc_72,aol,ldlt,121,119,19,100,2,0.1652892561983471,-0.1632772664768595,-0.125,557.0,1.3650119218595034e-15,-7.988580616952475,0.7323119844949035,7.098061993669418e-14,1.5015131140454537e-14
52
+ mean_cert_acc_72,ldlt,sandwich,121,121,20,101,0,0.1652892561983471,-0.1299579048446281,-0.0772011476,607.0,1.5300017598947808e-15,-7.974499006729662,0.724954455157242,7.803008975463382e-14,1.530001759894781e-14
53
+ mean_cert_acc_72,ortho,sandwich,121,120,19,101,1,0.16115702479338842,-0.0519947502016529,-0.03462790700000007,601.0,2.1695959323890928e-15,-7.931245068189224,0.7240203054914729,1.0847979661945464e-13,1.9526363391501836e-14
54
+ mean_cert_acc_72,sandwich,sdp,121,120,95,25,1,0.7892561983471075,0.06174545782975206,0.03927724810000002,801.0,1.287303814085018e-13,7.407471248265881,0.6762065161243622,5.792867163382581e-12,1.0298430512680145e-12
55
+ mean_cert_acc_72,ldlt,ldlt-resnet,121,121,30,91,0,0.24793388429752067,-0.09985872609586775,-0.062678976,930.0,9.399453364498409e-13,-7.139026032622079,0.6490023666020072,3.9477704130893314e-11,6.579617355148886e-12
56
+ mean_cert_acc_72,ldlt,ortho,121,121,42,79,0,0.34710743801652894,-0.07796315464297522,-0.020989417999999982,1696.0,2.500182392734213e-07,-5.157687648205951,0.4688806952914501,7.500547178202639e-06,1.5001094356405279e-06
57
+ mean_cert_acc_72,ldlt,sdp,121,121,42,79,0,0.34710743801652894,-0.06821244701487603,-0.021312758300000012,1776.0,7.392446683490399e-07,-4.950759357405312,0.450069032491392,1.9959606045424077e-05,3.6962233417451994e-06
58
+ mean_cert_acc_72,ldlt-resnet,sdp,121,121,83,38,0,0.6859504132231405,0.03164627908099173,0.01917563379999998,1938.0,5.850271358991362e-06,4.531729568534016,0.4119754153212742,0.00012870596989780997,2.3401085435965447e-05
59
+ mean_cert_acc_72,ldlt-resnet,sandwich,121,121,40,81,0,0.3305785123966942,-0.03009917874876034,-0.019695848200000032,2062.0,2.5425319440171077e-05,-4.210990717793024,0.382817337981184,0.0005158857957045123,7.627595832051323e-05
60
+ mean_cert_acc_72,ldlt-resnet,ortho,121,121,78,43,0,0.6446280991735537,0.021895571452892563,0.017794482400000033,2306.0,0.0003437790889925944,3.579859430851071,0.3254417664410065,0.004469128156903727,0.0006875581779851888
61
+ mean_cert_acc_72,ortho,sdp,121,121,66,55,0,0.5454545454545454,0.009750707628099172,0.004098355799999953,3178.0,0.18538979937926348,1.3243410611240953,0.1203946419203723,0.8656977151682508,0.18538979937926348
62
+ mean_test_acc,aol,ldlt,121,121,16,105,0,0.1322314049586777,-0.09281452340082647,-0.056798912199999996,412.0,2.273589154706615e-17,-8.478886715556222,0.7708078832323838,1.2959458181827706e-15,3.4103837320599226e-16
63
+ mean_test_acc,aol,sandwich,121,121,18,103,0,0.1487603305785124,-0.09203259326611571,-0.05946643780000005,518.0,2.311544436918459e-16,-8.204706730245373,0.7458824300223067,1.248233995935968e-14,3.2361622116858428e-15
64
+ mean_test_acc,aol,sdp,121,121,22,99,0,0.18181818181818182,-0.06835675380991735,-0.03513440550000002,806.0,8.667701016468735e-14,-7.459764883363071,0.6781604439420974,3.987142467575618e-12,1.1268011321409356e-12
65
+ mean_test_acc,aol,ortho,121,121,27,94,0,0.2231404958677686,-0.0674542894,-0.02649849470000004,971.0,2.0217519208624917e-12,-7.032975283586752,0.6393613894169774,8.289182875536216e-11,2.42610230503499e-11
66
+ mean_test_acc,aol,ldlt-resnet,121,121,25,96,0,0.2066115702479339,-0.07273327814214876,-0.031338923699999965,1013.0,4.3801917672420244e-12,-6.924337930916415,0.6294852664469468,1.7082747892243896e-10,4.818210943966227e-11
67
+ mean_test_acc,ortho,sandwich,121,120,31,89,1,0.2603305785123967,-0.024578303866115706,-0.012561727300000047,1269.0,6.335852078999485e-10,-6.181840509645258,0.5643222490053234,2.21754822764982e-08,6.335852078999485e-09
68
+ mean_test_acc,ldlt,ortho,121,121,94,27,0,0.7768595041322314,0.02536023400082645,0.013893890999999992,1309.0,7.334300863478093e-10,6.158703254954046,0.5598821140867315,2.4936622935825517e-08,6.600870777130284e-09
69
+ mean_test_acc,ldlt,sdp,121,121,86,35,0,0.7107438016528925,0.024457769590909093,0.011069503199999942,1503.0,1.5412957513923103e-08,5.6569021497624945,0.5142638317965904,4.932146404455393e-07,1.2330366011138482e-07
70
+ mean_test_acc,ldlt,ldlt-resnet,121,120,87,33,1,0.7231404958677686,0.020081245258677688,0.01084393090000002,1689.0,3.7364765861695115e-07,5.081915487806236,0.46391329133439085,1.0835782099891583e-05,2.615533610318658e-06
71
+ mean_test_acc,sandwich,sdp,121,121,83,38,0,0.6859504132231405,0.02367583945619835,0.008980192799999953,1789.0,8.782065986480298e-07,4.917133510150208,0.44701213728638256,2.2833371564848774e-05,5.269239591888179e-06
72
+ mean_test_acc,ldlt-resnet,sandwich,121,121,43,78,0,0.35537190082644626,-0.019299315123966942,-0.006794625399999976,2364.0,0.0006039452283418727,-3.4298364200206075,0.3118033109109643,0.007247342740102473,0.0030197261417093633
73
+ mean_test_acc,ldlt-resnet,sdp,121,120,66,54,1,0.5495867768595041,0.004376524332231406,0.0019017287000000493,3070.0,0.14285074221929925,1.4652572612355523,0.133759075754492,0.8656977151682508,0.571402968877197
74
+ mean_test_acc,ldlt-resnet,ortho,121,121,71,50,0,0.5867768595041323,0.005278988742148763,0.002452642000000005,3138.0,0.15334793383215564,1.4278052065244156,0.12980047332040143,0.8656977151682508,0.571402968877197
75
+ mean_test_acc,ortho,sdp,121,121,60,61,0,0.49586776859504134,-0.0009024644099173576,-0.00036599980000007193,3623.0,0.862413703083493,-0.17330244354553592,0.01575476759504872,1.0,1.0
76
+ mean_test_acc,ldlt,sandwich,121,121,59,62,0,0.48760330578512395,0.000781930134710744,-0.00016415209999998126,3624.0,0.8644472072224189,0.170715839910528,0.015519621810048,1.0,1.0
UCI_N4/wilcoxon_pairwise_all.json ADDED
@@ -0,0 +1,1427 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metric":"mean_cert_acc_108",
4
+ "alg_a":"aol",
5
+ "alg_b":"ldlt-resnet",
6
+ "n_common":121,
7
+ "n_nonzero":121,
8
+ "wins_a":1,
9
+ "wins_b":120,
10
+ "ties":0,
11
+ "win_rate_a_over_b":0.0082644628,
12
+ "mean_diff_a_minus_b":-0.2415859185,
13
+ "median_diff_a_minus_b":-0.2228611507,
14
+ "W_stat":11.0,
15
+ "p_two_sided":1.797749072e-21,
16
+ "z_equiv":-9.5161147732,
17
+ "effect_size_r":0.865101343,
18
+ "p_holm_global":1.348311804e-19,
19
+ "p_holm_within_metric":2.696623608e-20
20
+ },
21
+ {
22
+ "metric":"mean_cert_acc_108",
23
+ "alg_a":"aol",
24
+ "alg_b":"sdp",
25
+ "n_common":121,
26
+ "n_nonzero":121,
27
+ "wins_a":4,
28
+ "wins_b":117,
29
+ "ties":0,
30
+ "win_rate_a_over_b":0.0330578512,
31
+ "mean_diff_a_minus_b":-0.2070521511,
32
+ "median_diff_a_minus_b":-0.1616377295,
33
+ "W_stat":33.0,
34
+ "p_two_sided":3.102799787e-21,
35
+ "z_equiv":-9.4592094932,
36
+ "effect_size_r":0.8599281357,
37
+ "p_holm_global":2.296071842e-19,
38
+ "p_holm_within_metric":4.343919702e-20
39
+ },
40
+ {
41
+ "metric":"mean_cert_acc_108",
42
+ "alg_a":"aol",
43
+ "alg_b":"ortho",
44
+ "n_common":121,
45
+ "n_nonzero":121,
46
+ "wins_a":6,
47
+ "wins_b":115,
48
+ "ties":0,
49
+ "win_rate_a_over_b":0.0495867769,
50
+ "mean_diff_a_minus_b":-0.2224755243,
51
+ "median_diff_a_minus_b":-0.1828913777,
52
+ "W_stat":54.0,
53
+ "p_two_sided":5.208425291e-21,
54
+ "z_equiv":-9.4048908169,
55
+ "effect_size_r":0.8549900743,
56
+ "p_holm_global":3.802150463e-19,
57
+ "p_holm_within_metric":6.770952879e-20
58
+ },
59
+ {
60
+ "metric":"mean_cert_acc_108",
61
+ "alg_a":"aol",
62
+ "alg_b":"sandwich",
63
+ "n_common":121,
64
+ "n_nonzero":121,
65
+ "wins_a":5,
66
+ "wins_b":116,
67
+ "ties":0,
68
+ "win_rate_a_over_b":0.041322314,
69
+ "mean_diff_a_minus_b":-0.2760772691,
70
+ "median_diff_a_minus_b":-0.2530477867,
71
+ "W_stat":63.0,
72
+ "p_two_sided":6.497205758e-21,
73
+ "z_equiv":-9.3816113842,
74
+ "effect_size_r":0.8528737622,
75
+ "p_holm_global":4.677988146e-19,
76
+ "p_holm_within_metric":7.79664691e-20
77
+ },
78
+ {
79
+ "metric":"mean_cert_acc_108",
80
+ "alg_a":"aol",
81
+ "alg_b":"ldlt",
82
+ "n_common":121,
83
+ "n_nonzero":117,
84
+ "wins_a":15,
85
+ "wins_b":102,
86
+ "ties":4,
87
+ "win_rate_a_over_b":0.1404958678,
88
+ "mean_diff_a_minus_b":-0.1459002825,
89
+ "median_diff_a_minus_b":-0.0794756578,
90
+ "W_stat":265.0,
91
+ "p_two_sided":4.503316115e-18,
92
+ "z_equiv":-8.6652984778,
93
+ "effect_size_r":0.8011071277,
94
+ "p_holm_global":2.656956508e-16,
95
+ "p_holm_within_metric":4.953647726e-17
96
+ },
97
+ {
98
+ "metric":"mean_cert_acc_108",
99
+ "alg_a":"ldlt",
100
+ "alg_b":"sandwich",
101
+ "n_common":121,
102
+ "n_nonzero":120,
103
+ "wins_a":16,
104
+ "wins_b":104,
105
+ "ties":1,
106
+ "win_rate_a_over_b":0.1363636364,
107
+ "mean_diff_a_minus_b":-0.1301769866,
108
+ "median_diff_a_minus_b":-0.0911340416,
109
+ "W_stat":469.0,
110
+ "p_two_sided":1.263853299e-16,
111
+ "z_equiv":-8.2769357893,
112
+ "effect_size_r":0.7555774065,
113
+ "p_holm_global":0.0,
114
+ "p_holm_within_metric":0.0
115
+ },
116
+ {
117
+ "metric":"mean_cert_acc_108",
118
+ "alg_a":"ortho",
119
+ "alg_b":"sandwich",
120
+ "n_common":121,
121
+ "n_nonzero":121,
122
+ "wins_a":15,
123
+ "wins_b":106,
124
+ "ties":0,
125
+ "win_rate_a_over_b":0.1239669421,
126
+ "mean_diff_a_minus_b":-0.0536017448,
127
+ "median_diff_a_minus_b":-0.0410954431,
128
+ "W_stat":634.0,
129
+ "p_two_sided":0.0,
130
+ "z_equiv":-7.9046607086,
131
+ "effect_size_r":0.718605519,
132
+ "p_holm_global":0.0,
133
+ "p_holm_within_metric":0.0
134
+ },
135
+ {
136
+ "metric":"mean_cert_acc_108",
137
+ "alg_a":"sandwich",
138
+ "alg_b":"sdp",
139
+ "n_common":121,
140
+ "n_nonzero":120,
141
+ "wins_a":95,
142
+ "wins_b":25,
143
+ "ties":1,
144
+ "win_rate_a_over_b":0.7892561983,
145
+ "mean_diff_a_minus_b":0.069025118,
146
+ "median_diff_a_minus_b":0.0391470212,
147
+ "W_stat":769.0,
148
+ "p_two_sided":0.0,
149
+ "z_equiv":7.4912750595,
150
+ "effect_size_r":0.6838567224,
151
+ "p_holm_global":0.0,
152
+ "p_holm_within_metric":0.0
153
+ },
154
+ {
155
+ "metric":"mean_cert_acc_108",
156
+ "alg_a":"ldlt",
157
+ "alg_b":"ldlt-resnet",
158
+ "n_common":121,
159
+ "n_nonzero":121,
160
+ "wins_a":28,
161
+ "wins_b":93,
162
+ "ties":0,
163
+ "win_rate_a_over_b":0.2314049587,
164
+ "mean_diff_a_minus_b":-0.0956856361,
165
+ "median_diff_a_minus_b":-0.0559161572,
166
+ "W_stat":854.0,
167
+ "p_two_sided":0.0,
168
+ "z_equiv":-7.3356079089,
169
+ "effect_size_r":0.6668734463,
170
+ "p_holm_global":0.0,
171
+ "p_holm_within_metric":0.0
172
+ },
173
+ {
174
+ "metric":"mean_cert_acc_108",
175
+ "alg_a":"ldlt",
176
+ "alg_b":"ortho",
177
+ "n_common":121,
178
+ "n_nonzero":121,
179
+ "wins_a":39,
180
+ "wins_b":82,
181
+ "ties":0,
182
+ "win_rate_a_over_b":0.3223140496,
183
+ "mean_diff_a_minus_b":-0.0765752418,
184
+ "median_diff_a_minus_b":-0.0288892186,
185
+ "W_stat":1595.0,
186
+ "p_two_sided":0.00000006,
187
+ "z_equiv":-5.4189346153,
188
+ "effect_size_r":0.4926304196,
189
+ "p_holm_global":0.0000018586,
190
+ "p_holm_within_metric":0.0000003597
191
+ },
192
+ {
193
+ "metric":"mean_cert_acc_108",
194
+ "alg_a":"ldlt",
195
+ "alg_b":"sdp",
196
+ "n_common":121,
197
+ "n_nonzero":119,
198
+ "wins_a":37,
199
+ "wins_b":82,
200
+ "ties":2,
201
+ "win_rate_a_over_b":0.3140495868,
202
+ "mean_diff_a_minus_b":-0.0611518687,
203
+ "median_diff_a_minus_b":-0.023088851,
204
+ "W_stat":1675.0,
205
+ "p_two_sided":0.0000005064,
206
+ "z_equiv":-5.0238559266,
207
+ "effect_size_r":0.4605361177,
208
+ "p_holm_global":0.0000141804,
209
+ "p_holm_within_metric":0.0000025322
210
+ },
211
+ {
212
+ "metric":"mean_cert_acc_108",
213
+ "alg_a":"ldlt-resnet",
214
+ "alg_b":"sdp",
215
+ "n_common":121,
216
+ "n_nonzero":121,
217
+ "wins_a":83,
218
+ "wins_b":38,
219
+ "ties":0,
220
+ "win_rate_a_over_b":0.6859504132,
221
+ "mean_diff_a_minus_b":0.0345337674,
222
+ "median_diff_a_minus_b":0.0187233128,
223
+ "W_stat":2059.0,
224
+ "p_two_sided":0.000024566,
225
+ "z_equiv":4.2187505287,
226
+ "effect_size_r":0.3835227753,
227
+ "p_holm_global":0.0005158858,
228
+ "p_holm_within_metric":0.000098264
229
+ },
230
+ {
231
+ "metric":"mean_cert_acc_108",
232
+ "alg_a":"ldlt-resnet",
233
+ "alg_b":"sandwich",
234
+ "n_common":121,
235
+ "n_nonzero":121,
236
+ "wins_a":43,
237
+ "wins_b":78,
238
+ "ties":0,
239
+ "win_rate_a_over_b":0.3553719008,
240
+ "mean_diff_a_minus_b":-0.0344913506,
241
+ "median_diff_a_minus_b":-0.0212858766,
242
+ "W_stat":2138.0,
243
+ "p_two_sided":0.000059595,
244
+ "z_equiv":-4.0144088415,
245
+ "effect_size_r":0.3649462583,
246
+ "p_holm_global":0.001044842,
247
+ "p_holm_within_metric":0.0001787849
248
+ },
249
+ {
250
+ "metric":"mean_cert_acc_108",
251
+ "alg_a":"ldlt-resnet",
252
+ "alg_b":"ortho",
253
+ "n_common":121,
254
+ "n_nonzero":121,
255
+ "wins_a":77,
256
+ "wins_b":44,
257
+ "ties":0,
258
+ "win_rate_a_over_b":0.6363636364,
259
+ "mean_diff_a_minus_b":0.0191103942,
260
+ "median_diff_a_minus_b":0.0181754008,
261
+ "W_stat":2506.0,
262
+ "p_two_sided":0.0021946809,
263
+ "z_equiv":3.0625387038,
264
+ "effect_size_r":0.2784126094,
265
+ "p_holm_global":0.0197521283,
266
+ "p_holm_within_metric":0.0043893618
267
+ },
268
+ {
269
+ "metric":"mean_cert_acc_108",
270
+ "alg_a":"ortho",
271
+ "alg_b":"sdp",
272
+ "n_common":121,
273
+ "n_nonzero":121,
274
+ "wins_a":65,
275
+ "wins_b":56,
276
+ "ties":0,
277
+ "win_rate_a_over_b":0.5371900826,
278
+ "mean_diff_a_minus_b":0.0154233732,
279
+ "median_diff_a_minus_b":0.0037754271,
280
+ "W_stat":3069.0,
281
+ "p_two_sided":0.1082122144,
282
+ "z_equiv":1.6062808573,
283
+ "effect_size_r":0.1460255325,
284
+ "p_holm_global":0.8656977152,
285
+ "p_holm_within_metric":0.1082122144
286
+ },
287
+ {
288
+ "metric":"mean_cert_acc_255",
289
+ "alg_a":"aol",
290
+ "alg_b":"ldlt-resnet",
291
+ "n_common":121,
292
+ "n_nonzero":112,
293
+ "wins_a":1,
294
+ "wins_b":111,
295
+ "ties":9,
296
+ "win_rate_a_over_b":0.0454545455,
297
+ "mean_diff_a_minus_b":-0.1173470639,
298
+ "median_diff_a_minus_b":-0.0569680196,
299
+ "W_stat":10.0,
300
+ "p_two_sided":5.435127869e-20,
301
+ "z_equiv":-9.1550129731,
302
+ "effect_size_r":0.8650674134,
303
+ "p_holm_global":3.587184393e-18,
304
+ "p_holm_within_metric":8.152691803e-19
305
+ },
306
+ {
307
+ "metric":"mean_cert_acc_255",
308
+ "alg_a":"aol",
309
+ "alg_b":"sandwich",
310
+ "n_common":121,
311
+ "n_nonzero":114,
312
+ "wins_a":2,
313
+ "wins_b":112,
314
+ "ties":7,
315
+ "win_rate_a_over_b":0.0454545455,
316
+ "mean_diff_a_minus_b":-0.1497530324,
317
+ "median_diff_a_minus_b":-0.0803308832,
318
+ "W_stat":62.0,
319
+ "p_two_sided":9.896991201e-20,
320
+ "z_equiv":-9.0900759336,
321
+ "effect_size_r":0.8513636146,
322
+ "p_holm_global":6.334074369e-18,
323
+ "p_holm_within_metric":1.385578768e-18
324
+ },
325
+ {
326
+ "metric":"mean_cert_acc_255",
327
+ "alg_a":"aol",
328
+ "alg_b":"sdp",
329
+ "n_common":121,
330
+ "n_nonzero":107,
331
+ "wins_a":3,
332
+ "wins_b":104,
333
+ "ties":14,
334
+ "win_rate_a_over_b":0.0826446281,
335
+ "mean_diff_a_minus_b":-0.0919241391,
336
+ "median_diff_a_minus_b":-0.0476176738,
337
+ "W_stat":23.0,
338
+ "p_two_sided":5.290354121e-19,
339
+ "z_equiv":-8.9060071017,
340
+ "effect_size_r":0.8609762037,
341
+ "p_holm_global":3.227116014e-17,
342
+ "p_holm_within_metric":6.877460357e-18
343
+ },
344
+ {
345
+ "metric":"mean_cert_acc_255",
346
+ "alg_a":"aol",
347
+ "alg_b":"ortho",
348
+ "n_common":121,
349
+ "n_nonzero":110,
350
+ "wins_a":5,
351
+ "wins_b":105,
352
+ "ties":11,
353
+ "win_rate_a_over_b":0.0867768595,
354
+ "mean_diff_a_minus_b":-0.0971526016,
355
+ "median_diff_a_minus_b":-0.036305353,
356
+ "W_stat":122.0,
357
+ "p_two_sided":2.369681608e-18,
358
+ "z_equiv":-8.7381455094,
359
+ "effect_size_r":0.8331494843,
360
+ "p_holm_global":1.421808965e-16,
361
+ "p_holm_within_metric":2.84361793e-17
362
+ },
363
+ {
364
+ "metric":"mean_cert_acc_255",
365
+ "alg_a":"ortho",
366
+ "alg_b":"sandwich",
367
+ "n_common":121,
368
+ "n_nonzero":114,
369
+ "wins_a":11,
370
+ "wins_b":103,
371
+ "ties":7,
372
+ "win_rate_a_over_b":0.1198347107,
373
+ "mean_diff_a_minus_b":-0.0526004308,
374
+ "median_diff_a_minus_b":-0.0312724002,
375
+ "W_stat":258.0,
376
+ "p_two_sided":1.390608438e-17,
377
+ "z_equiv":-8.5359064521,
378
+ "effect_size_r":0.7994608872,
379
+ "p_holm_global":8.065528942e-16,
380
+ "p_holm_within_metric":1.529669282e-16
381
+ },
382
+ {
383
+ "metric":"mean_cert_acc_255",
384
+ "alg_a":"ldlt",
385
+ "alg_b":"sandwich",
386
+ "n_common":121,
387
+ "n_nonzero":114,
388
+ "wins_a":12,
389
+ "wins_b":102,
390
+ "ties":7,
391
+ "win_rate_a_over_b":0.1280991736,
392
+ "mean_diff_a_minus_b":-0.0844428848,
393
+ "median_diff_a_minus_b":-0.0396959223,
394
+ "W_stat":342.0,
395
+ "p_two_sided":1.05518212e-16,
396
+ "z_equiv":-8.2984052458,
397
+ "effect_size_r":0.7772168612,
398
+ "p_holm_global":0.0,
399
+ "p_holm_within_metric":0.0
400
+ },
401
+ {
402
+ "metric":"mean_cert_acc_255",
403
+ "alg_a":"aol",
404
+ "alg_b":"ldlt",
405
+ "n_common":121,
406
+ "n_nonzero":93,
407
+ "wins_a":8,
408
+ "wins_b":85,
409
+ "ties":28,
410
+ "win_rate_a_over_b":0.1818181818,
411
+ "mean_diff_a_minus_b":-0.0653101477,
412
+ "median_diff_a_minus_b":-0.0160309789,
413
+ "W_stat":182.0,
414
+ "p_two_sided":0.0,
415
+ "z_equiv":-7.6746815803,
416
+ "effect_size_r":0.7958274071,
417
+ "p_holm_global":0.0,
418
+ "p_holm_within_metric":0.0
419
+ },
420
+ {
421
+ "metric":"mean_cert_acc_255",
422
+ "alg_a":"sandwich",
423
+ "alg_b":"sdp",
424
+ "n_common":121,
425
+ "n_nonzero":115,
426
+ "wins_a":90,
427
+ "wins_b":25,
428
+ "ties":6,
429
+ "win_rate_a_over_b":0.7685950413,
430
+ "mean_diff_a_minus_b":0.0578288934,
431
+ "median_diff_a_minus_b":0.0239693746,
432
+ "W_stat":977.0,
433
+ "p_two_sided":0.0,
434
+ "z_equiv":6.5792049823,
435
+ "effect_size_r":0.613514028,
436
+ "p_holm_global":0.0000000017,
437
+ "p_holm_within_metric":0.0000000004
438
+ },
439
+ {
440
+ "metric":"mean_cert_acc_255",
441
+ "alg_a":"ldlt",
442
+ "alg_b":"ldlt-resnet",
443
+ "n_common":121,
444
+ "n_nonzero":112,
445
+ "wins_a":23,
446
+ "wins_b":89,
447
+ "ties":9,
448
+ "win_rate_a_over_b":0.2272727273,
449
+ "mean_diff_a_minus_b":-0.0520369162,
450
+ "median_diff_a_minus_b":-0.0241820474,
451
+ "W_stat":927.0,
452
+ "p_two_sided":0.0000000001,
453
+ "z_equiv":-6.4928449387,
454
+ "effect_size_r":0.6135161789,
455
+ "p_holm_global":0.000000003,
456
+ "p_holm_within_metric":0.0000000006
457
+ },
458
+ {
459
+ "metric":"mean_cert_acc_255",
460
+ "alg_a":"ldlt-resnet",
461
+ "alg_b":"sdp",
462
+ "n_common":121,
463
+ "n_nonzero":115,
464
+ "wins_a":80,
465
+ "wins_b":35,
466
+ "ties":6,
467
+ "win_rate_a_over_b":0.6859504132,
468
+ "mean_diff_a_minus_b":0.0254229248,
469
+ "median_diff_a_minus_b":0.0174753755,
470
+ "W_stat":1603.0,
471
+ "p_two_sided":0.0000013504,
472
+ "z_equiv":4.8321923338,
473
+ "effect_size_r":0.4506042586,
474
+ "p_holm_global":0.0000337594,
475
+ "p_holm_within_metric":0.0000081023
476
+ },
477
+ {
478
+ "metric":"mean_cert_acc_255",
479
+ "alg_a":"ldlt",
480
+ "alg_b":"sdp",
481
+ "n_common":121,
482
+ "n_nonzero":106,
483
+ "wins_a":27,
484
+ "wins_b":79,
485
+ "ties":15,
486
+ "win_rate_a_over_b":0.2851239669,
487
+ "mean_diff_a_minus_b":-0.0266139914,
488
+ "median_diff_a_minus_b":-0.0090909088,
489
+ "W_stat":1323.0,
490
+ "p_two_sided":0.0000018824,
491
+ "z_equiv":-4.76565708,
492
+ "effect_size_r":0.4628815347,
493
+ "p_holm_global":0.0000451774,
494
+ "p_holm_within_metric":0.000009412
495
+ },
496
+ {
497
+ "metric":"mean_cert_acc_255",
498
+ "alg_a":"ldlt",
499
+ "alg_b":"ortho",
500
+ "n_common":121,
501
+ "n_nonzero":111,
502
+ "wins_a":36,
503
+ "wins_b":75,
504
+ "ties":10,
505
+ "win_rate_a_over_b":0.3388429752,
506
+ "mean_diff_a_minus_b":-0.031842454,
507
+ "median_diff_a_minus_b":-0.0084677431,
508
+ "W_stat":1741.0,
509
+ "p_two_sided":0.0000580468,
510
+ "z_equiv":-4.0206134822,
511
+ "effect_size_r":0.3816197434,
512
+ "p_holm_global":0.001044842,
513
+ "p_holm_within_metric":0.0002321871
514
+ },
515
+ {
516
+ "metric":"mean_cert_acc_255",
517
+ "alg_a":"ldlt-resnet",
518
+ "alg_b":"ortho",
519
+ "n_common":121,
520
+ "n_nonzero":117,
521
+ "wins_a":77,
522
+ "wins_b":40,
523
+ "ties":4,
524
+ "win_rate_a_over_b":0.652892562,
525
+ "mean_diff_a_minus_b":0.0201944623,
526
+ "median_diff_a_minus_b":0.0131578948,
527
+ "W_stat":1982.0,
528
+ "p_two_sided":0.0000645869,
529
+ "z_equiv":3.9953934287,
530
+ "effect_size_r":0.3693742531,
531
+ "p_holm_global":0.001044842,
532
+ "p_holm_within_metric":0.0002321871
533
+ },
534
+ {
535
+ "metric":"mean_cert_acc_255",
536
+ "alg_a":"ldlt-resnet",
537
+ "alg_b":"sandwich",
538
+ "n_common":121,
539
+ "n_nonzero":118,
540
+ "wins_a":45,
541
+ "wins_b":73,
542
+ "ties":3,
543
+ "win_rate_a_over_b":0.3842975207,
544
+ "mean_diff_a_minus_b":-0.0324059685,
545
+ "median_diff_a_minus_b":-0.0077698529,
546
+ "W_stat":2234.0,
547
+ "p_two_sided":0.0006111136,
548
+ "z_equiv":-3.426633354,
549
+ "effect_size_r":0.3154471691,
550
+ "p_holm_global":0.0072473427,
551
+ "p_holm_within_metric":0.0012222272
552
+ },
553
+ {
554
+ "metric":"mean_cert_acc_255",
555
+ "alg_a":"ortho",
556
+ "alg_b":"sdp",
557
+ "n_common":121,
558
+ "n_nonzero":113,
559
+ "wins_a":55,
560
+ "wins_b":58,
561
+ "ties":8,
562
+ "win_rate_a_over_b":0.4876033058,
563
+ "mean_diff_a_minus_b":0.0052284626,
564
+ "median_diff_a_minus_b":0.0,
565
+ "W_stat":3068.0,
566
+ "p_two_sided":0.6632312125,
567
+ "z_equiv":0.4354563548,
568
+ "effect_size_r":0.040964288,
569
+ "p_holm_global":1.0,
570
+ "p_holm_within_metric":0.6632312125
571
+ },
572
+ {
573
+ "metric":"mean_cert_acc_36",
574
+ "alg_a":"aol",
575
+ "alg_b":"ldlt-resnet",
576
+ "n_common":121,
577
+ "n_nonzero":121,
578
+ "wins_a":6,
579
+ "wins_b":115,
580
+ "ties":0,
581
+ "win_rate_a_over_b":0.0495867769,
582
+ "mean_diff_a_minus_b":-0.2438353373,
583
+ "median_diff_a_minus_b":-0.231873706,
584
+ "W_stat":84.0,
585
+ "p_two_sided":1.086095964e-20,
586
+ "z_equiv":-9.3272927078,
587
+ "effect_size_r":0.8479357007,
588
+ "p_holm_global":7.711281345e-19,
589
+ "p_holm_within_metric":1.629143946e-19
590
+ },
591
+ {
592
+ "metric":"mean_cert_acc_36",
593
+ "alg_a":"aol",
594
+ "alg_b":"sandwich",
595
+ "n_common":121,
596
+ "n_nonzero":121,
597
+ "wins_a":6,
598
+ "wins_b":115,
599
+ "ties":0,
600
+ "win_rate_a_over_b":0.0495867769,
601
+ "mean_diff_a_minus_b":-0.2706310854,
602
+ "median_diff_a_minus_b":-0.2436474561,
603
+ "W_stat":88.0,
604
+ "p_two_sided":1.197367966e-20,
605
+ "z_equiv":-9.3169462933,
606
+ "effect_size_r":0.8469951176,
607
+ "p_holm_global":8.381575764e-19,
608
+ "p_holm_within_metric":1.676315153e-19
609
+ },
610
+ {
611
+ "metric":"mean_cert_acc_36",
612
+ "alg_a":"aol",
613
+ "alg_b":"sdp",
614
+ "n_common":121,
615
+ "n_nonzero":121,
616
+ "wins_a":6,
617
+ "wins_b":115,
618
+ "ties":0,
619
+ "win_rate_a_over_b":0.0495867769,
620
+ "mean_diff_a_minus_b":-0.2215721657,
621
+ "median_diff_a_minus_b":-0.1912159696,
622
+ "W_stat":145.0,
623
+ "p_two_sided":4.751745038e-20,
624
+ "z_equiv":-9.1695098861,
625
+ "effect_size_r":0.8335918078,
626
+ "p_holm_global":3.183669175e-18,
627
+ "p_holm_within_metric":6.177268549e-19
628
+ },
629
+ {
630
+ "metric":"mean_cert_acc_36",
631
+ "alg_a":"aol",
632
+ "alg_b":"ortho",
633
+ "n_common":121,
634
+ "n_nonzero":121,
635
+ "wins_a":10,
636
+ "wins_b":111,
637
+ "ties":0,
638
+ "win_rate_a_over_b":0.0826446281,
639
+ "mean_diff_a_minus_b":-0.2304439908,
640
+ "median_diff_a_minus_b":-0.218675293,
641
+ "W_stat":196.0,
642
+ "p_two_sided":1.60159291e-19,
643
+ "z_equiv":-9.0375931007,
644
+ "effect_size_r":0.8215993728,
645
+ "p_holm_global":1.009003533e-17,
646
+ "p_holm_within_metric":1.921911492e-18
647
+ },
648
+ {
649
+ "metric":"mean_cert_acc_36",
650
+ "alg_a":"aol",
651
+ "alg_b":"ldlt",
652
+ "n_common":121,
653
+ "n_nonzero":121,
654
+ "wins_a":16,
655
+ "wins_b":105,
656
+ "ties":0,
657
+ "win_rate_a_over_b":0.132231405,
658
+ "mean_diff_a_minus_b":-0.1632065656,
659
+ "median_diff_a_minus_b":-0.1217573732,
660
+ "W_stat":579.0,
661
+ "p_two_sided":8.490093064e-16,
662
+ "z_equiv":-8.0469239085,
663
+ "effect_size_r":0.7315385371,
664
+ "p_holm_global":0.0,
665
+ "p_holm_within_metric":0.0
666
+ },
667
+ {
668
+ "metric":"mean_cert_acc_36",
669
+ "alg_a":"ldlt",
670
+ "alg_b":"sandwich",
671
+ "n_common":121,
672
+ "n_nonzero":121,
673
+ "wins_a":28,
674
+ "wins_b":93,
675
+ "ties":0,
676
+ "win_rate_a_over_b":0.2314049587,
677
+ "mean_diff_a_minus_b":-0.1074245198,
678
+ "median_diff_a_minus_b":-0.0510568023,
679
+ "W_stat":884.0,
680
+ "p_two_sided":0.0,
681
+ "z_equiv":-7.2580097998,
682
+ "effect_size_r":0.6598190727,
683
+ "p_holm_global":0.0,
684
+ "p_holm_within_metric":0.0
685
+ },
686
+ {
687
+ "metric":"mean_cert_acc_36",
688
+ "alg_a":"sandwich",
689
+ "alg_b":"sdp",
690
+ "n_common":121,
691
+ "n_nonzero":121,
692
+ "wins_a":97,
693
+ "wins_b":24,
694
+ "ties":0,
695
+ "win_rate_a_over_b":0.8016528926,
696
+ "mean_diff_a_minus_b":0.0490589197,
697
+ "median_diff_a_minus_b":0.0198676884,
698
+ "W_stat":1005.0,
699
+ "p_two_sided":0.0,
700
+ "z_equiv":6.94503076,
701
+ "effect_size_r":0.6313664327,
702
+ "p_holm_global":0.0000000002,
703
+ "p_holm_within_metric":0.0
704
+ },
705
+ {
706
+ "metric":"mean_cert_acc_36",
707
+ "alg_a":"ortho",
708
+ "alg_b":"sandwich",
709
+ "n_common":121,
710
+ "n_nonzero":120,
711
+ "wins_a":24,
712
+ "wins_b":96,
713
+ "ties":1,
714
+ "win_rate_a_over_b":0.2024793388,
715
+ "mean_diff_a_minus_b":-0.0401870946,
716
+ "median_diff_a_minus_b":-0.0274580419,
717
+ "W_stat":1002.0,
718
+ "p_two_sided":0.0,
719
+ "z_equiv":-6.8810785592,
720
+ "effect_size_r":0.6281536578,
721
+ "p_holm_global":0.0000000002,
722
+ "p_holm_within_metric":0.0
723
+ },
724
+ {
725
+ "metric":"mean_cert_acc_36",
726
+ "alg_a":"ldlt",
727
+ "alg_b":"ldlt-resnet",
728
+ "n_common":121,
729
+ "n_nonzero":121,
730
+ "wins_a":39,
731
+ "wins_b":82,
732
+ "ties":0,
733
+ "win_rate_a_over_b":0.3223140496,
734
+ "mean_diff_a_minus_b":-0.0806287717,
735
+ "median_diff_a_minus_b":-0.0372283832,
736
+ "W_stat":1356.0,
737
+ "p_two_sided":0.0000000016,
738
+ "z_equiv":-6.0371328841,
739
+ "effect_size_r":0.5488302622,
740
+ "p_holm_global":0.0000000518,
741
+ "p_holm_within_metric":0.000000011
742
+ },
743
+ {
744
+ "metric":"mean_cert_acc_36",
745
+ "alg_a":"ldlt",
746
+ "alg_b":"ortho",
747
+ "n_common":121,
748
+ "n_nonzero":121,
749
+ "wins_a":47,
750
+ "wins_b":74,
751
+ "ties":0,
752
+ "win_rate_a_over_b":0.3884297521,
753
+ "mean_diff_a_minus_b":-0.0672374252,
754
+ "median_diff_a_minus_b":-0.0189958066,
755
+ "W_stat":1855.0,
756
+ "p_two_sided":0.0000020705,
757
+ "z_equiv":-4.7464176702,
758
+ "effect_size_r":0.4314925155,
759
+ "p_holm_global":0.0000476217,
760
+ "p_holm_within_metric":0.0000124231
761
+ },
762
+ {
763
+ "metric":"mean_cert_acc_36",
764
+ "alg_a":"ldlt",
765
+ "alg_b":"sdp",
766
+ "n_common":121,
767
+ "n_nonzero":121,
768
+ "wins_a":49,
769
+ "wins_b":72,
770
+ "ties":0,
771
+ "win_rate_a_over_b":0.4049586777,
772
+ "mean_diff_a_minus_b":-0.0583656001,
773
+ "median_diff_a_minus_b":-0.0074773338,
774
+ "W_stat":2119.0,
775
+ "p_two_sided":0.0000483311,
776
+ "z_equiv":-4.0635543106,
777
+ "effect_size_r":0.3694140282,
778
+ "p_holm_global":0.0009182903,
779
+ "p_holm_within_metric":0.0002416554
780
+ },
781
+ {
782
+ "metric":"mean_cert_acc_36",
783
+ "alg_a":"ldlt-resnet",
784
+ "alg_b":"sandwich",
785
+ "n_common":121,
786
+ "n_nonzero":121,
787
+ "wins_a":41,
788
+ "wins_b":80,
789
+ "ties":0,
790
+ "win_rate_a_over_b":0.3388429752,
791
+ "mean_diff_a_minus_b":-0.0267957481,
792
+ "median_diff_a_minus_b":-0.0168480575,
793
+ "W_stat":2142.0,
794
+ "p_two_sided":0.0000622639,
795
+ "z_equiv":-4.004062427,
796
+ "effect_size_r":0.3640056752,
797
+ "p_holm_global":0.001044842,
798
+ "p_holm_within_metric":0.0002490557
799
+ },
800
+ {
801
+ "metric":"mean_cert_acc_36",
802
+ "alg_a":"ldlt-resnet",
803
+ "alg_b":"sdp",
804
+ "n_common":121,
805
+ "n_nonzero":120,
806
+ "wins_a":81,
807
+ "wins_b":39,
808
+ "ties":1,
809
+ "win_rate_a_over_b":0.673553719,
810
+ "mean_diff_a_minus_b":0.0222631716,
811
+ "median_diff_a_minus_b":0.0118150264,
812
+ "W_stat":2104.0,
813
+ "p_two_sided":0.0000646711,
814
+ "z_equiv":3.9950848115,
815
+ "effect_size_r":0.3646996784,
816
+ "p_holm_global":0.001044842,
817
+ "p_holm_within_metric":0.0002490557
818
+ },
819
+ {
820
+ "metric":"mean_cert_acc_36",
821
+ "alg_a":"ldlt-resnet",
822
+ "alg_b":"ortho",
823
+ "n_common":121,
824
+ "n_nonzero":121,
825
+ "wins_a":78,
826
+ "wins_b":43,
827
+ "ties":0,
828
+ "win_rate_a_over_b":0.6446280992,
829
+ "mean_diff_a_minus_b":0.0133913465,
830
+ "median_diff_a_minus_b":0.0125584751,
831
+ "W_stat":2429.0,
832
+ "p_two_sided":0.0011074347,
833
+ "z_equiv":3.2617071837,
834
+ "effect_size_r":0.2965188349,
835
+ "p_holm_global":0.0110743473,
836
+ "p_holm_within_metric":0.0022148695
837
+ },
838
+ {
839
+ "metric":"mean_cert_acc_36",
840
+ "alg_a":"ortho",
841
+ "alg_b":"sdp",
842
+ "n_common":121,
843
+ "n_nonzero":121,
844
+ "wins_a":60,
845
+ "wins_b":61,
846
+ "ties":0,
847
+ "win_rate_a_over_b":0.4958677686,
848
+ "mean_diff_a_minus_b":0.0088718251,
849
+ "median_diff_a_minus_b":-0.0004384369,
850
+ "W_stat":3076.0,
851
+ "p_two_sided":0.1122468558,
852
+ "z_equiv":1.5881746319,
853
+ "effect_size_r":0.144379512,
854
+ "p_holm_global":0.8656977152,
855
+ "p_holm_within_metric":0.1122468558
856
+ },
857
+ {
858
+ "metric":"mean_cert_acc_72",
859
+ "alg_a":"aol",
860
+ "alg_b":"sandwich",
861
+ "n_common":121,
862
+ "n_nonzero":121,
863
+ "wins_a":7,
864
+ "wins_b":114,
865
+ "ties":0,
866
+ "win_rate_a_over_b":0.0578512397,
867
+ "mean_diff_a_minus_b":-0.2932351713,
868
+ "median_diff_a_minus_b":-0.2614153504,
869
+ "W_stat":107.0,
870
+ "p_two_sided":1.900233353e-20,
871
+ "z_equiv":-9.2678008242,
872
+ "effect_size_r":0.8425273477,
873
+ "p_holm_global":1.311161014e-18,
874
+ "p_holm_within_metric":2.85035003e-19
875
+ },
876
+ {
877
+ "metric":"mean_cert_acc_72",
878
+ "alg_a":"aol",
879
+ "alg_b":"ldlt-resnet",
880
+ "n_common":121,
881
+ "n_nonzero":121,
882
+ "wins_a":5,
883
+ "wins_b":116,
884
+ "ties":0,
885
+ "win_rate_a_over_b":0.041322314,
886
+ "mean_diff_a_minus_b":-0.2631359926,
887
+ "median_diff_a_minus_b":-0.2326939851,
888
+ "W_stat":116.0,
889
+ "p_two_sided":2.362958291e-20,
890
+ "z_equiv":-9.2445213915,
891
+ "effect_size_r":0.8404110356,
892
+ "p_holm_global":1.606811638e-18,
893
+ "p_holm_within_metric":3.308141607e-19
894
+ },
895
+ {
896
+ "metric":"mean_cert_acc_72",
897
+ "alg_a":"aol",
898
+ "alg_b":"sdp",
899
+ "n_common":121,
900
+ "n_nonzero":121,
901
+ "wins_a":5,
902
+ "wins_b":116,
903
+ "ties":0,
904
+ "win_rate_a_over_b":0.041322314,
905
+ "mean_diff_a_minus_b":-0.2314897135,
906
+ "median_diff_a_minus_b":-0.1927602664,
907
+ "W_stat":162.0,
908
+ "p_two_sided":7.138107477e-20,
909
+ "z_equiv":-9.1255376243,
910
+ "effect_size_r":0.8295943295,
911
+ "p_holm_global":4.63976986e-18,
912
+ "p_holm_within_metric":9.27953972e-19
913
+ },
914
+ {
915
+ "metric":"mean_cert_acc_72",
916
+ "alg_a":"aol",
917
+ "alg_b":"ortho",
918
+ "n_common":121,
919
+ "n_nonzero":121,
920
+ "wins_a":11,
921
+ "wins_b":110,
922
+ "ties":0,
923
+ "win_rate_a_over_b":0.0909090909,
924
+ "mean_diff_a_minus_b":-0.2412404211,
925
+ "median_diff_a_minus_b":-0.2063548118,
926
+ "W_stat":214.0,
927
+ "p_two_sided":2.449147439e-19,
928
+ "z_equiv":-8.9910342353,
929
+ "effect_size_r":0.8173667487,
930
+ "p_holm_global":1.518471412e-17,
931
+ "p_holm_within_metric":2.938976926e-18
932
+ },
933
+ {
934
+ "metric":"mean_cert_acc_72",
935
+ "alg_a":"aol",
936
+ "alg_b":"ldlt",
937
+ "n_common":121,
938
+ "n_nonzero":119,
939
+ "wins_a":19,
940
+ "wins_b":100,
941
+ "ties":2,
942
+ "win_rate_a_over_b":0.1652892562,
943
+ "mean_diff_a_minus_b":-0.1632772665,
944
+ "median_diff_a_minus_b":-0.125,
945
+ "W_stat":557.0,
946
+ "p_two_sided":0.0,
947
+ "z_equiv":-7.988580617,
948
+ "effect_size_r":0.7323119845,
949
+ "p_holm_global":0.0,
950
+ "p_holm_within_metric":0.0
951
+ },
952
+ {
953
+ "metric":"mean_cert_acc_72",
954
+ "alg_a":"ldlt",
955
+ "alg_b":"sandwich",
956
+ "n_common":121,
957
+ "n_nonzero":121,
958
+ "wins_a":20,
959
+ "wins_b":101,
960
+ "ties":0,
961
+ "win_rate_a_over_b":0.1652892562,
962
+ "mean_diff_a_minus_b":-0.1299579048,
963
+ "median_diff_a_minus_b":-0.0772011476,
964
+ "W_stat":607.0,
965
+ "p_two_sided":0.0,
966
+ "z_equiv":-7.9744990067,
967
+ "effect_size_r":0.7249544552,
968
+ "p_holm_global":0.0,
969
+ "p_holm_within_metric":0.0
970
+ },
971
+ {
972
+ "metric":"mean_cert_acc_72",
973
+ "alg_a":"ortho",
974
+ "alg_b":"sandwich",
975
+ "n_common":121,
976
+ "n_nonzero":120,
977
+ "wins_a":19,
978
+ "wins_b":101,
979
+ "ties":1,
980
+ "win_rate_a_over_b":0.1611570248,
981
+ "mean_diff_a_minus_b":-0.0519947502,
982
+ "median_diff_a_minus_b":-0.034627907,
983
+ "W_stat":601.0,
984
+ "p_two_sided":0.0,
985
+ "z_equiv":-7.9312450682,
986
+ "effect_size_r":0.7240203055,
987
+ "p_holm_global":0.0,
988
+ "p_holm_within_metric":0.0
989
+ },
990
+ {
991
+ "metric":"mean_cert_acc_72",
992
+ "alg_a":"sandwich",
993
+ "alg_b":"sdp",
994
+ "n_common":121,
995
+ "n_nonzero":120,
996
+ "wins_a":95,
997
+ "wins_b":25,
998
+ "ties":1,
999
+ "win_rate_a_over_b":0.7892561983,
1000
+ "mean_diff_a_minus_b":0.0617454578,
1001
+ "median_diff_a_minus_b":0.0392772481,
1002
+ "W_stat":801.0,
1003
+ "p_two_sided":0.0,
1004
+ "z_equiv":7.4074712483,
1005
+ "effect_size_r":0.6762065161,
1006
+ "p_holm_global":0.0,
1007
+ "p_holm_within_metric":0.0
1008
+ },
1009
+ {
1010
+ "metric":"mean_cert_acc_72",
1011
+ "alg_a":"ldlt",
1012
+ "alg_b":"ldlt-resnet",
1013
+ "n_common":121,
1014
+ "n_nonzero":121,
1015
+ "wins_a":30,
1016
+ "wins_b":91,
1017
+ "ties":0,
1018
+ "win_rate_a_over_b":0.2479338843,
1019
+ "mean_diff_a_minus_b":-0.0998587261,
1020
+ "median_diff_a_minus_b":-0.062678976,
1021
+ "W_stat":930.0,
1022
+ "p_two_sided":0.0,
1023
+ "z_equiv":-7.1390260326,
1024
+ "effect_size_r":0.6490023666,
1025
+ "p_holm_global":0.0,
1026
+ "p_holm_within_metric":0.0
1027
+ },
1028
+ {
1029
+ "metric":"mean_cert_acc_72",
1030
+ "alg_a":"ldlt",
1031
+ "alg_b":"ortho",
1032
+ "n_common":121,
1033
+ "n_nonzero":121,
1034
+ "wins_a":42,
1035
+ "wins_b":79,
1036
+ "ties":0,
1037
+ "win_rate_a_over_b":0.347107438,
1038
+ "mean_diff_a_minus_b":-0.0779631546,
1039
+ "median_diff_a_minus_b":-0.020989418,
1040
+ "W_stat":1696.0,
1041
+ "p_two_sided":0.00000025,
1042
+ "z_equiv":-5.1576876482,
1043
+ "effect_size_r":0.4688806953,
1044
+ "p_holm_global":0.0000075005,
1045
+ "p_holm_within_metric":0.0000015001
1046
+ },
1047
+ {
1048
+ "metric":"mean_cert_acc_72",
1049
+ "alg_a":"ldlt",
1050
+ "alg_b":"sdp",
1051
+ "n_common":121,
1052
+ "n_nonzero":121,
1053
+ "wins_a":42,
1054
+ "wins_b":79,
1055
+ "ties":0,
1056
+ "win_rate_a_over_b":0.347107438,
1057
+ "mean_diff_a_minus_b":-0.068212447,
1058
+ "median_diff_a_minus_b":-0.0213127583,
1059
+ "W_stat":1776.0,
1060
+ "p_two_sided":0.0000007392,
1061
+ "z_equiv":-4.9507593574,
1062
+ "effect_size_r":0.4500690325,
1063
+ "p_holm_global":0.0000199596,
1064
+ "p_holm_within_metric":0.0000036962
1065
+ },
1066
+ {
1067
+ "metric":"mean_cert_acc_72",
1068
+ "alg_a":"ldlt-resnet",
1069
+ "alg_b":"sdp",
1070
+ "n_common":121,
1071
+ "n_nonzero":121,
1072
+ "wins_a":83,
1073
+ "wins_b":38,
1074
+ "ties":0,
1075
+ "win_rate_a_over_b":0.6859504132,
1076
+ "mean_diff_a_minus_b":0.0316462791,
1077
+ "median_diff_a_minus_b":0.0191756338,
1078
+ "W_stat":1938.0,
1079
+ "p_two_sided":0.0000058503,
1080
+ "z_equiv":4.5317295685,
1081
+ "effect_size_r":0.4119754153,
1082
+ "p_holm_global":0.000128706,
1083
+ "p_holm_within_metric":0.0000234011
1084
+ },
1085
+ {
1086
+ "metric":"mean_cert_acc_72",
1087
+ "alg_a":"ldlt-resnet",
1088
+ "alg_b":"sandwich",
1089
+ "n_common":121,
1090
+ "n_nonzero":121,
1091
+ "wins_a":40,
1092
+ "wins_b":81,
1093
+ "ties":0,
1094
+ "win_rate_a_over_b":0.3305785124,
1095
+ "mean_diff_a_minus_b":-0.0300991787,
1096
+ "median_diff_a_minus_b":-0.0196958482,
1097
+ "W_stat":2062.0,
1098
+ "p_two_sided":0.0000254253,
1099
+ "z_equiv":-4.2109907178,
1100
+ "effect_size_r":0.382817338,
1101
+ "p_holm_global":0.0005158858,
1102
+ "p_holm_within_metric":0.000076276
1103
+ },
1104
+ {
1105
+ "metric":"mean_cert_acc_72",
1106
+ "alg_a":"ldlt-resnet",
1107
+ "alg_b":"ortho",
1108
+ "n_common":121,
1109
+ "n_nonzero":121,
1110
+ "wins_a":78,
1111
+ "wins_b":43,
1112
+ "ties":0,
1113
+ "win_rate_a_over_b":0.6446280992,
1114
+ "mean_diff_a_minus_b":0.0218955715,
1115
+ "median_diff_a_minus_b":0.0177944824,
1116
+ "W_stat":2306.0,
1117
+ "p_two_sided":0.0003437791,
1118
+ "z_equiv":3.5798594309,
1119
+ "effect_size_r":0.3254417664,
1120
+ "p_holm_global":0.0044691282,
1121
+ "p_holm_within_metric":0.0006875582
1122
+ },
1123
+ {
1124
+ "metric":"mean_cert_acc_72",
1125
+ "alg_a":"ortho",
1126
+ "alg_b":"sdp",
1127
+ "n_common":121,
1128
+ "n_nonzero":121,
1129
+ "wins_a":66,
1130
+ "wins_b":55,
1131
+ "ties":0,
1132
+ "win_rate_a_over_b":0.5454545455,
1133
+ "mean_diff_a_minus_b":0.0097507076,
1134
+ "median_diff_a_minus_b":0.0040983558,
1135
+ "W_stat":3178.0,
1136
+ "p_two_sided":0.1853897994,
1137
+ "z_equiv":1.3243410611,
1138
+ "effect_size_r":0.1203946419,
1139
+ "p_holm_global":0.8656977152,
1140
+ "p_holm_within_metric":0.1853897994
1141
+ },
1142
+ {
1143
+ "metric":"mean_test_acc",
1144
+ "alg_a":"aol",
1145
+ "alg_b":"ldlt",
1146
+ "n_common":121,
1147
+ "n_nonzero":121,
1148
+ "wins_a":16,
1149
+ "wins_b":105,
1150
+ "ties":0,
1151
+ "win_rate_a_over_b":0.132231405,
1152
+ "mean_diff_a_minus_b":-0.0928145234,
1153
+ "median_diff_a_minus_b":-0.0567989122,
1154
+ "W_stat":412.0,
1155
+ "p_two_sided":2.273589155e-17,
1156
+ "z_equiv":-8.4788867156,
1157
+ "effect_size_r":0.7708078832,
1158
+ "p_holm_global":0.0,
1159
+ "p_holm_within_metric":3.410383732e-16
1160
+ },
1161
+ {
1162
+ "metric":"mean_test_acc",
1163
+ "alg_a":"aol",
1164
+ "alg_b":"sandwich",
1165
+ "n_common":121,
1166
+ "n_nonzero":121,
1167
+ "wins_a":18,
1168
+ "wins_b":103,
1169
+ "ties":0,
1170
+ "win_rate_a_over_b":0.1487603306,
1171
+ "mean_diff_a_minus_b":-0.0920325933,
1172
+ "median_diff_a_minus_b":-0.0594664378,
1173
+ "W_stat":518.0,
1174
+ "p_two_sided":2.311544437e-16,
1175
+ "z_equiv":-8.2047067302,
1176
+ "effect_size_r":0.74588243,
1177
+ "p_holm_global":0.0,
1178
+ "p_holm_within_metric":0.0
1179
+ },
1180
+ {
1181
+ "metric":"mean_test_acc",
1182
+ "alg_a":"aol",
1183
+ "alg_b":"sdp",
1184
+ "n_common":121,
1185
+ "n_nonzero":121,
1186
+ "wins_a":22,
1187
+ "wins_b":99,
1188
+ "ties":0,
1189
+ "win_rate_a_over_b":0.1818181818,
1190
+ "mean_diff_a_minus_b":-0.0683567538,
1191
+ "median_diff_a_minus_b":-0.0351344055,
1192
+ "W_stat":806.0,
1193
+ "p_two_sided":0.0,
1194
+ "z_equiv":-7.4597648834,
1195
+ "effect_size_r":0.6781604439,
1196
+ "p_holm_global":0.0,
1197
+ "p_holm_within_metric":0.0
1198
+ },
1199
+ {
1200
+ "metric":"mean_test_acc",
1201
+ "alg_a":"aol",
1202
+ "alg_b":"ortho",
1203
+ "n_common":121,
1204
+ "n_nonzero":121,
1205
+ "wins_a":27,
1206
+ "wins_b":94,
1207
+ "ties":0,
1208
+ "win_rate_a_over_b":0.2231404959,
1209
+ "mean_diff_a_minus_b":-0.0674542894,
1210
+ "median_diff_a_minus_b":-0.0264984947,
1211
+ "W_stat":971.0,
1212
+ "p_two_sided":0.0,
1213
+ "z_equiv":-7.0329752836,
1214
+ "effect_size_r":0.6393613894,
1215
+ "p_holm_global":0.0000000001,
1216
+ "p_holm_within_metric":0.0
1217
+ },
1218
+ {
1219
+ "metric":"mean_test_acc",
1220
+ "alg_a":"aol",
1221
+ "alg_b":"ldlt-resnet",
1222
+ "n_common":121,
1223
+ "n_nonzero":121,
1224
+ "wins_a":25,
1225
+ "wins_b":96,
1226
+ "ties":0,
1227
+ "win_rate_a_over_b":0.2066115702,
1228
+ "mean_diff_a_minus_b":-0.0727332781,
1229
+ "median_diff_a_minus_b":-0.0313389237,
1230
+ "W_stat":1013.0,
1231
+ "p_two_sided":0.0,
1232
+ "z_equiv":-6.9243379309,
1233
+ "effect_size_r":0.6294852664,
1234
+ "p_holm_global":0.0000000002,
1235
+ "p_holm_within_metric":0.0
1236
+ },
1237
+ {
1238
+ "metric":"mean_test_acc",
1239
+ "alg_a":"ortho",
1240
+ "alg_b":"sandwich",
1241
+ "n_common":121,
1242
+ "n_nonzero":120,
1243
+ "wins_a":31,
1244
+ "wins_b":89,
1245
+ "ties":1,
1246
+ "win_rate_a_over_b":0.2603305785,
1247
+ "mean_diff_a_minus_b":-0.0245783039,
1248
+ "median_diff_a_minus_b":-0.0125617273,
1249
+ "W_stat":1269.0,
1250
+ "p_two_sided":0.0000000006,
1251
+ "z_equiv":-6.1818405096,
1252
+ "effect_size_r":0.564322249,
1253
+ "p_holm_global":0.0000000222,
1254
+ "p_holm_within_metric":0.0000000063
1255
+ },
1256
+ {
1257
+ "metric":"mean_test_acc",
1258
+ "alg_a":"ldlt",
1259
+ "alg_b":"ortho",
1260
+ "n_common":121,
1261
+ "n_nonzero":121,
1262
+ "wins_a":94,
1263
+ "wins_b":27,
1264
+ "ties":0,
1265
+ "win_rate_a_over_b":0.7768595041,
1266
+ "mean_diff_a_minus_b":0.025360234,
1267
+ "median_diff_a_minus_b":0.013893891,
1268
+ "W_stat":1309.0,
1269
+ "p_two_sided":0.0000000007,
1270
+ "z_equiv":6.158703255,
1271
+ "effect_size_r":0.5598821141,
1272
+ "p_holm_global":0.0000000249,
1273
+ "p_holm_within_metric":0.0000000066
1274
+ },
1275
+ {
1276
+ "metric":"mean_test_acc",
1277
+ "alg_a":"ldlt",
1278
+ "alg_b":"sdp",
1279
+ "n_common":121,
1280
+ "n_nonzero":121,
1281
+ "wins_a":86,
1282
+ "wins_b":35,
1283
+ "ties":0,
1284
+ "win_rate_a_over_b":0.7107438017,
1285
+ "mean_diff_a_minus_b":0.0244577696,
1286
+ "median_diff_a_minus_b":0.0110695032,
1287
+ "W_stat":1503.0,
1288
+ "p_two_sided":0.0000000154,
1289
+ "z_equiv":5.6569021498,
1290
+ "effect_size_r":0.5142638318,
1291
+ "p_holm_global":0.0000004932,
1292
+ "p_holm_within_metric":0.0000001233
1293
+ },
1294
+ {
1295
+ "metric":"mean_test_acc",
1296
+ "alg_a":"ldlt",
1297
+ "alg_b":"ldlt-resnet",
1298
+ "n_common":121,
1299
+ "n_nonzero":120,
1300
+ "wins_a":87,
1301
+ "wins_b":33,
1302
+ "ties":1,
1303
+ "win_rate_a_over_b":0.7231404959,
1304
+ "mean_diff_a_minus_b":0.0200812453,
1305
+ "median_diff_a_minus_b":0.0108439309,
1306
+ "W_stat":1689.0,
1307
+ "p_two_sided":0.0000003736,
1308
+ "z_equiv":5.0819154878,
1309
+ "effect_size_r":0.4639132913,
1310
+ "p_holm_global":0.0000108358,
1311
+ "p_holm_within_metric":0.0000026155
1312
+ },
1313
+ {
1314
+ "metric":"mean_test_acc",
1315
+ "alg_a":"sandwich",
1316
+ "alg_b":"sdp",
1317
+ "n_common":121,
1318
+ "n_nonzero":121,
1319
+ "wins_a":83,
1320
+ "wins_b":38,
1321
+ "ties":0,
1322
+ "win_rate_a_over_b":0.6859504132,
1323
+ "mean_diff_a_minus_b":0.0236758395,
1324
+ "median_diff_a_minus_b":0.0089801928,
1325
+ "W_stat":1789.0,
1326
+ "p_two_sided":0.0000008782,
1327
+ "z_equiv":4.9171335102,
1328
+ "effect_size_r":0.4470121373,
1329
+ "p_holm_global":0.0000228334,
1330
+ "p_holm_within_metric":0.0000052692
1331
+ },
1332
+ {
1333
+ "metric":"mean_test_acc",
1334
+ "alg_a":"ldlt-resnet",
1335
+ "alg_b":"sandwich",
1336
+ "n_common":121,
1337
+ "n_nonzero":121,
1338
+ "wins_a":43,
1339
+ "wins_b":78,
1340
+ "ties":0,
1341
+ "win_rate_a_over_b":0.3553719008,
1342
+ "mean_diff_a_minus_b":-0.0192993151,
1343
+ "median_diff_a_minus_b":-0.0067946254,
1344
+ "W_stat":2364.0,
1345
+ "p_two_sided":0.0006039452,
1346
+ "z_equiv":-3.42983642,
1347
+ "effect_size_r":0.3118033109,
1348
+ "p_holm_global":0.0072473427,
1349
+ "p_holm_within_metric":0.0030197261
1350
+ },
1351
+ {
1352
+ "metric":"mean_test_acc",
1353
+ "alg_a":"ldlt-resnet",
1354
+ "alg_b":"sdp",
1355
+ "n_common":121,
1356
+ "n_nonzero":120,
1357
+ "wins_a":66,
1358
+ "wins_b":54,
1359
+ "ties":1,
1360
+ "win_rate_a_over_b":0.5495867769,
1361
+ "mean_diff_a_minus_b":0.0043765243,
1362
+ "median_diff_a_minus_b":0.0019017287,
1363
+ "W_stat":3070.0,
1364
+ "p_two_sided":0.1428507422,
1365
+ "z_equiv":1.4652572612,
1366
+ "effect_size_r":0.1337590758,
1367
+ "p_holm_global":0.8656977152,
1368
+ "p_holm_within_metric":0.5714029689
1369
+ },
1370
+ {
1371
+ "metric":"mean_test_acc",
1372
+ "alg_a":"ldlt-resnet",
1373
+ "alg_b":"ortho",
1374
+ "n_common":121,
1375
+ "n_nonzero":121,
1376
+ "wins_a":71,
1377
+ "wins_b":50,
1378
+ "ties":0,
1379
+ "win_rate_a_over_b":0.5867768595,
1380
+ "mean_diff_a_minus_b":0.0052789887,
1381
+ "median_diff_a_minus_b":0.002452642,
1382
+ "W_stat":3138.0,
1383
+ "p_two_sided":0.1533479338,
1384
+ "z_equiv":1.4278052065,
1385
+ "effect_size_r":0.1298004733,
1386
+ "p_holm_global":0.8656977152,
1387
+ "p_holm_within_metric":0.5714029689
1388
+ },
1389
+ {
1390
+ "metric":"mean_test_acc",
1391
+ "alg_a":"ortho",
1392
+ "alg_b":"sdp",
1393
+ "n_common":121,
1394
+ "n_nonzero":121,
1395
+ "wins_a":60,
1396
+ "wins_b":61,
1397
+ "ties":0,
1398
+ "win_rate_a_over_b":0.4958677686,
1399
+ "mean_diff_a_minus_b":-0.0009024644,
1400
+ "median_diff_a_minus_b":-0.0003659998,
1401
+ "W_stat":3623.0,
1402
+ "p_two_sided":0.8624137031,
1403
+ "z_equiv":-0.1733024435,
1404
+ "effect_size_r":0.0157547676,
1405
+ "p_holm_global":1.0,
1406
+ "p_holm_within_metric":1.0
1407
+ },
1408
+ {
1409
+ "metric":"mean_test_acc",
1410
+ "alg_a":"ldlt",
1411
+ "alg_b":"sandwich",
1412
+ "n_common":121,
1413
+ "n_nonzero":121,
1414
+ "wins_a":59,
1415
+ "wins_b":62,
1416
+ "ties":0,
1417
+ "win_rate_a_over_b":0.4876033058,
1418
+ "mean_diff_a_minus_b":0.0007819301,
1419
+ "median_diff_a_minus_b":-0.0001641521,
1420
+ "W_stat":3624.0,
1421
+ "p_two_sided":0.8644472072,
1422
+ "z_equiv":0.1707158399,
1423
+ "effect_size_r":0.0155196218,
1424
+ "p_holm_global":1.0,
1425
+ "p_holm_within_metric":1.0
1426
+ }
1427
+ ]
UCI_N4/wilcoxon_prep_all.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N6/jmlr_tables.tex ADDED
@@ -0,0 +1,469 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ % JMLR-ready tables for two-column papers
2
+ % Required packages (no siunitx):
3
+ % \usepackage{booktabs}
4
+ % \usepackage{threeparttable}
5
+ % \usepackage{threeparttablex} % for TableNotes + longtable
6
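+ % \usepackage{longtable}
+ % \usepackage{xcolor}   % \textcolor in the pairwise win/loss tables
+ % \usepackage{amssymb}  % \blacktriangle and \blacktriangledown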
7
+ % Optional for landscape: \usepackage{pdflscape}
8
+
9
+ \begin{table*}[t]
10
+ \centering
11
+ \begin{threeparttable}
12
+ \caption{Model dimension ranges (min--max across all datasets and folds). Input and output dimensions follow each dataset's feature and label spaces, respectively.}
13
+ \label{tab:model-ranges}
14
+ \begin{tabular}{l r r r r r r}
15
+ \toprule
16
+ Algorithm & Width & Depth & Parameters & Padding & Input dim & Output dim \\
17
+ \midrule
18
+ AOL & 32--512 & 6--6 & 502--1245037 & 10--524 & 3--262 & 2--100 \\
19
+ Orthogonal & 32--512 & 6--6 & 507--1245042 & 10--524 & 3--262 & 2--100 \\
20
+ Sandwich & 32--512 & 6--6 & 1057--2620542 & 10--524 & 3--262 & 2--100 \\
21
+ SLL & 32--512 & 6--6 & 2326--1622697 & 10--524 & 3--262 & 2--100 \\
22
+ LDLT-L & 32--512 & 6--6 & 5480--1454611 & 10--524 & 3--262 & 2--100 \\
23
+ LDLT-R & 32--512 & 6--6 & 5577--1588756 & 10--524 & 3--262 & 2--100 \\
24
+ \bottomrule
25
+ \end{tabular}
26
+ \end{threeparttable}
27
+ \end{table*}
28
+
29
+ \begin{table*}[t]
30
+ \centering
31
+ \begin{threeparttable}
32
+ \caption{Sorted mean$\pm$std across $N$ datasets for each algorithm. Bold marks the highest mean in each column.}
33
+ \label{tab:metric_summary}
34
+ \begin{tabular}{l r lllll}
35
+ \toprule
36
+ & & & \multicolumn{4}{c}{Certified Accuracy} \\
37
+ \cmidrule(lr){4-7}
38
+ Algorithm & $N$ & Accuracy & 36/255 & 72/255 & 108/255 & 255/255 \\
39
+ \midrule
40
+ AOL & 121 & 0.6049\,\tiny$\pm$0.2396 & 0.2876\,\tiny$\pm$0.3111 & 0.2157\,\tiny$\pm$0.2940 & 0.1739\,\tiny$\pm$0.2716 & 0.0837\,\tiny$\pm$0.1775 \\
41
+ Orthogonal & 121 & 0.7036\,\tiny$\pm$0.1911 & 0.6021\,\tiny$\pm$0.2403 & 0.5088\,\tiny$\pm$0.2638 & 0.4229\,\tiny$\pm$0.2741 & 0.1972\,\tiny$\pm$0.2336 \\
42
+ Sandwich & 121 & 0.7163\,\tiny$\pm$0.1879 & \textbf{0.6239\,\tiny$\pm$0.2409} & \textbf{0.5483\,\tiny$\pm$0.2616} & \textbf{0.4738\,\tiny$\pm$0.2712} & \textbf{0.2464\,\tiny$\pm$0.2506} \\
43
+ SLL & 121 & 0.7011\,\tiny$\pm$0.1939 & 0.5816\,\tiny$\pm$0.2487 & 0.4813\,\tiny$\pm$0.2720 & 0.3961\,\tiny$\pm$0.2799 & 0.1888\,\tiny$\pm$0.2320 \\
44
+ \midrule
45
+ LDLT-L & 121 & \textbf{0.7245\,\tiny$\pm$0.1908} & 0.4646\,\tiny$\pm$0.3318 & 0.3865\,\tiny$\pm$0.3245 & 0.3247\,\tiny$\pm$0.3088 & 0.1584\,\tiny$\pm$0.2272 \\
46
+ LDLT-R & 121 & 0.6970\,\tiny$\pm$0.2021 & 0.6036\,\tiny$\pm$0.2378 & 0.5202\,\tiny$\pm$0.2572 & 0.4478\,\tiny$\pm$0.2640 & 0.2175\,\tiny$\pm$0.2278 \\
47
+ \bottomrule
48
+ \end{tabular}
49
+ \end{threeparttable}
50
+ \end{table*}
51
+
52
+ \begin{table}[t]
53
+ \centering
54
+ \begin{threeparttable}
55
+ {\small
56
+ \caption{Overall comparison on Mean Accuracy: average rank (lower is better) with Iman--Davenport $F=34.41$ ($\mathrm{df}=(5,600)$), $p<1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
57
+ \label{tab:overall:mean_test_acc}
58
+ \setlength{\tabcolsep}{4pt}
59
+ \begin{tabular}{@{}l r r r r r r@{}}
60
+ \toprule
61
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
62
+ \midrule
63
+ LDLT-L & 2.525 & 4 & 0 & 4 & 0.800 & 0.533 \\
64
+ Sandwich & 2.773 & 4 & 0 & 4 & 0.800 & 0.421 \\
65
+ Orthogonal & 3.479 & 1 & 2 & -1 & 0.200 & 0.654 \\
66
+ SLL & 3.545 & 1 & 2 & -1 & 0.200 & 0.621 \\
67
+ LDLT-R & 3.628 & 1 & 2 & -1 & 0.200 & 0.560 \\
68
+ AOL & 5.050 & 0 & 5 & -5 & 0.000 & 0.000 \\
69
+ \bottomrule
70
+ \end{tabular}
71
+ }
72
+ \end{threeparttable}
73
+ \end{table}
74
+
75
+ \begin{table}[t]
76
+ \centering
77
+ \begin{threeparttable}
78
+ {\small
79
+ \caption{Overall comparison on Mean Certified Accuracy (36/255): average rank (lower is better) with Iman--Davenport $F=87.35$ ($\mathrm{df}=(5,600)$), $p<1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
80
+ \label{tab:overall:mean_cert_acc_36}
81
+ \setlength{\tabcolsep}{4pt}
82
+ \begin{tabular}{@{}l r r r r r r@{}}
83
+ \toprule
84
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
85
+ \midrule
86
+ Sandwich & 2.211 & 5 & 0 & 5 & 1.000 & 0.539 \\
87
+ LDLT-R & 2.603 & 3 & 1 & 2 & 0.600 & 0.599 \\
88
+ Orthogonal & 3.202 & 2 & 1 & 1 & 0.400 & 0.693 \\
89
+ SLL & 3.289 & 2 & 2 & 0 & 0.400 & 0.704 \\
90
+ LDLT-L & 4.091 & 1 & 4 & -3 & 0.200 & 0.648 \\
91
+ AOL & 5.603 & 0 & 5 & -5 & 0.000 & 0.000 \\
92
+ \bottomrule
93
+ \end{tabular}
94
+ }
95
+ \end{threeparttable}
96
+ \end{table}
97
+
98
+ \begin{table}[t]
99
+ \centering
100
+ \begin{threeparttable}
101
+ {\small
102
+ \caption{Overall comparison on Mean Certified Accuracy (72/255): average rank (lower is better) with Iman--Davenport $F=125.56$ ($\mathrm{df}=(5,600)$), $p<1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
103
+ \label{tab:overall:mean_cert_acc_72}
104
+ \setlength{\tabcolsep}{4pt}
105
+ \begin{tabular}{@{}l r r r r r r@{}}
106
+ \toprule
107
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
108
+ \midrule
109
+ Sandwich & 1.988 & 5 & 0 & 5 & 1.000 & 0.605 \\
110
+ LDLT-R & 2.504 & 4 & 1 & 3 & 0.800 & 0.538 \\
111
+ Orthogonal & 3.202 & 3 & 2 & 1 & 0.600 & 0.547 \\
112
+ SLL & 3.355 & 2 & 3 & -1 & 0.400 & 0.724 \\
113
+ LDLT-L & 4.198 & 1 & 4 & -3 & 0.200 & 0.769 \\
114
+ AOL & 5.752 & 0 & 5 & -5 & 0.000 & 0.000 \\
115
+ \bottomrule
116
+ \end{tabular}
117
+ }
118
+ \end{threeparttable}
119
+ \end{table}
120
+
121
+ \begin{table}[t]
122
+ \centering
123
+ \begin{threeparttable}
124
+ {\small
125
+ \caption{Overall comparison on Mean Certified Accuracy (108/255): average rank (lower is better) with Iman--Davenport $F=134.70$ ($\mathrm{df}=(5,600)$), $p<1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
126
+ \label{tab:overall:mean_cert_acc_108}
127
+ \setlength{\tabcolsep}{4pt}
128
+ \begin{tabular}{@{}l r r r r r r@{}}
129
+ \toprule
130
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
131
+ \midrule
132
+ Sandwich & 1.988 & 4 & 0 & 4 & 0.800 & 0.721 \\
133
+ LDLT-R & 2.364 & 4 & 0 & 4 & 0.800 & 0.594 \\
134
+ Orthogonal & 3.260 & 2 & 2 & 0 & 0.400 & 0.717 \\
135
+ SLL & 3.388 & 2 & 2 & 0 & 0.400 & 0.696 \\
136
+ LDLT-L & 4.256 & 1 & 4 & -3 & 0.200 & 0.826 \\
137
+ AOL & 5.744 & 0 & 5 & -5 & 0.000 & 0.000 \\
138
+ \bottomrule
139
+ \end{tabular}
140
+ }
141
+ \end{threeparttable}
142
+ \end{table}
143
+
144
+ \begin{table}[t]
145
+ \centering
146
+ \begin{threeparttable}
147
+ {\small
148
+ \caption{Overall comparison on Mean Certified Accuracy (255/255): average rank (lower is better) with Iman--Davenport $F=105.28$ ($\mathrm{df}=(5,600)$), $p<1.11\times 10^{-16}$; Nemenyi CD$=0.685$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
149
+ \label{tab:overall:mean_cert_acc_255}
150
+ \setlength{\tabcolsep}{4pt}
151
+ \begin{tabular}{@{}l r r r r r r@{}}
152
+ \toprule
153
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
154
+ \midrule
155
+ Sandwich & 2.000 & 5 & 0 & 5 & 1.000 & 0.643 \\
156
+ LDLT-R & 2.467 & 4 & 1 & 3 & 0.800 & 0.620 \\
157
+ SLL & 3.293 & 2 & 2 & 0 & 0.400 & 0.664 \\
158
+ Orthogonal & 3.442 & 2 & 2 & 0 & 0.400 & 0.652 \\
159
+ LDLT-L & 4.227 & 1 & 4 & -3 & 0.200 & 0.846 \\
160
+ AOL & 5.570 & 0 & 5 & -5 & 0.000 & 0.000 \\
161
+ \bottomrule
162
+ \end{tabular}
163
+ }
164
+ \end{threeparttable}
165
+ \end{table}
166
+
167
+ \begin{table}[t]
168
+ \centering
169
+ \begin{threeparttable}
170
+ {
171
+ \caption{Pairwise Wilcoxon outcomes for Mean Accuracy (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
172
+ \label{tab:signif:mean_test_acc}
173
+ \setlength{\tabcolsep}{3pt}
174
+ \begin{tabular}{@{}l c c c c c c @{}}
175
+ \toprule
176
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
177
+ \midrule
178
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
179
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
180
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
181
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
182
+ Sandwich & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
183
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
184
+ \bottomrule
185
+ \end{tabular}
186
+ }
187
+ \end{threeparttable}
188
+ \end{table}
189
+
190
+ \begin{table}[t]
191
+ \centering
192
+ \begin{threeparttable}
193
+ {
194
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (36/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
195
+ \label{tab:signif:mean_cert_acc_36}
196
+ \setlength{\tabcolsep}{3pt}
197
+ \begin{tabular}{@{}l c c c c c c @{}}
198
+ \toprule
199
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
200
+ \midrule
201
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
202
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
203
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
204
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
205
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
206
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
207
+ \bottomrule
208
+ \end{tabular}
209
+ }
210
+ \end{threeparttable}
211
+ \end{table}
212
+
213
+ \begin{table}[t]
214
+ \centering
215
+ \begin{threeparttable}
216
+ {
217
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (72/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
218
+ \label{tab:signif:mean_cert_acc_72}
219
+ \setlength{\tabcolsep}{3pt}
220
+ \begin{tabular}{@{}l c c c c c c @{}}
221
+ \toprule
222
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
223
+ \midrule
224
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
225
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
226
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
227
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
228
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
229
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
230
+ \bottomrule
231
+ \end{tabular}
232
+ }
233
+ \end{threeparttable}
234
+ \end{table}
235
+
236
+ \begin{table}[t]
237
+ \centering
238
+ \begin{threeparttable}
239
+ {
240
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (108/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
241
+ \label{tab:signif:mean_cert_acc_108}
242
+ \setlength{\tabcolsep}{3pt}
243
+ \begin{tabular}{@{}l c c c c c c @{}}
244
+ \toprule
245
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
246
+ \midrule
247
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
248
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
249
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
250
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
251
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
252
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
253
+ \bottomrule
254
+ \end{tabular}
255
+ }
256
+ \end{threeparttable}
257
+ \end{table}
258
+
259
+ \begin{table}[t]
260
+ \centering
261
+ \begin{threeparttable}
262
+ {
263
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (255/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
264
+ \label{tab:signif:mean_cert_acc_255}
265
+ \setlength{\tabcolsep}{3pt}
266
+ \begin{tabular}{@{}l c c c c c c @{}}
267
+ \toprule
268
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
269
+ \midrule
270
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
271
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
272
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
273
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
274
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
275
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
276
+ \bottomrule
277
+ \end{tabular}
278
+ }
279
+ \end{threeparttable}
280
+ \end{table}
281
+
282
+
283
+ \begin{table*}[t]
284
+ \centering
285
+ \begin{threeparttable}
286
+ \caption[Mean Accuracy]{Wilcoxon signed-rank tests (two-sided) for Mean Accuracy; $p$-values with Holm FWER corrections within-metric and global.}
287
+ \label{tab:wilcoxon:mean_test_acc}
288
+ \begingroup
289
+ \setlength{\tabcolsep}{4pt}
290
+ \begin{tabular}{ll r r r r r r r r r r r}
291
+ \toprule
292
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
293
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
294
+ \midrule
295
+ AOL & LDLT-L & 121 & 16 & 105 & 0 & 0.1322 & -0.0632 & 409 & $2.1e-17^{***}$ & $3.2e-16^{***}$ & $0^{***}$ & 0.7715 \\
296
+ AOL & Sandwich & 121 & 23 & 98 & 0 & 0.1901 & -0.0656 & 698 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7036 \\
297
+ AOL & Orthogonal & 121 & 25 & 96 & 0 & 0.2066 & -0.0525 & 908 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6542 \\
298
+ AOL & SLL & 121 & 24 & 97 & 0 & 0.1983 & -0.0445 & 1047 & $0^{***}$ & $1.0e-10^{***}$ & $3.0e-10^{***}$ & 0.6215 \\
299
+ AOL & LDLT-R & 121 & 27 & 94 & 0 & 0.2231 & -0.0357 & 1307 & $7.0e-10^{***}$ & $7.8e-09^{***}$ & $2.3e-08^{***}$ & 0.5604 \\
300
+ LDLT-L & SLL & 121 & 86 & 35 & 0 & 0.7107 & 0.0103 & 1511 & $1.7e-08^{***}$ & $1.7e-07^{***}$ & $5.0e-07^{***}$ & 0.5124 \\
301
+ LDLT-L & LDLT-R & 121 & 87 & 34 & 0 & 0.7190 & 0.0125 & 1779 & $7.7e-07^{***}$ & $6.9e-06^{***}$ & $2.0e-05^{***}$ & 0.4494 \\
302
+ LDLT-L & Orthogonal & 121 & 78 & 43 & 0 & 0.6446 & 0.0104 & 2002 & $1.3e-05^{***}$ & $1.0e-04^{***}$ & $2.5e-04^{***}$ & 0.3969 \\
303
+ Orthogonal & Sandwich & 121 & 39 & 81 & 1 & 0.3264 & -0.0079 & 2171 & $1.3e-04^{***}$ & $9.4e-04^{***}$ & $2.5e-03^{**}$ & 0.3487 \\
304
+ Sandwich & SLL & 121 & 80 & 41 & 0 & 0.6612 & 0.0063 & 2279 & $2.6e-04^{***}$ & $1.6e-03^{**}$ & $4.6e-03^{**}$ & 0.3318 \\
305
+ LDLT-R & Sandwich & 121 & 47 & 74 & 0 & 0.3884 & -0.0101 & 2411 & $9.4e-04^{***}$ & $4.7e-03^{**}$ & $1.4e-02^{*}$ & 0.3008 \\
306
+ LDLT-L & Sandwich & 121 & 64 & 56 & 1 & 0.5331 & 0.0008 & 3145 & $2.0e-01$ & $8.2e-01$ & $1.0e+00$ & 0.1158 \\
307
+ LDLT-R & Orthogonal & 121 & 54 & 67 & 0 & 0.4463 & -0.0024 & 3206 & $2.1e-01$ & $8.2e-01$ & $1.0e+00$ & 0.1138 \\
308
+ Orthogonal & SLL & 121 & 60 & 61 & 0 & 0.4959 & -0.0000 & 3382 & $4.3e-01$ & $8.5e-01$ & $1.0e+00$ & 0.0724 \\
309
+ LDLT-R & SLL & 121 & 58 & 63 & 0 & 0.4793 & -0.0010 & 3627 & $8.7e-01$ & $8.7e-01$ & $1.0e+00$ & 0.0148 \\
310
+ \bottomrule
311
+ \end{tabular}
312
+ \begin{tablenotes}
313
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$). A $p$-value printed as $0$ is nonzero but rounds to zero at the precision of the stored results.
314
+ \end{tablenotes}
315
+ \endgroup
316
+ \end{threeparttable}
317
+ \end{table*}
318
+
319
+
320
+
321
+ \begin{table*}[t]
322
+ \centering
323
+ \begin{threeparttable}
324
+ \caption[Mean Certified Accuracy (36/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (36/255); $p$-values with Holm FWER corrections within-metric and global.}
325
+ \label{tab:wilcoxon:mean_cert_acc_36}
326
+ \begingroup
327
+ \setlength{\tabcolsep}{4pt}
328
+ \begin{tabular}{ll r r r r r r r r r r r}
329
+ \toprule
330
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
331
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
332
+ \midrule
333
+ AOL & LDLT-R & 121 & 3 & 118 & 0 & 0.0248 & -0.2903 & 53 & $5.1e-21^{***}$ & $7.6e-20^{***}$ & $3.6e-19^{***}$ & 0.8552 \\
334
+ AOL & SLL & 121 & 4 & 117 & 0 & 0.0331 & -0.2718 & 115 & $2.3e-20^{***}$ & $3.2e-19^{***}$ & $1.5e-18^{***}$ & 0.8406 \\
335
+ AOL & Sandwich & 121 & 9 & 112 & 0 & 0.0744 & -0.3414 & 135 & $3.7e-20^{***}$ & $4.9e-19^{***}$ & $2.4e-18^{***}$ & 0.8359 \\
336
+ AOL & Orthogonal & 121 & 8 & 113 & 0 & 0.0661 & -0.2982 & 140 & $4.2e-20^{***}$ & $5.1e-19^{***}$ & $2.7e-18^{***}$ & 0.8348 \\
337
+ LDLT-L & Sandwich & 121 & 22 & 99 & 0 & 0.1818 & -0.0761 & 770 & $4.3e-14^{***}$ & $4.7e-13^{***}$ & $2.1e-12^{***}$ & 0.6866 \\
338
+ AOL & LDLT-L & 121 & 22 & 95 & 4 & 0.1983 & -0.1112 & 872 & $2.3e-12^{***}$ & $2.3e-11^{***}$ & $1.0e-10^{***}$ & 0.6485 \\
339
+ LDLT-L & LDLT-R & 121 & 34 & 87 & 0 & 0.2810 & -0.0613 & 1073 & $1.3e-11^{***}$ & $1.2e-10^{***}$ & $5.3e-10^{***}$ & 0.6154 \\
340
+ LDLT-L & SLL & 121 & 38 & 83 & 0 & 0.3140 & -0.0545 & 1275 & $4.2e-10^{***}$ & $3.4e-09^{***}$ & $1.4e-08^{***}$ & 0.5679 \\
341
+ LDLT-L & Orthogonal & 121 & 40 & 81 & 0 & 0.3306 & -0.0581 & 1346 & $1.3e-09^{***}$ & $9.4e-09^{***}$ & $4.3e-08^{***}$ & 0.5512 \\
342
+ Sandwich & SLL & 121 & 89 & 32 & 0 & 0.7355 & 0.0236 & 1459 & $7.9e-09^{***}$ & $4.7e-08^{***}$ & $2.4e-07^{***}$ & 0.5246 \\
343
+ Orthogonal & Sandwich & 121 & 33 & 87 & 1 & 0.2769 & -0.0164 & 1846 & $3.0e-06^{***}$ & $1.5e-05^{***}$ & $6.4e-05^{***}$ & 0.4264 \\
344
+ LDLT-R & SLL & 121 & 81 & 40 & 0 & 0.6694 & 0.0100 & 2305 & $3.4e-04^{***}$ & $1.4e-03^{**}$ & $5.4e-03^{**}$ & 0.3257 \\
345
+ LDLT-R & Sandwich & 121 & 50 & 71 & 0 & 0.4132 & -0.0094 & 2753 & $1.5e-02^{*}$ & $4.6e-02^{*}$ & $1.8e-01$ & 0.2203 \\
346
+ Orthogonal & SLL & 121 & 65 & 56 & 0 & 0.5372 & 0.0014 & 2942 & $5.3e-02$ & $1.1e-01$ & $3.9e-01$ & 0.1759 \\
347
+ LDLT-R & Orthogonal & 121 & 75 & 46 & 0 & 0.6198 & 0.0065 & 3172 & $1.8e-01$ & $1.8e-01$ & $1.0e+00$ & 0.1218 \\
348
+ \bottomrule
349
+ \end{tabular}
350
+ \begin{tablenotes}
351
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
352
+ \end{tablenotes}
353
+ \endgroup
354
+ \end{threeparttable}
355
+ \end{table*}
356
+
357
+
358
+
359
+ \begin{table*}[t]
360
+ \centering
361
+ \begin{threeparttable}
362
+ \caption[Mean Certified Accuracy (72/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (72/255); $p$-values with Holm FWER corrections within-metric and global.}
363
+ \label{tab:wilcoxon:mean_cert_acc_72}
364
+ \begingroup
365
+ \setlength{\tabcolsep}{4pt}
366
+ \begin{tabular}{ll r r r r r r r r r r r}
367
+ \toprule
368
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
369
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
370
+ \midrule
371
+ AOL & SLL & 121 & 0 & 121 & 0 & 0.0000 & -0.2418 & 0 & $1.4e-21^{***}$ & $2.1e-20^{***}$ & $1.0e-19^{***}$ & 0.8677 \\
372
+ AOL & LDLT-R & 121 & 1 & 120 & 0 & 0.0083 & -0.2825 & 25 & $2.5e-21^{***}$ & $3.6e-20^{***}$ & $1.9e-19^{***}$ & 0.8618 \\
373
+ AOL & Orthogonal & 121 & 4 & 117 & 0 & 0.0331 & -0.2682 & 45 & $4.2e-21^{***}$ & $5.4e-20^{***}$ & $3.0e-19^{***}$ & 0.8571 \\
374
+ AOL & Sandwich & 121 & 6 & 115 & 0 & 0.0496 & -0.3329 & 80 & $9.9e-21^{***}$ & $1.2e-19^{***}$ & $6.8e-19^{***}$ & 0.8489 \\
375
+ AOL & LDLT-L & 121 & 10 & 93 & 18 & 0.1570 & -0.0849 & 304 & $5.8e-15^{***}$ & $5.8e-14^{***}$ & $3.0e-13^{***}$ & 0.7694 \\
376
+ LDLT-L & Sandwich & 121 & 16 & 105 & 0 & 0.1322 & -0.0864 & 509 & $1.9e-16^{***}$ & $2.1e-15^{***}$ & $1.1e-14^{***}$ & 0.7480 \\
377
+ LDLT-L & LDLT-R & 121 & 30 & 91 & 0 & 0.2479 & -0.0765 & 873 & $3.2e-13^{***}$ & $2.9e-12^{***}$ & $1.5e-11^{***}$ & 0.6624 \\
378
+ Orthogonal & Sandwich & 121 & 22 & 98 & 1 & 0.1860 & -0.0318 & 1154 & $9.0e-11^{***}$ & $6.3e-10^{***}$ & $3.5e-09^{***}$ & 0.5918 \\
379
+ Sandwich & SLL & 121 & 95 & 26 & 0 & 0.7851 & 0.0391 & 1169 & $7.0e-11^{***}$ & $5.6e-10^{***}$ & $2.8e-09^{***}$ & 0.5928 \\
380
+ LDLT-L & SLL & 121 & 34 & 87 & 0 & 0.2810 & -0.0437 & 1219 & $1.6e-10^{***}$ & $9.9e-10^{***}$ & $6.2e-09^{***}$ & 0.5810 \\
381
+ LDLT-L & Orthogonal & 121 & 36 & 85 & 0 & 0.2975 & -0.0452 & 1256 & $3.1e-10^{***}$ & $1.5e-09^{***}$ & $1.1e-08^{***}$ & 0.5723 \\
382
+ LDLT-R & SLL & 121 & 89 & 32 & 0 & 0.7355 & 0.0202 & 1852 & $2.0e-06^{***}$ & $8.0e-06^{***}$ & $5.0e-05^{***}$ & 0.4322 \\
383
+ LDLT-R & Sandwich & 121 & 49 & 72 & 0 & 0.4050 & -0.0133 & 2656 & $7.5e-03^{**}$ & $2.2e-02^{*}$ & $9.7e-02$ & 0.2431 \\
384
+ Orthogonal & SLL & 121 & 67 & 54 & 0 & 0.5537 & 0.0046 & 2784 & $1.9e-02^{*}$ & $3.8e-02^{*}$ & $2.1e-01$ & 0.2130 \\
385
+ LDLT-R & Orthogonal & 121 & 74 & 47 & 0 & 0.6116 & 0.0089 & 2855 & $3.1e-02^{*}$ & $3.8e-02^{*}$ & $3.1e-01$ & 0.1963 \\
386
+ \bottomrule
387
+ \end{tabular}
388
+ \begin{tablenotes}
389
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
390
+ \end{tablenotes}
391
+ \endgroup
392
+ \end{threeparttable}
393
+ \end{table*}
394
+
395
+
396
+
397
+ \begin{table*}[t]
398
+ \centering
399
+ \begin{threeparttable}
400
+ \caption[Mean Certified Accuracy (108/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (108/255); $p$-values with Holm FWER corrections within-metric and global.}
401
+ \label{tab:wilcoxon:mean_cert_acc_108}
402
+ \begingroup
403
+ \setlength{\tabcolsep}{4pt}
404
+ \begin{tabular}{ll r r r r r r r r r r r}
405
+ \toprule
406
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
407
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
408
+ \midrule
409
+ AOL & SLL & 121 & 1 & 116 & 4 & 0.0248 & -0.1721 & 34 & $1.5e-20^{***}$ & $1.8e-19^{***}$ & $1.0e-18^{***}$ & 0.8592 \\
410
+ AOL & LDLT-R & 121 & 1 & 120 & 0 & 0.0083 & -0.2318 & 45 & $4.2e-21^{***}$ & $6.3e-20^{***}$ & $3.0e-19^{***}$ & 0.8571 \\
411
+ AOL & Orthogonal & 121 & 3 & 117 & 1 & 0.0289 & -0.2099 & 60 & $8.9e-21^{***}$ & $1.2e-19^{***}$ & $6.2e-19^{***}$ & 0.8534 \\
412
+ AOL & Sandwich & 121 & 5 & 116 & 0 & 0.0413 & -0.2735 & 82 & $1.0e-20^{***}$ & $1.3e-19^{***}$ & $7.0e-19^{***}$ & 0.8484 \\
413
+ AOL & LDLT-L & 121 & 6 & 90 & 25 & 0.1529 & -0.0672 & 113 & $5.8e-16^{***}$ & $5.8e-15^{***}$ & $3.3e-14^{***}$ & 0.8259 \\
414
+ LDLT-L & Sandwich & 121 & 14 & 107 & 0 & 0.1157 & -0.0819 & 450 & $5.3e-17^{***}$ & $5.8e-16^{***}$ & $3.1e-15^{***}$ & 0.7619 \\
415
+ LDLT-L & LDLT-R & 121 & 25 & 96 & 0 & 0.2066 & -0.0715 & 733 & $2.0e-14^{***}$ & $1.8e-13^{***}$ & $1.0e-12^{***}$ & 0.6953 \\
416
+ Orthogonal & Sandwich & 121 & 18 & 102 & 1 & 0.1529 & -0.0376 & 945 & $2.1e-12^{***}$ & $1.6e-11^{***}$ & $9.3e-11^{***}$ & 0.6418 \\
417
+ Sandwich & SLL & 121 & 93 & 28 & 0 & 0.7686 & 0.0435 & 995 & $3.1e-12^{***}$ & $2.2e-11^{***}$ & $1.4e-10^{***}$ & 0.6337 \\
418
+ LDLT-L & Orthogonal & 121 & 32 & 88 & 1 & 0.2686 & -0.0352 & 1203 & $2.1e-10^{***}$ & $1.3e-09^{***}$ & $7.7e-09^{***}$ & 0.5801 \\
419
+ LDLT-L & SLL & 121 & 35 & 82 & 4 & 0.3058 & -0.0294 & 1335 & $8.7e-09^{***}$ & $4.3e-08^{***}$ & $2.6e-07^{***}$ & 0.5321 \\
420
+ LDLT-R & SLL & 121 & 89 & 32 & 0 & 0.7355 & 0.0233 & 1603 & $6.7e-08^{***}$ & $2.7e-07^{***}$ & $1.9e-06^{***}$ & 0.4907 \\
421
+ LDLT-R & Orthogonal & 121 & 81 & 40 & 0 & 0.6694 & 0.0182 & 2277 & $2.6e-04^{***}$ & $7.7e-04^{***}$ & $4.6e-03^{**}$ & 0.3323 \\
422
+ LDLT-R & Sandwich & 121 & 54 & 67 & 0 & 0.4463 & -0.0097 & 2867 & $3.3e-02^{*}$ & $6.7e-02$ & $3.1e-01$ & 0.1935 \\
423
+ Orthogonal & SLL & 121 & 67 & 54 & 0 & 0.5537 & 0.0061 & 2930 & $4.9e-02^{*}$ & $6.7e-02$ & $3.9e-01$ & 0.1787 \\
424
+ \bottomrule
425
+ \end{tabular}
426
+ \begin{tablenotes}
427
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
428
+ \end{tablenotes}
429
+ \endgroup
430
+ \end{threeparttable}
431
+ \end{table*}
432
+
433
+
434
+
435
+ \begin{table*}[t]
436
+ \centering
437
+ \begin{threeparttable}
438
+ \caption[Mean Certified Accuracy (255/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (255/255); $p$-values with Holm FWER corrections within-metric and global.}
439
+ \label{tab:wilcoxon:mean_cert_acc_255}
440
+ \begingroup
441
+ \setlength{\tabcolsep}{4pt}
442
+ \begin{tabular}{ll r r r r r r r r r r r}
443
+ \toprule
444
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
445
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
446
+ \midrule
447
+ AOL & LDLT-R & 121 & 0 & 110 & 11 & 0.0455 & -0.0717 & 0 & $8.9e-20^{***}$ & $1.3e-18^{***}$ & $5.6e-18^{***}$ & 0.8678 \\
448
+ AOL & SLL & 121 & 2 & 101 & 18 & 0.0909 & -0.0429 & 22 & $2.4e-18^{***}$ & $3.1e-17^{***}$ & $1.5e-16^{***}$ & 0.8608 \\
449
+ AOL & LDLT-L & 121 & 3 & 84 & 34 & 0.1653 & -0.0172 & 48 & $2.9e-15^{***}$ & $2.6e-14^{***}$ & $1.5e-13^{***}$ & 0.8465 \\
450
+ AOL & Orthogonal & 121 & 2 & 103 & 16 & 0.0826 & -0.0488 & 71 & $4.5e-18^{***}$ & $5.3e-17^{***}$ & $2.7e-16^{***}$ & 0.8458 \\
451
+ AOL & Sandwich & 121 & 2 & 112 & 7 & 0.0455 & -0.0886 & 74 & $1.4e-19^{***}$ & $1.9e-18^{***}$ & $8.4e-18^{***}$ & 0.8482 \\
452
+ LDLT-L & Sandwich & 121 & 10 & 104 & 7 & 0.1116 & -0.0351 & 415 & $5.9e-16^{***}$ & $6.5e-15^{***}$ & $3.3e-14^{***}$ & 0.7579 \\
453
+ Orthogonal & Sandwich & 121 & 17 & 97 & 7 & 0.1694 & -0.0273 & 465 & $1.9e-15^{***}$ & $1.9e-14^{***}$ & $1.0e-13^{***}$ & 0.7446 \\
454
+ LDLT-L & LDLT-R & 121 & 20 & 90 & 11 & 0.2107 & -0.0296 & 685 & $1.7e-12^{***}$ & $1.3e-11^{***}$ & $7.7e-11^{***}$ & 0.6731 \\
455
+ Sandwich & SLL & 121 & 84 & 30 & 7 & 0.7231 & 0.0164 & 1043 & $2.7e-10^{***}$ & $1.9e-09^{***}$ & $9.6e-09^{***}$ & 0.5916 \\
456
+ LDLT-L & SLL & 121 & 27 & 76 & 18 & 0.2975 & -0.0086 & 1234 & $2.0e-06^{***}$ & $1.0e-05^{***}$ & $5.0e-05^{***}$ & 0.4679 \\
457
+ LDLT-L & Orthogonal & 121 & 30 & 74 & 17 & 0.3182 & -0.0039 & 1287 & $2.9e-06^{***}$ & $1.0e-05^{***}$ & $6.4e-05^{***}$ & 0.4587 \\
458
+ LDLT-R & SLL & 121 & 80 & 31 & 10 & 0.7025 & 0.0147 & 1338 & $1.9e-07^{***}$ & $1.2e-06^{***}$ & $5.2e-06^{***}$ & 0.4942 \\
459
+ LDLT-R & Orthogonal & 121 & 79 & 33 & 9 & 0.6901 & 0.0149 & 1541 & $2.5e-06^{***}$ & $1.0e-05^{***}$ & $5.7e-05^{***}$ & 0.4451 \\
460
+ LDLT-R & Sandwich & 121 & 45 & 70 & 6 & 0.3967 & -0.0068 & 2292 & $3.6e-03^{**}$ & $7.2e-03^{**}$ & $5.1e-02$ & 0.2713 \\
461
+ Orthogonal & SLL & 121 & 51 & 56 & 14 & 0.4793 & 0.0000 & 2810 & $8.1e-01$ & $8.1e-01$ & $1.0e+00$ & 0.0236 \\
462
+ \bottomrule
463
+ \end{tabular}
464
+ \begin{tablenotes}
465
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
466
+ \end{tablenotes}
467
+ \endgroup
468
+ \end{threeparttable}
469
+ \end{table*}
UCI_N6/wilcoxon_pairwise_all.csv ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ metric,alg_a,alg_b,n_common,n_nonzero,wins_a,wins_b,ties,win_rate_a_over_b,mean_diff_a_minus_b,median_diff_a_minus_b,W_stat,p_two_sided,z_equiv,effect_size_r,p_holm_global,p_holm_within_metric
2
+ mean_cert_acc_108,aol,ldlt-resnet,121,121,1,120,0,0.008264462809917356,-0.27392309146611565,-0.2317528344,45.0,4.173048144910383e-21,-9.42817024960416,0.8571063863276508,3.04632514578458e-19,6.259572217365575e-20
3
+ mean_cert_acc_108,aol,ortho,121,120,3,117,1,0.028925619834710745,-0.24899719816859503,-0.2098822109,60.0,8.927572293355817e-21,-9.348053251081865,0.853356605729507,6.249300605349072e-19,1.2498601210698143e-19
4
+ mean_cert_acc_108,aol,sandwich,121,121,5,116,0,0.04132231404958678,-0.2999183728280992,-0.2735294178,82.0,1.0343588534993559e-20,-9.332465915108862,0.8484059922826238,7.0336402037956195e-19,1.3446665095491626e-19
5
+ mean_cert_acc_108,aol,sdp,121,117,1,116,4,0.024793388429752067,-0.22223160453553722,-0.17206639070000002,34.0,1.4919341499692146e-20,-9.293573414471693,0.8591911661068367,9.995958804793737e-19,1.7903209799630575e-19
6
+ mean_cert_acc_108,ldlt,sandwich,121,121,14,107,0,0.11570247933884298,-0.14914118170661156,-0.08187162130000003,450.0,5.266046064559084e-17,-8.380595777425917,0.7618723434023561,3.054306717444269e-15,5.792650671014993e-16
7
+ mean_cert_acc_108,aol,ldlt,121,96,6,90,25,0.15289256198347106,-0.1507771911214876,-0.0671557561,113.0,5.846618540929849e-16,-8.092471290134199,0.8259343924562947,3.274106382920715e-14,5.846618540929849e-15
8
+ mean_cert_acc_108,ldlt,ldlt-resnet,121,121,25,96,0,0.2066115702479339,-0.12314590034462813,-0.07149813070000001,733.0,2.0319979828081665e-14,-7.648586948718654,0.6953260862471503,1.0159989914040832e-12,1.82879818452735e-13
9
+ mean_cert_acc_108,ortho,sandwich,121,120,18,102,1,0.15289256198347106,-0.05092117465950414,-0.03757250309999999,945.0,2.0601004521550643e-12,-7.030354097921072,0.6417805877800424,9.270452034697789e-11,1.6480803617240515e-11
10
+ mean_cert_acc_108,sandwich,sdp,121,121,93,28,0,0.768595041322314,0.07768676829256199,0.043483858000000014,995.0,3.149269421374916e-12,6.970896796346558,0.6337178905769598,1.354185851191214e-10,2.2044885949624412e-11
11
+ mean_cert_acc_108,ldlt,ortho,121,120,32,88,1,0.26859504132231404,-0.09822000704710745,-0.035191671,1203.0,2.088529737024506e-10,-6.35468587021996,0.5801007994964698,7.727560026990672e-09,1.2531178422147035e-09
12
+ mean_cert_acc_108,ldlt,sdp,121,117,35,82,4,0.30578512396694213,-0.0714544134140496,-0.0293723642,1335.0,8.658682431527648e-09,-5.755107212473546,0.5320598500093845,2.5976047294582945e-07,4.329341215763824e-08
13
+ mean_cert_acc_108,ldlt-resnet,sdp,121,121,89,32,0,0.7355371900826446,0.051691486930578505,0.02334547050000002,1603.0,6.729713480359853e-08,5.3982417862616945,0.4907492532965177,1.884319774500759e-06,2.6918853921439414e-07
14
+ mean_cert_acc_108,ldlt-resnet,ortho,121,121,81,40,0,0.6694214876033058,0.024925893297520662,0.018210522800000017,2277.0,0.000257311388966313,3.6548709362663034,0.33226099420602756,0.004631605001393634,0.0007719341668989391
15
+ mean_cert_acc_108,ldlt-resnet,sandwich,121,121,54,67,0,0.4462809917355372,-0.025995281361983476,-0.009650468899999987,2867.0,0.03327289749858807,-2.128774791611584,0.19352498105559854,0.3078706868259233,0.06654579499717614
16
+ mean_cert_acc_108,ortho,sdp,121,121,67,54,0,0.5537190082644629,0.02676559363305785,0.006111383400000059,2930.0,0.04931954967599767,1.96581876260608,0.17871079660055272,0.3945563974079814,0.06654579499717614
17
+ mean_cert_acc_255,aol,ldlt-resnet,121,110,0,110,11,0.045454545454545456,-0.1337634204305785,-0.07166579370000001,0.0,8.869456124226732e-20,-9.101986380438365,0.867840350157088,5.587757358262842e-18,1.3304184186340097e-18
18
+ mean_cert_acc_255,aol,sandwich,121,114,2,112,7,0.045454545454545456,-0.1626829197404959,-0.0885858461,74.0,1.3513967462376266e-19,-9.056147189870263,0.8481858965627918,8.378659826673286e-18,1.891955444732677e-18
19
+ mean_cert_acc_255,aol,sdp,121,103,2,101,18,0.09090909090909091,-0.10510361606942148,-0.0429337709,22.0,2.4070122764633777e-18,-8.736379113198142,0.8608210125377133,1.4682774886426603e-16,3.129115959402391e-17
20
+ mean_cert_acc_255,aol,ortho,121,105,2,103,16,0.08264462809917356,-0.11352401609338844,-0.0488128485,71.0,4.4540479170963364e-18,-8.666551629965934,0.8457688367895985,2.672428750257802e-16,5.344857500515604e-17
21
+ mean_cert_acc_255,ldlt,sandwich,121,114,10,104,7,0.1115702479338843,-0.08797530880743801,-0.035087719600000004,415.0,5.869031304740028e-16,-8.09200538788907,0.7578857433539525,3.274106382920715e-14,6.455934435214031e-15
22
+ mean_cert_acc_255,ortho,sandwich,121,114,17,97,7,0.16942148760330578,-0.04915890364710745,-0.0273425561,465.0,1.8555697623108275e-15,-7.950635622202678,0.7446452516811022,1.0020076716478469e-13,1.8555697623108276e-14
23
+ mean_cert_acc_255,aol,ldlt,121,87,3,84,34,0.1652892561983471,-0.07470761093305785,-0.0172084123,48.0,2.8910100531902833e-15,-7.895522718405998,0.8464888875499651,1.53223532819085e-13,2.601909047871255e-14
24
+ mean_cert_acc_255,ldlt,ldlt-resnet,121,110,20,90,11,0.21074380165289255,-0.059055809497520664,-0.029557436699999995,685.0,1.6757315874402246e-12,-7.059109358616517,0.6730596686834297,7.708365302225033e-11,1.3405852699521797e-11
25
+ mean_cert_acc_255,sandwich,sdp,121,114,84,30,7,0.7231404958677686,0.05757930367107439,0.01639589660000007,1043.0,2.677245913589704e-10,6.316401130867988,0.5915851679429525,9.638085288922934e-09,1.8740721395127926e-09
26
+ mean_cert_acc_255,ldlt-resnet,sdp,121,111,80,31,10,0.7024793388429752,0.02865980436115703,0.014675030499999998,1338.0,1.925925419153017e-07,5.206348742635875,0.49416475377488106,5.199998631713146e-06,1.1555552514918102e-06
27
+ mean_cert_acc_255,ldlt,sdp,121,103,27,76,18,0.2975206611570248,-0.030396005136363636,-0.0085921446,1234.0,2.04427321423648e-06,-4.74899764635719,0.46793264228890574,4.9813985833316794e-05,1.02213660711824e-05
28
+ mean_cert_acc_255,ldlt-resnet,ortho,121,112,79,33,9,0.6900826446280992,0.020239404337190077,0.0148802027,1541.0,2.473225995331523e-06,4.710324575483669,0.4450838364687742,5.688419789262503e-05,1.02213660711824e-05
29
+ mean_cert_acc_255,ldlt,ortho,121,104,30,74,17,0.3181818181818182,-0.038816405160330573,-0.0039353251,1287.0,2.9004026494882005e-06,-4.677749709194439,0.45869109705548883,6.380885828874041e-05,1.02213660711824e-05
30
+ mean_cert_acc_255,ldlt-resnet,sandwich,121,115,45,70,6,0.39669421487603307,-0.028919499309917357,-0.006780041400000006,2292.0,0.0036216710008269344,-2.909362118386465,0.27129941643076033,0.05070339401157708,0.007243342001653869
31
+ mean_cert_acc_255,ortho,sdp,121,107,51,56,14,0.4793388429752066,0.008420400023966945,0.0,2810.0,0.8072471562749569,0.2439789068176065,0.0235863311778052,1.0,0.8072471562749569
32
+ mean_cert_acc_36,aol,ldlt-resnet,121,121,3,118,0,0.024793388429752067,-0.31595442485289255,-0.2903496213,53.0,5.081865377201806e-21,-9.407477420524096,0.855225220047645,3.6081244178132824e-19,7.622798065802708e-20
33
+ mean_cert_acc_36,aol,sdp,121,121,4,117,0,0.03305785123966942,-0.29394078019173553,-0.27176492290000004,115.0,2.3064868484496506e-20,-9.247107995153597,0.8406461813775997,1.5222813199767693e-18,3.229081587829511e-19
34
+ mean_cert_acc_36,aol,sandwich,121,121,9,112,0,0.0743801652892562,-0.3362883788859505,-0.3413665891,135.0,3.7368566478163725e-20,-9.195375922453437,0.8359432656775851,2.4289568210806422e-18,4.857913642161284e-19
35
+ mean_cert_acc_36,aol,ortho,121,121,8,113,0,0.06611570247933884,-0.31452074730661156,-0.298160661,140.0,4.214205424175081e-20,-9.1824429042784,0.8347675367525818,2.6970914714720518e-18,5.057046509010097e-19
36
+ mean_cert_acc_36,ldlt,sandwich,121,121,22,99,0,0.18181818181818182,-0.1593331515289256,-0.07613579920000002,770.0,4.257286781467921e-14,-7.552882614223359,0.6866256922021235,2.0860705229192814e-12,4.683015459614713e-13
37
+ mean_cert_acc_36,aol,ldlt,121,117,22,95,4,0.19834710743801653,-0.17695522735702482,-0.1111815423,872.0,2.3097599957727363e-12,-7.014376890817237,0.6484793729556723,1.016294398140004e-10,2.3097599957727362e-11
38
+ mean_cert_acc_36,ldlt,ldlt-resnet,121,121,34,87,0,0.2809917355371901,-0.1389991974958678,-0.061314076199999956,1073.0,1.2954860468318954e-11,-6.769141712815935,0.6153765193469032,5.311492792010771e-10,1.1659374421487058e-10
39
+ mean_cert_acc_36,ldlt,sdp,121,121,38,83,0,0.3140495867768595,-0.11698555283471074,-0.05446506109999999,1275.0,4.1935525354513343e-10,-6.246647778544319,0.5678770707767563,1.4258078620534537e-08,3.3548420283610675e-09
40
+ mean_cert_acc_36,ldlt,ortho,121,121,40,81,0,0.3305785123966942,-0.1375655199495868,-0.05810886200000001,1346.0,1.336065624102734e-09,-6.06299892045875,0.5511817200417046,4.275409997128749e-08,9.352459368719139e-09
41
+ mean_cert_acc_36,sandwich,sdp,121,121,89,32,0,0.7355371900826446,0.04234759869421486,0.023600280299999943,1459.0,7.893695356058128e-09,5.770712709702847,0.5246102463366225,2.4470455603780194e-07,4.7362172136348766e-08
42
+ mean_cert_acc_36,ortho,sandwich,121,120,33,87,1,0.2768595041322314,-0.02176763157933884,-0.016444489399999984,1846.0,3.000975576009626e-06,-4.670753039166412,0.4263794666812091,6.380885828874041e-05,1.5004877880048131e-05
43
+ mean_cert_acc_36,ldlt-resnet,sdp,121,121,81,40,0,0.6694214876033058,0.02201364466115702,0.010049086099999993,2305.0,0.00034039195053310725,3.58244603448608,0.32567691222600725,0.005446271208529716,0.001361567802132429
44
+ mean_cert_acc_36,ldlt-resnet,sandwich,121,121,50,71,0,0.4132231404958678,-0.02033395403305785,-0.009377405099999986,2753.0,0.015365507519162087,-2.4236476060024956,0.22033160054568143,0.18438609022994504,0.04609652255748626
45
+ mean_cert_acc_36,ortho,sdp,121,121,65,56,0,0.5371900826446281,0.02057996711487603,0.0014110952000000454,2942.0,0.05301735742636078,1.934779518985984,0.175889047180544,0.3945563974079814,0.10603471485272156
46
+ mean_cert_acc_36,ldlt-resnet,ortho,121,121,75,46,0,0.6198347107438017,0.0014336775462809915,0.006488025200000025,3172.0,0.1802906425434847,1.3398606829341437,0.1218055166303767,1.0,0.1802906425434847
47
+ mean_cert_acc_72,aol,sdp,121,121,0,121,0,0.0,-0.26562159861322315,-0.24182313309999998,0.0,1.3667681100678347e-21,-9.544567413179516,0.8676879466526833,1.025076082550876e-19,2.0501521651017522e-20
48
+ mean_cert_acc_72,aol,ldlt-resnet,121,121,1,120,0,0.008264462809917356,-0.30451178866033063,-0.2825206725,25.0,2.5452120986672276e-21,-9.47990232230432,0.8618093020276654,1.8834569530137485e-19,3.5632969381341184e-20
49
+ mean_cert_acc_72,aol,ortho,121,121,4,117,0,0.03305785123966942,-0.2930986073024794,-0.2681985311,45.0,4.173048144910383e-21,-9.42817024960416,0.8571063863276508,3.04632514578458e-19,5.424962588383498e-20
50
+ mean_cert_acc_72,aol,sandwich,121,121,6,115,0,0.049586776859504134,-0.332593737,-0.3329101392,80.0,9.850602055157206e-21,-9.337639122378876,0.8488762838526251,6.796915418058472e-19,1.1820722466188648e-19
51
+ mean_cert_acc_72,ldlt,sandwich,121,121,16,105,0,0.1322314049586777,-0.16179231059090907,-0.08644032480000008,509.0,1.9038706859410887e-16,-8.227986162960445,0.7479987420873132,1.0852062909864206e-14,2.0942577545351975e-15
52
+ mean_cert_acc_72,aol,ldlt,121,103,10,93,18,0.15702479338842976,-0.1708014264090909,-0.08492797240000005,304.0,5.7816595349340996e-15,-7.8086220392301975,0.7694063917372481,3.006462958165732e-13,5.7816595349341e-14
53
+ mean_cert_acc_72,ldlt,ldlt-resnet,121,121,30,91,0,0.24793388429752067,-0.13371036225123967,-0.0764530534,873.0,3.1819944830916117e-13,-7.2864624398175355,0.6624056763470487,1.5273573518839737e-11,2.8637950347824507e-12
54
+ mean_cert_acc_72,sandwich,sdp,121,121,95,26,0,0.7851239669421488,0.06697213838677687,0.03906400500000007,1169.0,6.992043780196073e-11,6.5208277638551655,0.5928025239868332,2.796817512078429e-09,5.593635024156859e-10
55
+ mean_cert_acc_72,ortho,sandwich,121,120,22,98,1,0.1859504132231405,-0.03949512969752067,-0.031834617300000034,1154.0,8.991026434826412e-11,-6.483010456101179,0.5918151778914119,3.5065003095823004e-09,6.293718504378489e-10
56
+ mean_cert_acc_72,ldlt,sdp,121,121,34,87,0,0.2809917355371901,-0.09482017220413223,-0.04369919,1219.0,1.6426888021305817e-10,-6.391497582104767,0.581045234736797,6.24221744809621e-09,9.85613281278349e-10
57
+ mean_cert_acc_72,ldlt,ortho,121,121,36,85,0,0.2975206611570248,-0.12229718089338842,-0.045210240900000004,1256.0,3.058317885864245e-10,-6.295793247609471,0.5723448406917702,1.0704112600524858e-08,1.5291589429321226e-09
58
+ mean_cert_acc_72,ldlt-resnet,sdp,121,121,89,32,0,0.7355371900826446,0.03889019004710745,0.020161554299999995,1852.0,1.9925594333326717e-06,4.754177481144703,0.43219795283133666,4.9813985833316794e-05,7.970237733330687e-06
59
+ mean_cert_acc_72,ldlt-resnet,sandwich,121,121,49,72,0,0.4049586776859504,-0.028081948339669427,-0.01332545279999997,2656.0,0.007483002786027263,-2.6745481585982716,0.24314074169075195,0.09727903621835442,0.02244900835808179
60
+ mean_cert_acc_72,ortho,sdp,121,121,67,54,0,0.5537190082644629,0.027477008689256194,0.004555895900000051,2784.0,0.01910566262360874,2.3434628933172474,0.21304208121065885,0.21016228885969615,0.03821132524721748
61
+ mean_cert_acc_72,ldlt-resnet,ortho,121,121,74,47,0,0.6115702479338843,0.011413181357851243,0.00889010730000006,2855.0,0.030787068682592327,2.1598140352316797,0.19634673047560725,0.3078706868259233,0.03821132524721748
62
+ mean_test_acc,aol,ldlt,121,121,16,105,0,0.1322314049586777,-0.11958352569586778,-0.06315010610000005,409.0,2.1268544183487774e-17,-8.486646526461245,0.7715133205873859,1.2548441068257787e-15,3.1902816275231663e-16
63
+ mean_test_acc,aol,sandwich,121,121,23,98,0,0.19008264462809918,-0.11132838667768594,-0.06561486950000006,698.0,1.0010877948097709e-14,-7.739118075943935,0.703556188722176,5.105547753529832e-13,1.4015229127336793e-13
64
+ mean_test_acc,aol,ortho,121,121,25,96,0,0.2066115702479339,-0.09866207272396695,-0.05250947429999997,908.0,6.203585473534351e-13,-7.195931312592255,0.6541755738720232,2.915685172561145e-11,8.064661115594657e-12
65
+ mean_test_acc,aol,sdp,121,121,24,97,0,0.19834710743801653,-0.09612382466942149,-0.044510062900000036,1047.0,8.121173320702691e-12,-6.836393407326143,0.6214903097569221,3.4108927946951305e-10,9.74540798484323e-11
66
+ mean_test_acc,aol,ldlt-resnet,121,121,27,94,0,0.2231404958677686,-0.09206069528677686,-0.03569083780000004,1307.0,7.098533094861746e-10,-6.163876462224062,0.5603524056567329,2.3425159213043762e-08,7.80838640434792e-09
67
+ mean_test_acc,ldlt,sdp,121,121,86,35,0,0.7107438016528925,0.023459701026446286,0.010278406500000004,1511.0,1.7383406684454798e-08,5.636209320682431,0.5123826655165846,5.041187938491891e-07,1.7383406684454799e-07
68
+ mean_test_acc,ldlt,ldlt-resnet,121,121,87,34,0,0.71900826446281,0.02752283040909091,0.01248115980000003,1779.0,7.69296628945801e-07,4.942999546500287,0.44936359513638974,2.000171235259083e-05,6.923669660512209e-06
69
+ mean_test_acc,ldlt,ortho,121,121,78,43,0,0.6446280991735537,0.020921452971900834,0.010356299000000013,2002.0,1.264342847332638e-05,4.366186935893503,0.39692608508122756,0.0002528685694665276,0.00010114742778661104
70
+ mean_test_acc,ortho,sandwich,121,120,39,81,1,0.32644628099173556,-0.01266631395371901,-0.007894689300000035,2171.0,0.00013365710865816523,-3.8196205817909794,0.3486820589596543,0.0025394850645051393,0.0009355997606071565
71
+ mean_test_acc,sandwich,sdp,121,121,80,41,0,0.6611570247933884,0.015204562008264456,0.006305895000000006,2279.0,0.00026254907665535047,3.6496977289962866,0.33179070263602606,0.004631605001393634,0.001575294459932103
72
+ mean_test_acc,ldlt-resnet,sandwich,121,121,47,74,0,0.3884297520661157,-0.019267691390909086,-0.01009704999999994,2411.0,0.0009387558222226796,-3.308266049175231,0.3007514590159301,0.014081337333340193,0.004693779111113398
73
+ mean_test_acc,ldlt,sandwich,121,120,64,56,1,0.5330578512396694,0.008255139018181824,0.0008221223000000055,3145.0,0.2044973939148288,1.2688420787642989,0.11582890474182553,1.0,0.8179895756593152
74
+ mean_test_acc,ldlt-resnet,ortho,121,121,54,67,0,0.4462809917355372,-0.006601377437190076,-0.0023532391000000152,3206.0,0.2106004158723539,-1.2519161593438723,0.11381055994035204,1.0,0.8179895756593152
75
+ mean_test_acc,ortho,sdp,121,121,60,61,0,0.49586776859504134,0.002538248054545448,-6.572600000032125e-06,3382.0,0.42564043452591804,0.7966739195824637,0.07242490178022397,1.0,0.8512808690518361
76
+ mean_test_acc,ldlt-resnet,sdp,121,121,58,63,0,0.4793388429752066,-0.0040631293826446264,-0.000977559300000097,3627.0,0.8705530555843003,-0.16295602900550393,0.014814184455045813,1.0,0.8705530555843003
UCI_N6/wilcoxon_pairwise_all.json ADDED
@@ -0,0 +1,1427 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metric":"mean_cert_acc_108",
4
+ "alg_a":"aol",
5
+ "alg_b":"ldlt-resnet",
6
+ "n_common":121,
7
+ "n_nonzero":121,
8
+ "wins_a":1,
9
+ "wins_b":120,
10
+ "ties":0,
11
+ "win_rate_a_over_b":0.0082644628,
12
+ "mean_diff_a_minus_b":-0.2739230915,
13
+ "median_diff_a_minus_b":-0.2317528344,
14
+ "W_stat":45.0,
15
+ "p_two_sided":4.173048145e-21,
16
+ "z_equiv":-9.4281702496,
17
+ "effect_size_r":0.8571063863,
18
+ "p_holm_global":3.046325146e-19,
19
+ "p_holm_within_metric":6.259572217e-20
20
+ },
21
+ {
22
+ "metric":"mean_cert_acc_108",
23
+ "alg_a":"aol",
24
+ "alg_b":"ortho",
25
+ "n_common":121,
26
+ "n_nonzero":120,
27
+ "wins_a":3,
28
+ "wins_b":117,
29
+ "ties":1,
30
+ "win_rate_a_over_b":0.0289256198,
31
+ "mean_diff_a_minus_b":-0.2489971982,
32
+ "median_diff_a_minus_b":-0.2098822109,
33
+ "W_stat":60.0,
34
+ "p_two_sided":8.927572293e-21,
35
+ "z_equiv":-9.3480532511,
36
+ "effect_size_r":0.8533566057,
37
+ "p_holm_global":6.249300605e-19,
38
+ "p_holm_within_metric":1.249860121e-19
39
+ },
40
+ {
41
+ "metric":"mean_cert_acc_108",
42
+ "alg_a":"aol",
43
+ "alg_b":"sandwich",
44
+ "n_common":121,
45
+ "n_nonzero":121,
46
+ "wins_a":5,
47
+ "wins_b":116,
48
+ "ties":0,
49
+ "win_rate_a_over_b":0.041322314,
50
+ "mean_diff_a_minus_b":-0.2999183728,
51
+ "median_diff_a_minus_b":-0.2735294178,
52
+ "W_stat":82.0,
53
+ "p_two_sided":1.034358853e-20,
54
+ "z_equiv":-9.3324659151,
55
+ "effect_size_r":0.8484059923,
56
+ "p_holm_global":7.033640204e-19,
57
+ "p_holm_within_metric":1.34466651e-19
58
+ },
59
+ {
60
+ "metric":"mean_cert_acc_108",
61
+ "alg_a":"aol",
62
+ "alg_b":"sdp",
63
+ "n_common":121,
64
+ "n_nonzero":117,
65
+ "wins_a":1,
66
+ "wins_b":116,
67
+ "ties":4,
68
+ "win_rate_a_over_b":0.0247933884,
69
+ "mean_diff_a_minus_b":-0.2222316045,
70
+ "median_diff_a_minus_b":-0.1720663907,
71
+ "W_stat":34.0,
72
+ "p_two_sided":1.49193415e-20,
73
+ "z_equiv":-9.2935734145,
74
+ "effect_size_r":0.8591911661,
75
+ "p_holm_global":9.995958805e-19,
76
+ "p_holm_within_metric":1.79032098e-19
77
+ },
78
+ {
79
+ "metric":"mean_cert_acc_108",
80
+ "alg_a":"ldlt",
81
+ "alg_b":"sandwich",
82
+ "n_common":121,
83
+ "n_nonzero":121,
84
+ "wins_a":14,
85
+ "wins_b":107,
86
+ "ties":0,
87
+ "win_rate_a_over_b":0.1157024793,
88
+ "mean_diff_a_minus_b":-0.1491411817,
89
+ "median_diff_a_minus_b":-0.0818716213,
90
+ "W_stat":450.0,
91
+ "p_two_sided":5.266046065e-17,
92
+ "z_equiv":-8.3805957774,
93
+ "effect_size_r":0.7618723434,
94
+ "p_holm_global":0.0,
95
+ "p_holm_within_metric":5.792650671e-16
96
+ },
97
+ {
98
+ "metric":"mean_cert_acc_108",
99
+ "alg_a":"aol",
100
+ "alg_b":"ldlt",
101
+ "n_common":121,
102
+ "n_nonzero":96,
103
+ "wins_a":6,
104
+ "wins_b":90,
105
+ "ties":25,
106
+ "win_rate_a_over_b":0.152892562,
107
+ "mean_diff_a_minus_b":-0.1507771911,
108
+ "median_diff_a_minus_b":-0.0671557561,
109
+ "W_stat":113.0,
110
+ "p_two_sided":5.846618541e-16,
111
+ "z_equiv":-8.0924712901,
112
+ "effect_size_r":0.8259343925,
113
+ "p_holm_global":0.0,
114
+ "p_holm_within_metric":0.0
115
+ },
116
+ {
117
+ "metric":"mean_cert_acc_108",
118
+ "alg_a":"ldlt",
119
+ "alg_b":"ldlt-resnet",
120
+ "n_common":121,
121
+ "n_nonzero":121,
122
+ "wins_a":25,
123
+ "wins_b":96,
124
+ "ties":0,
125
+ "win_rate_a_over_b":0.2066115702,
126
+ "mean_diff_a_minus_b":-0.1231459003,
127
+ "median_diff_a_minus_b":-0.0714981307,
128
+ "W_stat":733.0,
129
+ "p_two_sided":0.0,
130
+ "z_equiv":-7.6485869487,
131
+ "effect_size_r":0.6953260862,
132
+ "p_holm_global":0.0,
133
+ "p_holm_within_metric":0.0
134
+ },
135
+ {
136
+ "metric":"mean_cert_acc_108",
137
+ "alg_a":"ortho",
138
+ "alg_b":"sandwich",
139
+ "n_common":121,
140
+ "n_nonzero":120,
141
+ "wins_a":18,
142
+ "wins_b":102,
143
+ "ties":1,
144
+ "win_rate_a_over_b":0.152892562,
145
+ "mean_diff_a_minus_b":-0.0509211747,
146
+ "median_diff_a_minus_b":-0.0375725031,
147
+ "W_stat":945.0,
148
+ "p_two_sided":0.0,
149
+ "z_equiv":-7.0303540979,
150
+ "effect_size_r":0.6417805878,
151
+ "p_holm_global":0.0000000001,
152
+ "p_holm_within_metric":0.0
153
+ },
154
+ {
155
+ "metric":"mean_cert_acc_108",
156
+ "alg_a":"sandwich",
157
+ "alg_b":"sdp",
158
+ "n_common":121,
159
+ "n_nonzero":121,
160
+ "wins_a":93,
161
+ "wins_b":28,
162
+ "ties":0,
163
+ "win_rate_a_over_b":0.7685950413,
164
+ "mean_diff_a_minus_b":0.0776867683,
165
+ "median_diff_a_minus_b":0.043483858,
166
+ "W_stat":995.0,
167
+ "p_two_sided":0.0,
168
+ "z_equiv":6.9708967963,
169
+ "effect_size_r":0.6337178906,
170
+ "p_holm_global":0.0000000001,
171
+ "p_holm_within_metric":0.0
172
+ },
173
+ {
174
+ "metric":"mean_cert_acc_108",
175
+ "alg_a":"ldlt",
176
+ "alg_b":"ortho",
177
+ "n_common":121,
178
+ "n_nonzero":120,
179
+ "wins_a":32,
180
+ "wins_b":88,
181
+ "ties":1,
182
+ "win_rate_a_over_b":0.2685950413,
183
+ "mean_diff_a_minus_b":-0.098220007,
184
+ "median_diff_a_minus_b":-0.035191671,
185
+ "W_stat":1203.0,
186
+ "p_two_sided":0.0000000002,
187
+ "z_equiv":-6.3546858702,
188
+ "effect_size_r":0.5801007995,
189
+ "p_holm_global":0.0000000077,
190
+ "p_holm_within_metric":0.0000000013
191
+ },
192
+ {
193
+ "metric":"mean_cert_acc_108",
194
+ "alg_a":"ldlt",
195
+ "alg_b":"sdp",
196
+ "n_common":121,
197
+ "n_nonzero":117,
198
+ "wins_a":35,
199
+ "wins_b":82,
200
+ "ties":4,
201
+ "win_rate_a_over_b":0.305785124,
202
+ "mean_diff_a_minus_b":-0.0714544134,
203
+ "median_diff_a_minus_b":-0.0293723642,
204
+ "W_stat":1335.0,
205
+ "p_two_sided":0.0000000087,
206
+ "z_equiv":-5.7551072125,
207
+ "effect_size_r":0.53205985,
208
+ "p_holm_global":0.0000002598,
209
+ "p_holm_within_metric":0.0000000433
210
+ },
211
+ {
212
+ "metric":"mean_cert_acc_108",
213
+ "alg_a":"ldlt-resnet",
214
+ "alg_b":"sdp",
215
+ "n_common":121,
216
+ "n_nonzero":121,
217
+ "wins_a":89,
218
+ "wins_b":32,
219
+ "ties":0,
220
+ "win_rate_a_over_b":0.7355371901,
221
+ "mean_diff_a_minus_b":0.0516914869,
222
+ "median_diff_a_minus_b":0.0233454705,
223
+ "W_stat":1603.0,
224
+ "p_two_sided":0.0000000673,
225
+ "z_equiv":5.3982417863,
226
+ "effect_size_r":0.4907492533,
227
+ "p_holm_global":0.0000018843,
228
+ "p_holm_within_metric":0.0000002692
229
+ },
230
+ {
231
+ "metric":"mean_cert_acc_108",
232
+ "alg_a":"ldlt-resnet",
233
+ "alg_b":"ortho",
234
+ "n_common":121,
235
+ "n_nonzero":121,
236
+ "wins_a":81,
237
+ "wins_b":40,
238
+ "ties":0,
239
+ "win_rate_a_over_b":0.6694214876,
240
+ "mean_diff_a_minus_b":0.0249258933,
241
+ "median_diff_a_minus_b":0.0182105228,
242
+ "W_stat":2277.0,
243
+ "p_two_sided":0.0002573114,
244
+ "z_equiv":3.6548709363,
245
+ "effect_size_r":0.3322609942,
246
+ "p_holm_global":0.004631605,
247
+ "p_holm_within_metric":0.0007719342
248
+ },
249
+ {
250
+ "metric":"mean_cert_acc_108",
251
+ "alg_a":"ldlt-resnet",
252
+ "alg_b":"sandwich",
253
+ "n_common":121,
254
+ "n_nonzero":121,
255
+ "wins_a":54,
256
+ "wins_b":67,
257
+ "ties":0,
258
+ "win_rate_a_over_b":0.4462809917,
259
+ "mean_diff_a_minus_b":-0.0259952814,
260
+ "median_diff_a_minus_b":-0.0096504689,
261
+ "W_stat":2867.0,
262
+ "p_two_sided":0.0332728975,
263
+ "z_equiv":-2.1287747916,
264
+ "effect_size_r":0.1935249811,
265
+ "p_holm_global":0.3078706868,
266
+ "p_holm_within_metric":0.066545795
267
+ },
268
+ {
269
+ "metric":"mean_cert_acc_108",
270
+ "alg_a":"ortho",
271
+ "alg_b":"sdp",
272
+ "n_common":121,
273
+ "n_nonzero":121,
274
+ "wins_a":67,
275
+ "wins_b":54,
276
+ "ties":0,
277
+ "win_rate_a_over_b":0.5537190083,
278
+ "mean_diff_a_minus_b":0.0267655936,
279
+ "median_diff_a_minus_b":0.0061113834,
280
+ "W_stat":2930.0,
281
+ "p_two_sided":0.0493195497,
282
+ "z_equiv":1.9658187626,
283
+ "effect_size_r":0.1787107966,
284
+ "p_holm_global":0.3945563974,
285
+ "p_holm_within_metric":0.066545795
286
+ },
287
+ {
288
+ "metric":"mean_cert_acc_255",
289
+ "alg_a":"aol",
290
+ "alg_b":"ldlt-resnet",
291
+ "n_common":121,
292
+ "n_nonzero":110,
293
+ "wins_a":0,
294
+ "wins_b":110,
295
+ "ties":11,
296
+ "win_rate_a_over_b":0.0454545455,
297
+ "mean_diff_a_minus_b":-0.1337634204,
298
+ "median_diff_a_minus_b":-0.0716657937,
299
+ "W_stat":0.0,
300
+ "p_two_sided":8.869456124e-20,
301
+ "z_equiv":-9.1019863804,
302
+ "effect_size_r":0.8678403502,
303
+ "p_holm_global":5.587757358e-18,
304
+ "p_holm_within_metric":1.330418419e-18
305
+ },
306
+ {
307
+ "metric":"mean_cert_acc_255",
308
+ "alg_a":"aol",
309
+ "alg_b":"sandwich",
310
+ "n_common":121,
311
+ "n_nonzero":114,
312
+ "wins_a":2,
313
+ "wins_b":112,
314
+ "ties":7,
315
+ "win_rate_a_over_b":0.0454545455,
316
+ "mean_diff_a_minus_b":-0.1626829197,
317
+ "median_diff_a_minus_b":-0.0885858461,
318
+ "W_stat":74.0,
319
+ "p_two_sided":1.351396746e-19,
320
+ "z_equiv":-9.0561471899,
321
+ "effect_size_r":0.8481858966,
322
+ "p_holm_global":8.378659827e-18,
323
+ "p_holm_within_metric":1.891955445e-18
324
+ },
325
+ {
326
+ "metric":"mean_cert_acc_255",
327
+ "alg_a":"aol",
328
+ "alg_b":"sdp",
329
+ "n_common":121,
330
+ "n_nonzero":103,
331
+ "wins_a":2,
332
+ "wins_b":101,
333
+ "ties":18,
334
+ "win_rate_a_over_b":0.0909090909,
335
+ "mean_diff_a_minus_b":-0.1051036161,
336
+ "median_diff_a_minus_b":-0.0429337709,
337
+ "W_stat":22.0,
338
+ "p_two_sided":2.407012276e-18,
339
+ "z_equiv":-8.7363791132,
340
+ "effect_size_r":0.8608210125,
341
+ "p_holm_global":1.468277489e-16,
342
+ "p_holm_within_metric":3.129115959e-17
343
+ },
344
+ {
345
+ "metric":"mean_cert_acc_255",
346
+ "alg_a":"aol",
347
+ "alg_b":"ortho",
348
+ "n_common":121,
349
+ "n_nonzero":105,
350
+ "wins_a":2,
351
+ "wins_b":103,
352
+ "ties":16,
353
+ "win_rate_a_over_b":0.0826446281,
354
+ "mean_diff_a_minus_b":-0.1135240161,
355
+ "median_diff_a_minus_b":-0.0488128485,
356
+ "W_stat":71.0,
357
+ "p_two_sided":4.454047917e-18,
358
+ "z_equiv":-8.66655163,
359
+ "effect_size_r":0.8457688368,
360
+ "p_holm_global":2.67242875e-16,
361
+ "p_holm_within_metric":5.344857501e-17
362
+ },
363
+ {
364
+ "metric":"mean_cert_acc_255",
365
+ "alg_a":"ldlt",
366
+ "alg_b":"sandwich",
367
+ "n_common":121,
368
+ "n_nonzero":114,
369
+ "wins_a":10,
370
+ "wins_b":104,
371
+ "ties":7,
372
+ "win_rate_a_over_b":0.1115702479,
373
+ "mean_diff_a_minus_b":-0.0879753088,
374
+ "median_diff_a_minus_b":-0.0350877196,
375
+ "W_stat":415.0,
376
+ "p_two_sided":5.869031305e-16,
377
+ "z_equiv":-8.0920053879,
378
+ "effect_size_r":0.7578857434,
379
+ "p_holm_global":0.0,
380
+ "p_holm_within_metric":0.0
381
+ },
382
+ {
383
+ "metric":"mean_cert_acc_255",
384
+ "alg_a":"ortho",
385
+ "alg_b":"sandwich",
386
+ "n_common":121,
387
+ "n_nonzero":114,
388
+ "wins_a":17,
389
+ "wins_b":97,
390
+ "ties":7,
391
+ "win_rate_a_over_b":0.1694214876,
392
+ "mean_diff_a_minus_b":-0.0491589036,
393
+ "median_diff_a_minus_b":-0.0273425561,
394
+ "W_stat":465.0,
395
+ "p_two_sided":0.0,
396
+ "z_equiv":-7.9506356222,
397
+ "effect_size_r":0.7446452517,
398
+ "p_holm_global":0.0,
399
+ "p_holm_within_metric":0.0
400
+ },
401
+ {
402
+ "metric":"mean_cert_acc_255",
403
+ "alg_a":"aol",
404
+ "alg_b":"ldlt",
405
+ "n_common":121,
406
+ "n_nonzero":87,
407
+ "wins_a":3,
408
+ "wins_b":84,
409
+ "ties":34,
410
+ "win_rate_a_over_b":0.1652892562,
411
+ "mean_diff_a_minus_b":-0.0747076109,
412
+ "median_diff_a_minus_b":-0.0172084123,
413
+ "W_stat":48.0,
414
+ "p_two_sided":0.0,
415
+ "z_equiv":-7.8955227184,
416
+ "effect_size_r":0.8464888875,
417
+ "p_holm_global":0.0,
418
+ "p_holm_within_metric":0.0
419
+ },
420
+ {
421
+ "metric":"mean_cert_acc_255",
422
+ "alg_a":"ldlt",
423
+ "alg_b":"ldlt-resnet",
424
+ "n_common":121,
425
+ "n_nonzero":110,
426
+ "wins_a":20,
427
+ "wins_b":90,
428
+ "ties":11,
429
+ "win_rate_a_over_b":0.2107438017,
430
+ "mean_diff_a_minus_b":-0.0590558095,
431
+ "median_diff_a_minus_b":-0.0295574367,
432
+ "W_stat":685.0,
433
+ "p_two_sided":0.0,
434
+ "z_equiv":-7.0591093586,
435
+ "effect_size_r":0.6730596687,
436
+ "p_holm_global":0.0000000001,
437
+ "p_holm_within_metric":0.0
438
+ },
439
+ {
440
+ "metric":"mean_cert_acc_255",
441
+ "alg_a":"sandwich",
442
+ "alg_b":"sdp",
443
+ "n_common":121,
444
+ "n_nonzero":114,
445
+ "wins_a":84,
446
+ "wins_b":30,
447
+ "ties":7,
448
+ "win_rate_a_over_b":0.7231404959,
449
+ "mean_diff_a_minus_b":0.0575793037,
450
+ "median_diff_a_minus_b":0.0163958966,
451
+ "W_stat":1043.0,
452
+ "p_two_sided":0.0000000003,
453
+ "z_equiv":6.3164011309,
454
+ "effect_size_r":0.5915851679,
455
+ "p_holm_global":0.0000000096,
456
+ "p_holm_within_metric":0.0000000019
457
+ },
458
+ {
459
+ "metric":"mean_cert_acc_255",
460
+ "alg_a":"ldlt-resnet",
461
+ "alg_b":"sdp",
462
+ "n_common":121,
463
+ "n_nonzero":111,
464
+ "wins_a":80,
465
+ "wins_b":31,
466
+ "ties":10,
467
+ "win_rate_a_over_b":0.7024793388,
468
+ "mean_diff_a_minus_b":0.0286598044,
469
+ "median_diff_a_minus_b":0.0146750305,
470
+ "W_stat":1338.0,
471
+ "p_two_sided":0.0000001926,
472
+ "z_equiv":5.2063487426,
473
+ "effect_size_r":0.4941647538,
474
+ "p_holm_global":0.0000052,
475
+ "p_holm_within_metric":0.0000011556
476
+ },
477
+ {
478
+ "metric":"mean_cert_acc_255",
479
+ "alg_a":"ldlt",
480
+ "alg_b":"sdp",
481
+ "n_common":121,
482
+ "n_nonzero":103,
483
+ "wins_a":27,
484
+ "wins_b":76,
485
+ "ties":18,
486
+ "win_rate_a_over_b":0.2975206612,
487
+ "mean_diff_a_minus_b":-0.0303960051,
488
+ "median_diff_a_minus_b":-0.0085921446,
489
+ "W_stat":1234.0,
490
+ "p_two_sided":0.0000020443,
491
+ "z_equiv":-4.7489976464,
492
+ "effect_size_r":0.4679326423,
493
+ "p_holm_global":0.000049814,
494
+ "p_holm_within_metric":0.0000102214
495
+ },
496
+ {
497
+ "metric":"mean_cert_acc_255",
498
+ "alg_a":"ldlt-resnet",
499
+ "alg_b":"ortho",
500
+ "n_common":121,
501
+ "n_nonzero":112,
502
+ "wins_a":79,
503
+ "wins_b":33,
504
+ "ties":9,
505
+ "win_rate_a_over_b":0.6900826446,
506
+ "mean_diff_a_minus_b":0.0202394043,
507
+ "median_diff_a_minus_b":0.0148802027,
508
+ "W_stat":1541.0,
509
+ "p_two_sided":0.0000024732,
510
+ "z_equiv":4.7103245755,
511
+ "effect_size_r":0.4450838365,
512
+ "p_holm_global":0.0000568842,
513
+ "p_holm_within_metric":0.0000102214
514
+ },
515
+ {
516
+ "metric":"mean_cert_acc_255",
517
+ "alg_a":"ldlt",
518
+ "alg_b":"ortho",
519
+ "n_common":121,
520
+ "n_nonzero":104,
521
+ "wins_a":30,
522
+ "wins_b":74,
523
+ "ties":17,
524
+ "win_rate_a_over_b":0.3181818182,
525
+ "mean_diff_a_minus_b":-0.0388164052,
526
+ "median_diff_a_minus_b":-0.0039353251,
527
+ "W_stat":1287.0,
528
+ "p_two_sided":0.0000029004,
529
+ "z_equiv":-4.6777497092,
530
+ "effect_size_r":0.4586910971,
531
+ "p_holm_global":0.0000638089,
532
+ "p_holm_within_metric":0.0000102214
533
+ },
534
+ {
535
+ "metric":"mean_cert_acc_255",
536
+ "alg_a":"ldlt-resnet",
537
+ "alg_b":"sandwich",
538
+ "n_common":121,
539
+ "n_nonzero":115,
540
+ "wins_a":45,
541
+ "wins_b":70,
542
+ "ties":6,
543
+ "win_rate_a_over_b":0.3966942149,
544
+ "mean_diff_a_minus_b":-0.0289194993,
545
+ "median_diff_a_minus_b":-0.0067800414,
546
+ "W_stat":2292.0,
547
+ "p_two_sided":0.003621671,
548
+ "z_equiv":-2.9093621184,
549
+ "effect_size_r":0.2712994164,
550
+ "p_holm_global":0.050703394,
551
+ "p_holm_within_metric":0.007243342
552
+ },
553
+ {
554
+ "metric":"mean_cert_acc_255",
555
+ "alg_a":"ortho",
556
+ "alg_b":"sdp",
557
+ "n_common":121,
558
+ "n_nonzero":107,
559
+ "wins_a":51,
560
+ "wins_b":56,
561
+ "ties":14,
562
+ "win_rate_a_over_b":0.479338843,
563
+ "mean_diff_a_minus_b":0.0084204,
564
+ "median_diff_a_minus_b":0.0,
565
+ "W_stat":2810.0,
566
+ "p_two_sided":0.8072471563,
567
+ "z_equiv":0.2439789068,
568
+ "effect_size_r":0.0235863312,
569
+ "p_holm_global":1.0,
570
+ "p_holm_within_metric":0.8072471563
571
+ },
572
+ {
573
+ "metric":"mean_cert_acc_36",
574
+ "alg_a":"aol",
575
+ "alg_b":"ldlt-resnet",
576
+ "n_common":121,
577
+ "n_nonzero":121,
578
+ "wins_a":3,
579
+ "wins_b":118,
580
+ "ties":0,
581
+ "win_rate_a_over_b":0.0247933884,
582
+ "mean_diff_a_minus_b":-0.3159544249,
583
+ "median_diff_a_minus_b":-0.2903496213,
584
+ "W_stat":53.0,
585
+ "p_two_sided":5.081865377e-21,
586
+ "z_equiv":-9.4074774205,
587
+ "effect_size_r":0.85522522,
588
+ "p_holm_global":3.608124418e-19,
589
+ "p_holm_within_metric":7.622798066e-20
590
+ },
591
+ {
592
+ "metric":"mean_cert_acc_36",
593
+ "alg_a":"aol",
594
+ "alg_b":"sdp",
595
+ "n_common":121,
596
+ "n_nonzero":121,
597
+ "wins_a":4,
598
+ "wins_b":117,
599
+ "ties":0,
600
+ "win_rate_a_over_b":0.0330578512,
601
+ "mean_diff_a_minus_b":-0.2939407802,
602
+ "median_diff_a_minus_b":-0.2717649229,
603
+ "W_stat":115.0,
604
+ "p_two_sided":2.306486848e-20,
605
+ "z_equiv":-9.2471079952,
606
+ "effect_size_r":0.8406461814,
607
+ "p_holm_global":1.52228132e-18,
608
+ "p_holm_within_metric":3.229081588e-19
609
+ },
610
+ {
611
+ "metric":"mean_cert_acc_36",
612
+ "alg_a":"aol",
613
+ "alg_b":"sandwich",
614
+ "n_common":121,
615
+ "n_nonzero":121,
616
+ "wins_a":9,
617
+ "wins_b":112,
618
+ "ties":0,
619
+ "win_rate_a_over_b":0.0743801653,
620
+ "mean_diff_a_minus_b":-0.3362883789,
621
+ "median_diff_a_minus_b":-0.3413665891,
622
+ "W_stat":135.0,
623
+ "p_two_sided":3.736856648e-20,
624
+ "z_equiv":-9.1953759225,
625
+ "effect_size_r":0.8359432657,
626
+ "p_holm_global":2.428956821e-18,
627
+ "p_holm_within_metric":4.857913642e-19
628
+ },
629
+ {
630
+ "metric":"mean_cert_acc_36",
631
+ "alg_a":"aol",
632
+ "alg_b":"ortho",
633
+ "n_common":121,
634
+ "n_nonzero":121,
635
+ "wins_a":8,
636
+ "wins_b":113,
637
+ "ties":0,
638
+ "win_rate_a_over_b":0.0661157025,
639
+ "mean_diff_a_minus_b":-0.3145207473,
640
+ "median_diff_a_minus_b":-0.298160661,
641
+ "W_stat":140.0,
642
+ "p_two_sided":4.214205424e-20,
643
+ "z_equiv":-9.1824429043,
644
+ "effect_size_r":0.8347675368,
645
+ "p_holm_global":2.697091471e-18,
646
+ "p_holm_within_metric":5.057046509e-19
647
+ },
648
+ {
649
+ "metric":"mean_cert_acc_36",
650
+ "alg_a":"ldlt",
651
+ "alg_b":"sandwich",
652
+ "n_common":121,
653
+ "n_nonzero":121,
654
+ "wins_a":22,
655
+ "wins_b":99,
656
+ "ties":0,
657
+ "win_rate_a_over_b":0.1818181818,
658
+ "mean_diff_a_minus_b":-0.1593331515,
659
+ "median_diff_a_minus_b":-0.0761357992,
660
+ "W_stat":770.0,
661
+ "p_two_sided":0.0,
662
+ "z_equiv":-7.5528826142,
663
+ "effect_size_r":0.6866256922,
664
+ "p_holm_global":0.0,
665
+ "p_holm_within_metric":0.0
666
+ },
667
+ {
668
+ "metric":"mean_cert_acc_36",
669
+ "alg_a":"aol",
670
+ "alg_b":"ldlt",
671
+ "n_common":121,
672
+ "n_nonzero":117,
673
+ "wins_a":22,
674
+ "wins_b":95,
675
+ "ties":4,
676
+ "win_rate_a_over_b":0.1983471074,
677
+ "mean_diff_a_minus_b":-0.1769552274,
678
+ "median_diff_a_minus_b":-0.1111815423,
679
+ "W_stat":872.0,
680
+ "p_two_sided":0.0,
681
+ "z_equiv":-7.0143768908,
682
+ "effect_size_r":0.648479373,
683
+ "p_holm_global":0.0000000001,
684
+ "p_holm_within_metric":0.0
685
+ },
686
+ {
687
+ "metric":"mean_cert_acc_36",
688
+ "alg_a":"ldlt",
689
+ "alg_b":"ldlt-resnet",
690
+ "n_common":121,
691
+ "n_nonzero":121,
692
+ "wins_a":34,
693
+ "wins_b":87,
694
+ "ties":0,
695
+ "win_rate_a_over_b":0.2809917355,
696
+ "mean_diff_a_minus_b":-0.1389991975,
697
+ "median_diff_a_minus_b":-0.0613140762,
698
+ "W_stat":1073.0,
699
+ "p_two_sided":0.0,
700
+ "z_equiv":-6.7691417128,
701
+ "effect_size_r":0.6153765193,
702
+ "p_holm_global":0.0000000005,
703
+ "p_holm_within_metric":0.0000000001
704
+ },
705
+ {
706
+ "metric":"mean_cert_acc_36",
707
+ "alg_a":"ldlt",
708
+ "alg_b":"sdp",
709
+ "n_common":121,
710
+ "n_nonzero":121,
711
+ "wins_a":38,
712
+ "wins_b":83,
713
+ "ties":0,
714
+ "win_rate_a_over_b":0.3140495868,
715
+ "mean_diff_a_minus_b":-0.1169855528,
716
+ "median_diff_a_minus_b":-0.0544650611,
717
+ "W_stat":1275.0,
718
+ "p_two_sided":0.0000000004,
719
+ "z_equiv":-6.2466477785,
720
+ "effect_size_r":0.5678770708,
721
+ "p_holm_global":0.0000000143,
722
+ "p_holm_within_metric":0.0000000034
723
+ },
724
+ {
725
+ "metric":"mean_cert_acc_36",
726
+ "alg_a":"ldlt",
727
+ "alg_b":"ortho",
728
+ "n_common":121,
729
+ "n_nonzero":121,
730
+ "wins_a":40,
731
+ "wins_b":81,
732
+ "ties":0,
733
+ "win_rate_a_over_b":0.3305785124,
734
+ "mean_diff_a_minus_b":-0.1375655199,
735
+ "median_diff_a_minus_b":-0.058108862,
736
+ "W_stat":1346.0,
737
+ "p_two_sided":0.0000000013,
738
+ "z_equiv":-6.0629989205,
739
+ "effect_size_r":0.55118172,
740
+ "p_holm_global":0.0000000428,
741
+ "p_holm_within_metric":0.0000000094
742
+ },
743
+ {
744
+ "metric":"mean_cert_acc_36",
745
+ "alg_a":"sandwich",
746
+ "alg_b":"sdp",
747
+ "n_common":121,
748
+ "n_nonzero":121,
749
+ "wins_a":89,
750
+ "wins_b":32,
751
+ "ties":0,
752
+ "win_rate_a_over_b":0.7355371901,
753
+ "mean_diff_a_minus_b":0.0423475987,
754
+ "median_diff_a_minus_b":0.0236002803,
755
+ "W_stat":1459.0,
756
+ "p_two_sided":0.0000000079,
757
+ "z_equiv":5.7707127097,
758
+ "effect_size_r":0.5246102463,
759
+ "p_holm_global":0.0000002447,
760
+ "p_holm_within_metric":0.0000000474
761
+ },
762
+ {
763
+ "metric":"mean_cert_acc_36",
764
+ "alg_a":"ortho",
765
+ "alg_b":"sandwich",
766
+ "n_common":121,
767
+ "n_nonzero":120,
768
+ "wins_a":33,
769
+ "wins_b":87,
770
+ "ties":1,
771
+ "win_rate_a_over_b":0.2768595041,
772
+ "mean_diff_a_minus_b":-0.0217676316,
773
+ "median_diff_a_minus_b":-0.0164444894,
774
+ "W_stat":1846.0,
775
+ "p_two_sided":0.000003001,
776
+ "z_equiv":-4.6707530392,
777
+ "effect_size_r":0.4263794667,
778
+ "p_holm_global":0.0000638089,
779
+ "p_holm_within_metric":0.0000150049
780
+ },
781
+ {
782
+ "metric":"mean_cert_acc_36",
783
+ "alg_a":"ldlt-resnet",
784
+ "alg_b":"sdp",
785
+ "n_common":121,
786
+ "n_nonzero":121,
787
+ "wins_a":81,
788
+ "wins_b":40,
789
+ "ties":0,
790
+ "win_rate_a_over_b":0.6694214876,
791
+ "mean_diff_a_minus_b":0.0220136447,
792
+ "median_diff_a_minus_b":0.0100490861,
793
+ "W_stat":2305.0,
794
+ "p_two_sided":0.000340392,
795
+ "z_equiv":3.5824460345,
796
+ "effect_size_r":0.3256769122,
797
+ "p_holm_global":0.0054462712,
798
+ "p_holm_within_metric":0.0013615678
799
+ },
800
+ {
801
+ "metric":"mean_cert_acc_36",
802
+ "alg_a":"ldlt-resnet",
803
+ "alg_b":"sandwich",
804
+ "n_common":121,
805
+ "n_nonzero":121,
806
+ "wins_a":50,
807
+ "wins_b":71,
808
+ "ties":0,
809
+ "win_rate_a_over_b":0.4132231405,
810
+ "mean_diff_a_minus_b":-0.020333954,
811
+ "median_diff_a_minus_b":-0.0093774051,
812
+ "W_stat":2753.0,
813
+ "p_two_sided":0.0153655075,
814
+ "z_equiv":-2.423647606,
815
+ "effect_size_r":0.2203316005,
816
+ "p_holm_global":0.1843860902,
817
+ "p_holm_within_metric":0.0460965226
818
+ },
819
+ {
820
+ "metric":"mean_cert_acc_36",
821
+ "alg_a":"ortho",
822
+ "alg_b":"sdp",
823
+ "n_common":121,
824
+ "n_nonzero":121,
825
+ "wins_a":65,
826
+ "wins_b":56,
827
+ "ties":0,
828
+ "win_rate_a_over_b":0.5371900826,
829
+ "mean_diff_a_minus_b":0.0205799671,
830
+ "median_diff_a_minus_b":0.0014110952,
831
+ "W_stat":2942.0,
832
+ "p_two_sided":0.0530173574,
833
+ "z_equiv":1.934779519,
834
+ "effect_size_r":0.1758890472,
835
+ "p_holm_global":0.3945563974,
836
+ "p_holm_within_metric":0.1060347149
837
+ },
838
+ {
839
+ "metric":"mean_cert_acc_36",
840
+ "alg_a":"ldlt-resnet",
841
+ "alg_b":"ortho",
842
+ "n_common":121,
843
+ "n_nonzero":121,
844
+ "wins_a":75,
845
+ "wins_b":46,
846
+ "ties":0,
847
+ "win_rate_a_over_b":0.6198347107,
848
+ "mean_diff_a_minus_b":0.0014336775,
849
+ "median_diff_a_minus_b":0.0064880252,
850
+ "W_stat":3172.0,
851
+ "p_two_sided":0.1802906425,
852
+ "z_equiv":1.3398606829,
853
+ "effect_size_r":0.1218055166,
854
+ "p_holm_global":1.0,
855
+ "p_holm_within_metric":0.1802906425
856
+ },
857
+ {
858
+ "metric":"mean_cert_acc_72",
859
+ "alg_a":"aol",
860
+ "alg_b":"sdp",
861
+ "n_common":121,
862
+ "n_nonzero":121,
863
+ "wins_a":0,
864
+ "wins_b":121,
865
+ "ties":0,
866
+ "win_rate_a_over_b":0.0,
867
+ "mean_diff_a_minus_b":-0.2656215986,
868
+ "median_diff_a_minus_b":-0.2418231331,
869
+ "W_stat":0.0,
870
+ "p_two_sided":1.36676811e-21,
871
+ "z_equiv":-9.5445674132,
872
+ "effect_size_r":0.8676879467,
873
+ "p_holm_global":1.025076083e-19,
874
+ "p_holm_within_metric":2.050152165e-20
875
+ },
876
+ {
877
+ "metric":"mean_cert_acc_72",
878
+ "alg_a":"aol",
879
+ "alg_b":"ldlt-resnet",
880
+ "n_common":121,
881
+ "n_nonzero":121,
882
+ "wins_a":1,
883
+ "wins_b":120,
884
+ "ties":0,
885
+ "win_rate_a_over_b":0.0082644628,
886
+ "mean_diff_a_minus_b":-0.3045117887,
887
+ "median_diff_a_minus_b":-0.2825206725,
888
+ "W_stat":25.0,
889
+ "p_two_sided":2.545212099e-21,
890
+ "z_equiv":-9.4799023223,
891
+ "effect_size_r":0.861809302,
892
+ "p_holm_global":1.883456953e-19,
893
+ "p_holm_within_metric":3.563296938e-20
894
+ },
895
+ {
896
+ "metric":"mean_cert_acc_72",
897
+ "alg_a":"aol",
898
+ "alg_b":"ortho",
899
+ "n_common":121,
900
+ "n_nonzero":121,
901
+ "wins_a":4,
902
+ "wins_b":117,
903
+ "ties":0,
904
+ "win_rate_a_over_b":0.0330578512,
905
+ "mean_diff_a_minus_b":-0.2930986073,
906
+ "median_diff_a_minus_b":-0.2681985311,
907
+ "W_stat":45.0,
908
+ "p_two_sided":4.173048145e-21,
909
+ "z_equiv":-9.4281702496,
910
+ "effect_size_r":0.8571063863,
911
+ "p_holm_global":3.046325146e-19,
912
+ "p_holm_within_metric":5.424962588e-20
913
+ },
914
+ {
915
+ "metric":"mean_cert_acc_72",
916
+ "alg_a":"aol",
917
+ "alg_b":"sandwich",
918
+ "n_common":121,
919
+ "n_nonzero":121,
920
+ "wins_a":6,
921
+ "wins_b":115,
922
+ "ties":0,
923
+ "win_rate_a_over_b":0.0495867769,
924
+ "mean_diff_a_minus_b":-0.332593737,
925
+ "median_diff_a_minus_b":-0.3329101392,
926
+ "W_stat":80.0,
927
+ "p_two_sided":9.850602055e-21,
928
+ "z_equiv":-9.3376391224,
929
+ "effect_size_r":0.8488762839,
930
+ "p_holm_global":6.796915418e-19,
931
+ "p_holm_within_metric":1.182072247e-19
932
+ },
933
+ {
934
+ "metric":"mean_cert_acc_72",
935
+ "alg_a":"ldlt",
936
+ "alg_b":"sandwich",
937
+ "n_common":121,
938
+ "n_nonzero":121,
939
+ "wins_a":16,
940
+ "wins_b":105,
941
+ "ties":0,
942
+ "win_rate_a_over_b":0.132231405,
943
+ "mean_diff_a_minus_b":-0.1617923106,
944
+ "median_diff_a_minus_b":-0.0864403248,
945
+ "W_stat":509.0,
946
+ "p_two_sided":1.903870686e-16,
947
+ "z_equiv":-8.227986163,
948
+ "effect_size_r":0.7479987421,
949
+ "p_holm_global":0.0,
950
+ "p_holm_within_metric":0.0
951
+ },
952
+ {
953
+ "metric":"mean_cert_acc_72",
954
+ "alg_a":"aol",
955
+ "alg_b":"ldlt",
956
+ "n_common":121,
957
+ "n_nonzero":103,
958
+ "wins_a":10,
959
+ "wins_b":93,
960
+ "ties":18,
961
+ "win_rate_a_over_b":0.1570247934,
962
+ "mean_diff_a_minus_b":-0.1708014264,
963
+ "median_diff_a_minus_b":-0.0849279724,
964
+ "W_stat":304.0,
965
+ "p_two_sided":0.0,
966
+ "z_equiv":-7.8086220392,
967
+ "effect_size_r":0.7694063917,
968
+ "p_holm_global":0.0,
969
+ "p_holm_within_metric":0.0
970
+ },
971
+ {
972
+ "metric":"mean_cert_acc_72",
973
+ "alg_a":"ldlt",
974
+ "alg_b":"ldlt-resnet",
975
+ "n_common":121,
976
+ "n_nonzero":121,
977
+ "wins_a":30,
978
+ "wins_b":91,
979
+ "ties":0,
980
+ "win_rate_a_over_b":0.2479338843,
981
+ "mean_diff_a_minus_b":-0.1337103623,
982
+ "median_diff_a_minus_b":-0.0764530534,
983
+ "W_stat":873.0,
984
+ "p_two_sided":0.0,
985
+ "z_equiv":-7.2864624398,
986
+ "effect_size_r":0.6624056763,
987
+ "p_holm_global":0.0,
988
+ "p_holm_within_metric":0.0
989
+ },
990
+ {
991
+ "metric":"mean_cert_acc_72",
992
+ "alg_a":"sandwich",
993
+ "alg_b":"sdp",
994
+ "n_common":121,
995
+ "n_nonzero":121,
996
+ "wins_a":95,
997
+ "wins_b":26,
998
+ "ties":0,
999
+ "win_rate_a_over_b":0.7851239669,
1000
+ "mean_diff_a_minus_b":0.0669721384,
1001
+ "median_diff_a_minus_b":0.039064005,
1002
+ "W_stat":1169.0,
1003
+ "p_two_sided":0.0000000001,
1004
+ "z_equiv":6.5208277639,
1005
+ "effect_size_r":0.592802524,
1006
+ "p_holm_global":0.0000000028,
1007
+ "p_holm_within_metric":0.0000000006
1008
+ },
1009
+ {
1010
+ "metric":"mean_cert_acc_72",
1011
+ "alg_a":"ortho",
1012
+ "alg_b":"sandwich",
1013
+ "n_common":121,
1014
+ "n_nonzero":120,
1015
+ "wins_a":22,
1016
+ "wins_b":98,
1017
+ "ties":1,
1018
+ "win_rate_a_over_b":0.1859504132,
1019
+ "mean_diff_a_minus_b":-0.0394951297,
1020
+ "median_diff_a_minus_b":-0.0318346173,
1021
+ "W_stat":1154.0,
1022
+ "p_two_sided":0.0000000001,
1023
+ "z_equiv":-6.4830104561,
1024
+ "effect_size_r":0.5918151779,
1025
+ "p_holm_global":0.0000000035,
1026
+ "p_holm_within_metric":0.0000000006
1027
+ },
1028
+ {
1029
+ "metric":"mean_cert_acc_72",
1030
+ "alg_a":"ldlt",
1031
+ "alg_b":"sdp",
1032
+ "n_common":121,
1033
+ "n_nonzero":121,
1034
+ "wins_a":34,
1035
+ "wins_b":87,
1036
+ "ties":0,
1037
+ "win_rate_a_over_b":0.2809917355,
1038
+ "mean_diff_a_minus_b":-0.0948201722,
1039
+ "median_diff_a_minus_b":-0.04369919,
1040
+ "W_stat":1219.0,
1041
+ "p_two_sided":0.0000000002,
1042
+ "z_equiv":-6.3914975821,
1043
+ "effect_size_r":0.5810452347,
1044
+ "p_holm_global":0.0000000062,
1045
+ "p_holm_within_metric":0.000000001
1046
+ },
1047
+ {
1048
+ "metric":"mean_cert_acc_72",
1049
+ "alg_a":"ldlt",
1050
+ "alg_b":"ortho",
1051
+ "n_common":121,
1052
+ "n_nonzero":121,
1053
+ "wins_a":36,
1054
+ "wins_b":85,
1055
+ "ties":0,
1056
+ "win_rate_a_over_b":0.2975206612,
1057
+ "mean_diff_a_minus_b":-0.1222971809,
1058
+ "median_diff_a_minus_b":-0.0452102409,
1059
+ "W_stat":1256.0,
1060
+ "p_two_sided":0.0000000003,
1061
+ "z_equiv":-6.2957932476,
1062
+ "effect_size_r":0.5723448407,
1063
+ "p_holm_global":0.0000000107,
1064
+ "p_holm_within_metric":0.0000000015
1065
+ },
1066
+ {
1067
+ "metric":"mean_cert_acc_72",
1068
+ "alg_a":"ldlt-resnet",
1069
+ "alg_b":"sdp",
1070
+ "n_common":121,
1071
+ "n_nonzero":121,
1072
+ "wins_a":89,
1073
+ "wins_b":32,
1074
+ "ties":0,
1075
+ "win_rate_a_over_b":0.7355371901,
1076
+ "mean_diff_a_minus_b":0.03889019,
1077
+ "median_diff_a_minus_b":0.0201615543,
1078
+ "W_stat":1852.0,
1079
+ "p_two_sided":0.0000019926,
1080
+ "z_equiv":4.7541774811,
1081
+ "effect_size_r":0.4321979528,
1082
+ "p_holm_global":0.000049814,
1083
+ "p_holm_within_metric":0.0000079702
1084
+ },
1085
+ {
1086
+ "metric":"mean_cert_acc_72",
1087
+ "alg_a":"ldlt-resnet",
1088
+ "alg_b":"sandwich",
1089
+ "n_common":121,
1090
+ "n_nonzero":121,
1091
+ "wins_a":49,
1092
+ "wins_b":72,
1093
+ "ties":0,
1094
+ "win_rate_a_over_b":0.4049586777,
1095
+ "mean_diff_a_minus_b":-0.0280819483,
1096
+ "median_diff_a_minus_b":-0.0133254528,
1097
+ "W_stat":2656.0,
1098
+ "p_two_sided":0.0074830028,
1099
+ "z_equiv":-2.6745481586,
1100
+ "effect_size_r":0.2431407417,
1101
+ "p_holm_global":0.0972790362,
1102
+ "p_holm_within_metric":0.0224490084
1103
+ },
1104
+ {
1105
+ "metric":"mean_cert_acc_72",
1106
+ "alg_a":"ortho",
1107
+ "alg_b":"sdp",
1108
+ "n_common":121,
1109
+ "n_nonzero":121,
1110
+ "wins_a":67,
1111
+ "wins_b":54,
1112
+ "ties":0,
1113
+ "win_rate_a_over_b":0.5537190083,
1114
+ "mean_diff_a_minus_b":0.0274770087,
1115
+ "median_diff_a_minus_b":0.0045558959,
1116
+ "W_stat":2784.0,
1117
+ "p_two_sided":0.0191056626,
1118
+ "z_equiv":2.3434628933,
1119
+ "effect_size_r":0.2130420812,
1120
+ "p_holm_global":0.2101622889,
1121
+ "p_holm_within_metric":0.0382113252
1122
+ },
1123
+ {
1124
+ "metric":"mean_cert_acc_72",
1125
+ "alg_a":"ldlt-resnet",
1126
+ "alg_b":"ortho",
1127
+ "n_common":121,
1128
+ "n_nonzero":121,
1129
+ "wins_a":74,
1130
+ "wins_b":47,
1131
+ "ties":0,
1132
+ "win_rate_a_over_b":0.6115702479,
1133
+ "mean_diff_a_minus_b":0.0114131814,
1134
+ "median_diff_a_minus_b":0.0088901073,
1135
+ "W_stat":2855.0,
1136
+ "p_two_sided":0.0307870687,
1137
+ "z_equiv":2.1598140352,
1138
+ "effect_size_r":0.1963467305,
1139
+ "p_holm_global":0.3078706868,
1140
+ "p_holm_within_metric":0.0382113252
1141
+ },
1142
+ {
1143
+ "metric":"mean_test_acc",
1144
+ "alg_a":"aol",
1145
+ "alg_b":"ldlt",
1146
+ "n_common":121,
1147
+ "n_nonzero":121,
1148
+ "wins_a":16,
1149
+ "wins_b":105,
1150
+ "ties":0,
1151
+ "win_rate_a_over_b":0.132231405,
1152
+ "mean_diff_a_minus_b":-0.1195835257,
1153
+ "median_diff_a_minus_b":-0.0631501061,
1154
+ "W_stat":409.0,
1155
+ "p_two_sided":2.126854418e-17,
1156
+ "z_equiv":-8.4866465265,
1157
+ "effect_size_r":0.7715133206,
1158
+ "p_holm_global":0.0,
1159
+ "p_holm_within_metric":3.190281628e-16
1160
+ },
1161
+ {
1162
+ "metric":"mean_test_acc",
1163
+ "alg_a":"aol",
1164
+ "alg_b":"sandwich",
1165
+ "n_common":121,
1166
+ "n_nonzero":121,
1167
+ "wins_a":23,
1168
+ "wins_b":98,
1169
+ "ties":0,
1170
+ "win_rate_a_over_b":0.1900826446,
1171
+ "mean_diff_a_minus_b":-0.1113283867,
1172
+ "median_diff_a_minus_b":-0.0656148695,
1173
+ "W_stat":698.0,
1174
+ "p_two_sided":0.0,
1175
+ "z_equiv":-7.7391180759,
1176
+ "effect_size_r":0.7035561887,
1177
+ "p_holm_global":0.0,
1178
+ "p_holm_within_metric":0.0
1179
+ },
1180
+ {
1181
+ "metric":"mean_test_acc",
1182
+ "alg_a":"aol",
1183
+ "alg_b":"ortho",
1184
+ "n_common":121,
1185
+ "n_nonzero":121,
1186
+ "wins_a":25,
1187
+ "wins_b":96,
1188
+ "ties":0,
1189
+ "win_rate_a_over_b":0.2066115702,
1190
+ "mean_diff_a_minus_b":-0.0986620727,
1191
+ "median_diff_a_minus_b":-0.0525094743,
1192
+ "W_stat":908.0,
1193
+ "p_two_sided":0.0,
1194
+ "z_equiv":-7.1959313126,
1195
+ "effect_size_r":0.6541755739,
1196
+ "p_holm_global":0.0,
1197
+ "p_holm_within_metric":0.0
1198
+ },
1199
+ {
1200
+ "metric":"mean_test_acc",
1201
+ "alg_a":"aol",
1202
+ "alg_b":"sdp",
1203
+ "n_common":121,
1204
+ "n_nonzero":121,
1205
+ "wins_a":24,
1206
+ "wins_b":97,
1207
+ "ties":0,
1208
+ "win_rate_a_over_b":0.1983471074,
1209
+ "mean_diff_a_minus_b":-0.0961238247,
1210
+ "median_diff_a_minus_b":-0.0445100629,
1211
+ "W_stat":1047.0,
1212
+ "p_two_sided":0.0,
1213
+ "z_equiv":-6.8363934073,
1214
+ "effect_size_r":0.6214903098,
1215
+ "p_holm_global":0.0000000003,
1216
+ "p_holm_within_metric":0.0000000001
1217
+ },
1218
+ {
1219
+ "metric":"mean_test_acc",
1220
+ "alg_a":"aol",
1221
+ "alg_b":"ldlt-resnet",
1222
+ "n_common":121,
1223
+ "n_nonzero":121,
1224
+ "wins_a":27,
1225
+ "wins_b":94,
1226
+ "ties":0,
1227
+ "win_rate_a_over_b":0.2231404959,
1228
+ "mean_diff_a_minus_b":-0.0920606953,
1229
+ "median_diff_a_minus_b":-0.0356908378,
1230
+ "W_stat":1307.0,
1231
+ "p_two_sided":0.0000000007,
1232
+ "z_equiv":-6.1638764622,
1233
+ "effect_size_r":0.5603524057,
1234
+ "p_holm_global":0.0000000234,
1235
+ "p_holm_within_metric":0.0000000078
1236
+ },
1237
+ {
1238
+ "metric":"mean_test_acc",
1239
+ "alg_a":"ldlt",
1240
+ "alg_b":"sdp",
1241
+ "n_common":121,
1242
+ "n_nonzero":121,
1243
+ "wins_a":86,
1244
+ "wins_b":35,
1245
+ "ties":0,
1246
+ "win_rate_a_over_b":0.7107438017,
1247
+ "mean_diff_a_minus_b":0.023459701,
1248
+ "median_diff_a_minus_b":0.0102784065,
1249
+ "W_stat":1511.0,
1250
+ "p_two_sided":0.0000000174,
1251
+ "z_equiv":5.6362093207,
1252
+ "effect_size_r":0.5123826655,
1253
+ "p_holm_global":0.0000005041,
1254
+ "p_holm_within_metric":0.0000001738
1255
+ },
1256
+ {
1257
+ "metric":"mean_test_acc",
1258
+ "alg_a":"ldlt",
1259
+ "alg_b":"ldlt-resnet",
1260
+ "n_common":121,
1261
+ "n_nonzero":121,
1262
+ "wins_a":87,
1263
+ "wins_b":34,
1264
+ "ties":0,
1265
+ "win_rate_a_over_b":0.7190082645,
1266
+ "mean_diff_a_minus_b":0.0275228304,
1267
+ "median_diff_a_minus_b":0.0124811598,
1268
+ "W_stat":1779.0,
1269
+ "p_two_sided":0.0000007693,
1270
+ "z_equiv":4.9429995465,
1271
+ "effect_size_r":0.4493635951,
1272
+ "p_holm_global":0.0000200017,
1273
+ "p_holm_within_metric":0.0000069237
1274
+ },
1275
+ {
1276
+ "metric":"mean_test_acc",
1277
+ "alg_a":"ldlt",
1278
+ "alg_b":"ortho",
1279
+ "n_common":121,
1280
+ "n_nonzero":121,
1281
+ "wins_a":78,
1282
+ "wins_b":43,
1283
+ "ties":0,
1284
+ "win_rate_a_over_b":0.6446280992,
1285
+ "mean_diff_a_minus_b":0.020921453,
1286
+ "median_diff_a_minus_b":0.010356299,
1287
+ "W_stat":2002.0,
1288
+ "p_two_sided":0.0000126434,
1289
+ "z_equiv":4.3661869359,
1290
+ "effect_size_r":0.3969260851,
1291
+ "p_holm_global":0.0002528686,
1292
+ "p_holm_within_metric":0.0001011474
1293
+ },
1294
+ {
1295
+ "metric":"mean_test_acc",
1296
+ "alg_a":"ortho",
1297
+ "alg_b":"sandwich",
1298
+ "n_common":121,
1299
+ "n_nonzero":120,
1300
+ "wins_a":39,
1301
+ "wins_b":81,
1302
+ "ties":1,
1303
+ "win_rate_a_over_b":0.326446281,
1304
+ "mean_diff_a_minus_b":-0.012666314,
1305
+ "median_diff_a_minus_b":-0.0078946893,
1306
+ "W_stat":2171.0,
1307
+ "p_two_sided":0.0001336571,
1308
+ "z_equiv":-3.8196205818,
1309
+ "effect_size_r":0.348682059,
1310
+ "p_holm_global":0.0025394851,
1311
+ "p_holm_within_metric":0.0009355998
1312
+ },
1313
+ {
1314
+ "metric":"mean_test_acc",
1315
+ "alg_a":"sandwich",
1316
+ "alg_b":"sdp",
1317
+ "n_common":121,
1318
+ "n_nonzero":121,
1319
+ "wins_a":80,
1320
+ "wins_b":41,
1321
+ "ties":0,
1322
+ "win_rate_a_over_b":0.6611570248,
1323
+ "mean_diff_a_minus_b":0.015204562,
1324
+ "median_diff_a_minus_b":0.006305895,
1325
+ "W_stat":2279.0,
1326
+ "p_two_sided":0.0002625491,
1327
+ "z_equiv":3.649697729,
1328
+ "effect_size_r":0.3317907026,
1329
+ "p_holm_global":0.004631605,
1330
+ "p_holm_within_metric":0.0015752945
1331
+ },
1332
+ {
1333
+ "metric":"mean_test_acc",
1334
+ "alg_a":"ldlt-resnet",
1335
+ "alg_b":"sandwich",
1336
+ "n_common":121,
1337
+ "n_nonzero":121,
1338
+ "wins_a":47,
1339
+ "wins_b":74,
1340
+ "ties":0,
1341
+ "win_rate_a_over_b":0.3884297521,
1342
+ "mean_diff_a_minus_b":-0.0192676914,
1343
+ "median_diff_a_minus_b":-0.01009705,
1344
+ "W_stat":2411.0,
1345
+ "p_two_sided":0.0009387558,
1346
+ "z_equiv":-3.3082660492,
1347
+ "effect_size_r":0.300751459,
1348
+ "p_holm_global":0.0140813373,
1349
+ "p_holm_within_metric":0.0046937791
1350
+ },
1351
+ {
1352
+ "metric":"mean_test_acc",
1353
+ "alg_a":"ldlt",
1354
+ "alg_b":"sandwich",
1355
+ "n_common":121,
1356
+ "n_nonzero":120,
1357
+ "wins_a":64,
1358
+ "wins_b":56,
1359
+ "ties":1,
1360
+ "win_rate_a_over_b":0.5330578512,
1361
+ "mean_diff_a_minus_b":0.008255139,
1362
+ "median_diff_a_minus_b":0.0008221223,
1363
+ "W_stat":3145.0,
1364
+ "p_two_sided":0.2044973939,
1365
+ "z_equiv":1.2688420788,
1366
+ "effect_size_r":0.1158289047,
1367
+ "p_holm_global":1.0,
1368
+ "p_holm_within_metric":0.8179895757
1369
+ },
1370
+ {
1371
+ "metric":"mean_test_acc",
1372
+ "alg_a":"ldlt-resnet",
1373
+ "alg_b":"ortho",
1374
+ "n_common":121,
1375
+ "n_nonzero":121,
1376
+ "wins_a":54,
1377
+ "wins_b":67,
1378
+ "ties":0,
1379
+ "win_rate_a_over_b":0.4462809917,
1380
+ "mean_diff_a_minus_b":-0.0066013774,
1381
+ "median_diff_a_minus_b":-0.0023532391,
1382
+ "W_stat":3206.0,
1383
+ "p_two_sided":0.2106004159,
1384
+ "z_equiv":-1.2519161593,
1385
+ "effect_size_r":0.1138105599,
1386
+ "p_holm_global":1.0,
1387
+ "p_holm_within_metric":0.8179895757
1388
+ },
1389
+ {
1390
+ "metric":"mean_test_acc",
1391
+ "alg_a":"ortho",
1392
+ "alg_b":"sdp",
1393
+ "n_common":121,
1394
+ "n_nonzero":121,
1395
+ "wins_a":60,
1396
+ "wins_b":61,
1397
+ "ties":0,
1398
+ "win_rate_a_over_b":0.4958677686,
1399
+ "mean_diff_a_minus_b":0.0025382481,
1400
+ "median_diff_a_minus_b":-0.0000065726,
1401
+ "W_stat":3382.0,
1402
+ "p_two_sided":0.4256404345,
1403
+ "z_equiv":0.7966739196,
1404
+ "effect_size_r":0.0724249018,
1405
+ "p_holm_global":1.0,
1406
+ "p_holm_within_metric":0.8512808691
1407
+ },
1408
+ {
1409
+ "metric":"mean_test_acc",
1410
+ "alg_a":"ldlt-resnet",
1411
+ "alg_b":"sdp",
1412
+ "n_common":121,
1413
+ "n_nonzero":121,
1414
+ "wins_a":58,
1415
+ "wins_b":63,
1416
+ "ties":0,
1417
+ "win_rate_a_over_b":0.479338843,
1418
+ "mean_diff_a_minus_b":-0.0040631294,
1419
+ "median_diff_a_minus_b":-0.0009775593,
1420
+ "W_stat":3627.0,
1421
+ "p_two_sided":0.8705530556,
1422
+ "z_equiv":-0.162956029,
1423
+ "effect_size_r":0.0148141845,
1424
+ "p_holm_global":1.0,
1425
+ "p_holm_within_metric":0.8705530556
1426
+ }
1427
+ ]
UCI_N6/wilcoxon_prep_all.json ADDED
The diff for this file is too large to render. See raw diff