SuperComputer committed on
Commit
1759b8f
·
verified ·
1 Parent(s): 628512f

Add files using upload-large-folder tool

Browse files
Files changed (50) hide show
  1. UCI_N4/aol/summary.json +0 -0
  2. UCI_N4/jmlr_tables.tex +469 -0
  3. UCI_N4/ldlt-resnet/summary.json +0 -0
  4. UCI_N4/ldlt/summary.json +0 -0
  5. UCI_N4/ortho/summary.json +0 -0
  6. UCI_N4/sandwich/summary.json +0 -0
  7. UCI_N4/sdp/runs/abalone/fold_0/result.json +46 -0
  8. UCI_N4/sdp/runs/abalone/fold_1/result.json +46 -0
  9. UCI_N4/sdp/runs/abalone/fold_2/result.json +46 -0
  10. UCI_N4/sdp/runs/abalone/fold_3/result.json +46 -0
  11. UCI_N4/sdp/runs/acute-inflammation/fold_0/result.json +42 -0
  12. UCI_N4/sdp/runs/acute-inflammation/fold_1/result.json +42 -0
  13. UCI_N4/sdp/runs/acute-inflammation/fold_2/result.json +42 -0
  14. UCI_N4/sdp/runs/acute-inflammation/fold_3/result.json +42 -0
  15. UCI_N4/sdp/runs/acute-nephritis/fold_0/result.json +42 -0
  16. UCI_N4/sdp/runs/acute-nephritis/fold_1/result.json +42 -0
  17. UCI_N4/sdp/runs/acute-nephritis/fold_2/result.json +42 -0
  18. UCI_N4/sdp/runs/acute-nephritis/fold_3/result.json +42 -0
  19. UCI_N4/sdp/runs/adult/fold_0/result.json +58 -0
  20. UCI_N4/sdp/runs/adult/fold_1/result.json +58 -0
  21. UCI_N4/sdp/runs/adult/fold_2/result.json +58 -0
  22. UCI_N4/sdp/runs/adult/fold_3/result.json +58 -0
  23. UCI_N4/sdp/runs/annealing/fold_0/result.json +92 -0
  24. UCI_N4/sdp/runs/annealing/fold_1/result.json +92 -0
  25. UCI_N4/sdp/runs/annealing/fold_2/result.json +92 -0
  26. UCI_N4/sdp/runs/annealing/fold_3/result.json +92 -0
  27. UCI_N4/sdp/runs/arrhythmia/fold_0/result.json +554 -0
  28. UCI_N4/sdp/runs/arrhythmia/fold_1/result.json +554 -0
  29. UCI_N4/sdp/runs/arrhythmia/fold_2/result.json +554 -0
  30. UCI_N4/sdp/runs/arrhythmia/fold_3/result.json +554 -0
  31. UCI_N4/sdp/runs/audiology-std/fold_0/result.json +148 -0
  32. UCI_N4/sdp/runs/audiology-std/fold_2/result.json +148 -0
  33. UCI_N4/sdp/runs/audiology-std/fold_3/result.json +148 -0
  34. UCI_N4/sdp/runs/balance-scale/fold_0/result.json +38 -0
  35. UCI_N4/sdp/runs/balance-scale/fold_1/result.json +38 -0
  36. UCI_N4/sdp/runs/balance-scale/fold_2/result.json +38 -0
  37. UCI_N4/sdp/runs/balance-scale/fold_3/result.json +38 -0
  38. UCI_N4/sdp/runs/blood/fold_0/result.json +38 -0
  39. UCI_N4/sdp/runs/blood/fold_1/result.json +38 -0
  40. UCI_N4/sdp/runs/blood/fold_2/result.json +38 -0
  41. UCI_N4/sdp/runs/blood/fold_3/result.json +38 -0
  42. UCI_N4/sdp/runs/car/fold_0/result.json +42 -0
  43. UCI_N4/sdp/summary.json +0 -0
  44. UCI_N4/wilcoxon_pairwise_all.csv +76 -0
  45. UCI_N4/wilcoxon_pairwise_all.json +1427 -0
  46. UCI_N4/wilcoxon_prep_all.json +0 -0
  47. UCI_N6/jmlr_tables.tex +469 -0
  48. UCI_N6/wilcoxon_pairwise_all.csv +76 -0
  49. UCI_N6/wilcoxon_pairwise_all.json +1427 -0
  50. UCI_N6/wilcoxon_prep_all.json +0 -0
UCI_N4/aol/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/jmlr_tables.tex ADDED
@@ -0,0 +1,469 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ % JMLR-ready tables for two-column papers
2
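+ % Required packages (no siunitx; the tables below additionally need xcolor for \textcolor, amssymb for \blacktriangle/\blacktriangledown, and amsmath for \text):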
3
+ % \usepackage{booktabs}
4
+ % \usepackage{threeparttable}
5
+ % \usepackage{threeparttablex} % for TableNotes + longtable
6
+ % \usepackage{longtable}
7
+ % Optional for landscape: \usepackage{pdflscape}
8
+
9
+ \begin{table*}[t]
10
+ \centering
11
+ \begin{threeparttable}
12
+ \caption{Model dimension ranges (min--max across all datasets and folds). Input and output dimensions follow each dataset's feature and label spaces, respectively.}
13
+ \label{tab:model-ranges}
14
+ \begin{tabular}{l r r r r r r}
15
+ \toprule
16
+ Algorithm & Width & Depth & Parameters & Padding & Input dim & Output dim \\
17
+ \midrule
18
+ AOL & 32--512 & 4--4 & 282--694837 & 10--524 & 3--262 & 2--100 \\
19
+ Orthogonal & 32--512 & 4--4 & 285--694840 & 10--524 & 3--262 & 2--100 \\
20
+ Sandwich & 32--512 & 4--4 & 615--1520140 & 10--524 & 3--262 & 2--100 \\
21
+ SLL & 32--512 & 4--4 & 1558--1084073 & 10--524 & 3--262 & 2--100 \\
22
+ LDLT-L & 32--512 & 4--4 & 3366--929297 & 10--524 & 3--262 & 2--100 \\
23
+ LDLT-R & 32--512 & 4--4 & 3463--1063442 & 10--524 & 3--262 & 2--100 \\
24
+ \bottomrule
25
+ \end{tabular}
26
+ \end{threeparttable}
27
+ \end{table*}
28
+
29
+ \begin{table*}[t]
30
+ \centering
31
+ \begin{threeparttable}
32
+ \caption{Sorted mean$\pm$std across $N$ datasets for each algorithm; the best value in each column is shown in bold.}
33
+ \label{tab:metric_summary}
34
+ \begin{tabular}{l r lllll}
35
+ \toprule
36
+ & & & \multicolumn{4}{c}{Certified Accuracy} \\
37
+ \cmidrule(lr){4-7}
38
+ Algorithm & $N$ & Accuracy & 36/255 & 72/255 & 108/255 & 255/255 \\
39
+ \midrule
40
+ AOL & 121 & 0.6295\,\tiny$\pm$0.2278 & 0.3655\,\tiny$\pm$0.2921 & 0.2628\,\tiny$\pm$0.2971 & 0.2078\,\tiny$\pm$0.2826 & 0.0989\,\tiny$\pm$0.1874 \\
41
+ Orthogonal & 121 & 0.6969\,\tiny$\pm$0.1938 & 0.6072\,\tiny$\pm$0.2290 & 0.5114\,\tiny$\pm$0.2592 & 0.4332\,\tiny$\pm$0.2662 & 0.1957\,\tiny$\pm$0.2289 \\
42
+ Sandwich & 121 & 0.7215\,\tiny$\pm$0.1871 & \textbf{0.6393\,\tiny$\pm$0.2310} & \textbf{0.5626\,\tiny$\pm$0.2520} & \textbf{0.4870\,\tiny$\pm$0.2671} & \textbf{0.2466\,\tiny$\pm$0.2478} \\
43
+ SLL & 121 & 0.6978\,\tiny$\pm$0.1998 & 0.5929\,\tiny$\pm$0.2426 & 0.4964\,\tiny$\pm$0.2662 & 0.4126\,\tiny$\pm$0.2744 & 0.1858\,\tiny$\pm$0.2235 \\
44
+ \midrule
45
+ LDLT-L & 121 & \textbf{0.7223\,\tiny$\pm$0.1868} & 0.5299\,\tiny$\pm$0.2946 & 0.4279\,\tiny$\pm$0.3081 & 0.3505\,\tiny$\pm$0.3005 & 0.1620\,\tiny$\pm$0.2287 \\
46
+ LDLT-R & 121 & 0.7022\,\tiny$\pm$0.1944 & 0.6152\,\tiny$\pm$0.2312 & 0.5295\,\tiny$\pm$0.2548 & 0.4481\,\tiny$\pm$0.2674 & 0.2164\,\tiny$\pm$0.2322 \\
47
+ \bottomrule
48
+ \end{tabular}
49
+ \end{threeparttable}
50
+ \end{table*}
51
+
52
+ \begin{table}[t]
53
+ \centering
54
+ \begin{threeparttable}
55
+ {\small
56
+ \caption{Overall comparison on Mean Accuracy: average rank (lower is better) with Iman--Davenport $F=44.33$ (df$=(5,\,600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
57
+ \label{tab:overall:mean_test_acc}
58
+ \setlength{\tabcolsep}{4pt}
59
+ \begin{tabular}{@{}l r r r r r r@{}}
60
+ \toprule
61
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
62
+ \midrule
63
+ LDLT-L & 2.434 & 4 & 0 & 4 & 0.800 & 0.577 \\
64
+ Sandwich & 2.566 & 4 & 0 & 4 & 0.800 & 0.517 \\
65
+ LDLT-R & 3.438 & 1 & 2 & -1 & 0.200 & 0.629 \\
66
+ SLL & 3.624 & 1 & 2 & -1 & 0.200 & 0.678 \\
67
+ Orthogonal & 3.831 & 1 & 2 & -1 & 0.200 & 0.639 \\
68
+ AOL & 5.107 & 0 & 5 & -5 & 0.000 & 0.000 \\
69
+ \bottomrule
70
+ \end{tabular}
71
+ }
72
+ \end{threeparttable}
73
+ \end{table}
74
+
75
+ \begin{table}[t]
76
+ \centering
77
+ \begin{threeparttable}
78
+ {\small
79
+ \caption{Overall comparison on Mean Certified Accuracy (36/255): average rank (lower is better) with Iman--Davenport $F=82.25$ (df$=(5,\,600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
80
+ \label{tab:overall:mean_cert_acc_36}
81
+ \setlength{\tabcolsep}{4pt}
82
+ \begin{tabular}{@{}l r r r r r r@{}}
83
+ \toprule
84
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
85
+ \midrule
86
+ Sandwich & 2.223 & 5 & 0 & 5 & 1.000 & 0.564 \\
87
+ LDLT-R & 2.715 & 4 & 1 & 3 & 0.800 & 0.478 \\
88
+ SLL & 3.248 & 2 & 2 & 0 & 0.400 & 0.624 \\
89
+ Orthogonal & 3.380 & 2 & 2 & 0 & 0.400 & 0.627 \\
90
+ LDLT-L & 3.760 & 1 & 4 & -3 & 0.200 & 0.737 \\
91
+ AOL & 5.674 & 0 & 5 & -5 & 0.000 & 0.000 \\
92
+ \bottomrule
93
+ \end{tabular}
94
+ }
95
+ \end{threeparttable}
96
+ \end{table}
97
+
98
+ \begin{table}[t]
99
+ \centering
100
+ \begin{threeparttable}
101
+ {\small
102
+ \caption{Overall comparison on Mean Certified Accuracy (72/255): average rank (lower is better) with Iman--Davenport $F=102.13$ (df$=(5,\,600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
103
+ \label{tab:overall:mean_cert_acc_72}
104
+ \setlength{\tabcolsep}{4pt}
105
+ \begin{tabular}{@{}l r r r r r r@{}}
106
+ \toprule
107
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
108
+ \midrule
109
+ Sandwich & 1.979 & 5 & 0 & 5 & 1.000 & 0.662 \\
110
+ LDLT-R & 2.628 & 4 & 1 & 3 & 0.800 & 0.542 \\
111
+ SLL & 3.306 & 2 & 2 & 0 & 0.400 & 0.647 \\
112
+ Orthogonal & 3.417 & 2 & 2 & 0 & 0.400 & 0.632 \\
113
+ LDLT-L & 4.008 & 1 & 4 & -3 & 0.200 & 0.754 \\
114
+ AOL & 5.661 & 0 & 5 & -5 & 0.000 & 0.000 \\
115
+ \bottomrule
116
+ \end{tabular}
117
+ }
118
+ \end{threeparttable}
119
+ \end{table}
120
+
121
+ \begin{table}[t]
122
+ \centering
123
+ \begin{threeparttable}
124
+ {\small
125
+ \caption{Overall comparison on Mean Certified Accuracy (108/255): average rank (lower is better) with Iman--Davenport $F=128.94$ (df$=(5,\,600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
126
+ \label{tab:overall:mean_cert_acc_108}
127
+ \setlength{\tabcolsep}{4pt}
128
+ \begin{tabular}{@{}l r r r r r r@{}}
129
+ \toprule
130
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
131
+ \midrule
132
+ Sandwich & 1.876 & 5 & 0 & 5 & 1.000 & 0.680 \\
133
+ LDLT-R & 2.525 & 4 & 1 & 3 & 0.800 & 0.548 \\
134
+ SLL & 3.318 & 2 & 2 & 0 & 0.400 & 0.662 \\
135
+ Orthogonal & 3.364 & 2 & 2 & 0 & 0.400 & 0.677 \\
136
+ LDLT-L & 4.194 & 1 & 4 & -3 & 0.200 & 0.824 \\
137
+ AOL & 5.723 & 0 & 5 & -5 & 0.000 & 0.000 \\
138
+ \bottomrule
139
+ \end{tabular}
140
+ }
141
+ \end{threeparttable}
142
+ \end{table}
143
+
144
+ \begin{table}[t]
145
+ \centering
146
+ \begin{threeparttable}
147
+ {\small
148
+ \caption{Overall comparison on Mean Certified Accuracy (255/255): average rank (lower is better) with Iman--Davenport $F=89.04$ (df$=(5,\,600)$), $p=1.11\times 10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
149
+ \label{tab:overall:mean_cert_acc_255}
150
+ \setlength{\tabcolsep}{4pt}
151
+ \begin{tabular}{@{}l r r r r r r@{}}
152
+ \toprule
153
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
154
+ \midrule
155
+ Sandwich & 2.029 & 5 & 0 & 5 & 1.000 & 0.663 \\
156
+ LDLT-R & 2.517 & 4 & 1 & 3 & 0.800 & 0.584 \\
157
+ Orthogonal & 3.409 & 2 & 2 & 0 & 0.400 & 0.600 \\
158
+ SLL & 3.409 & 2 & 2 & 0 & 0.400 & 0.643 \\
159
+ LDLT-L & 4.174 & 1 & 4 & -3 & 0.200 & 0.808 \\
160
+ AOL & 5.463 & 0 & 5 & -5 & 0.000 & 0.000 \\
161
+ \bottomrule
162
+ \end{tabular}
163
+ }
164
+ \end{threeparttable}
165
+ \end{table}
166
+
167
+ \begin{table}[t]
168
+ \centering
169
+ \begin{threeparttable}
170
+ {
171
+ \caption{Pairwise Wilcoxon outcomes for Mean Accuracy (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
172
+ \label{tab:signif:mean_test_acc}
173
+ \setlength{\tabcolsep}{3pt}
174
+ \begin{tabular}{@{}l c c c c c c @{}}
175
+ \toprule
176
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
177
+ \midrule
178
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
179
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
180
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
181
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
182
+ Sandwich & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
183
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
184
+ \bottomrule
185
+ \end{tabular}
186
+ }
187
+ \end{threeparttable}
188
+ \end{table}
189
+
190
+ \begin{table}[t]
191
+ \centering
192
+ \begin{threeparttable}
193
+ {
194
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (36/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
195
+ \label{tab:signif:mean_cert_acc_36}
196
+ \setlength{\tabcolsep}{3pt}
197
+ \begin{tabular}{@{}l c c c c c c @{}}
198
+ \toprule
199
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
200
+ \midrule
201
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
202
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
203
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
204
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
205
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
206
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
207
+ \bottomrule
208
+ \end{tabular}
209
+ }
210
+ \end{threeparttable}
211
+ \end{table}
212
+
213
+ \begin{table}[t]
214
+ \centering
215
+ \begin{threeparttable}
216
+ {
217
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (72/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
218
+ \label{tab:signif:mean_cert_acc_72}
219
+ \setlength{\tabcolsep}{3pt}
220
+ \begin{tabular}{@{}l c c c c c c @{}}
221
+ \toprule
222
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
223
+ \midrule
224
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
225
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
226
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
227
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
228
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
229
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
230
+ \bottomrule
231
+ \end{tabular}
232
+ }
233
+ \end{threeparttable}
234
+ \end{table}
235
+
236
+ \begin{table}[t]
237
+ \centering
238
+ \begin{threeparttable}
239
+ {
240
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (108/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
241
+ \label{tab:signif:mean_cert_acc_108}
242
+ \setlength{\tabcolsep}{3pt}
243
+ \begin{tabular}{@{}l c c c c c c @{}}
244
+ \toprule
245
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
246
+ \midrule
247
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
248
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
249
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
250
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
251
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
252
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
253
+ \bottomrule
254
+ \end{tabular}
255
+ }
256
+ \end{threeparttable}
257
+ \end{table}
258
+
259
+ \begin{table}[t]
260
+ \centering
261
+ \begin{threeparttable}
262
+ {
263
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (255/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
264
+ \label{tab:signif:mean_cert_acc_255}
265
+ \setlength{\tabcolsep}{3pt}
266
+ \begin{tabular}{@{}l c c c c c c @{}}
267
+ \toprule
268
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
269
+ \midrule
270
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
271
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
272
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
273
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
274
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
275
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
276
+ \bottomrule
277
+ \end{tabular}
278
+ }
279
+ \end{threeparttable}
280
+ \end{table}
281
+
282
+
283
+ \begin{table*}[t]
284
+ \centering
285
+ \begin{threeparttable}
286
+ \caption[Mean Accuracy]{Wilcoxon signed-rank tests (two-sided) for Mean Accuracy; $p$-values with Holm FWER corrections within-metric and global.}
287
+ \label{tab:wilcoxon:mean_test_acc}
288
+ \begingroup
289
+ \setlength{\tabcolsep}{4pt}
290
+ \begin{tabular}{ll r r r r r r r r r r r}
291
+ \toprule
292
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
293
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
294
+ \midrule
295
+ AOL & LDLT-L & 121 & 16 & 105 & 0 & 0.1322 & -0.0568 & 412 & $2.3e-17^{***}$ & $3.4e-16^{***}$ & $0^{***}$ & 0.7708 \\
296
+ AOL & Sandwich & 121 & 18 & 103 & 0 & 0.1488 & -0.0595 & 518 & $2.3e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7459 \\
297
+ AOL & SLL & 121 & 22 & 99 & 0 & 0.1818 & -0.0351 & 806 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6782 \\
298
+ AOL & Orthogonal & 121 & 27 & 94 & 0 & 0.2231 & -0.0265 & 971 & $0^{***}$ & $0^{***}$ & $1.0e-10^{***}$ & 0.6394 \\
299
+ AOL & LDLT-R & 121 & 25 & 96 & 0 & 0.2066 & -0.0313 & 1013 & $0^{***}$ & $0^{***}$ & $2.0e-10^{***}$ & 0.6295 \\
300
+ Orthogonal & Sandwich & 121 & 31 & 89 & 1 & 0.2603 & -0.0126 & 1269 & $6.0e-10^{***}$ & $6.3e-09^{***}$ & $2.3e-08^{***}$ & 0.5643 \\
301
+ LDLT-L & Orthogonal & 121 & 94 & 27 & 0 & 0.7769 & 0.0139 & 1309 & $7.0e-10^{***}$ & $6.6e-09^{***}$ & $2.6e-08^{***}$ & 0.5599 \\
302
+ LDLT-L & SLL & 121 & 86 & 35 & 0 & 0.7107 & 0.0111 & 1503 & $1.5e-08^{***}$ & $1.2e-07^{***}$ & $5.1e-07^{***}$ & 0.5143 \\
303
+ LDLT-L & LDLT-R & 121 & 87 & 33 & 1 & 0.7231 & 0.0108 & 1689 & $3.7e-07^{***}$ & $2.6e-06^{***}$ & $1.1e-05^{***}$ & 0.4639 \\
304
+ Sandwich & SLL & 121 & 83 & 38 & 0 & 0.6860 & 0.0090 & 1789 & $8.8e-07^{***}$ & $5.3e-06^{***}$ & $2.4e-05^{***}$ & 0.4470 \\
305
+ LDLT-R & Sandwich & 121 & 43 & 78 & 0 & 0.3554 & -0.0068 & 2364 & $6.0e-04^{***}$ & $3.0e-03^{**}$ & $9.1e-03^{**}$ & 0.3118 \\
306
+ LDLT-R & SLL & 121 & 66 & 54 & 1 & 0.5496 & 0.0019 & 3070 & $1.4e-01$ & $5.7e-01$ & $8.6e-01$ & 0.1338 \\
307
+ LDLT-R & Orthogonal & 121 & 71 & 50 & 0 & 0.5868 & 0.0025 & 3138 & $1.5e-01$ & $5.7e-01$ & $8.6e-01$ & 0.1298 \\
308
+ Orthogonal & SLL & 121 & 60 & 61 & 0 & 0.4959 & -0.0004 & 3623 & $8.6e-01$ & $1.0e+00$ & $1.0e+00$ & 0.0158 \\
309
+ LDLT-L & Sandwich & 121 & 59 & 62 & 0 & 0.4876 & -0.0002 & 3624 & $8.6e-01$ & $1.0e+00$ & $1.0e+00$ & 0.0155 \\
310
+ \bottomrule
311
+ \end{tabular}
312
+ \begin{tablenotes}
313
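+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$). Entries printed as $0$ are nonzero $p$-values that were rounded to zero at the reporting precision.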
314
+ \end{tablenotes}
315
+ \endgroup
316
+ \end{threeparttable}
317
+ \end{table*}
318
+
319
+
320
+
321
+ \begin{table*}[t]
322
+ \centering
323
+ \begin{threeparttable}
324
+ \caption[Mean Certified Accuracy (36/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (36/255); $p$-values with Holm FWER corrections within-metric and global.}
325
+ \label{tab:wilcoxon:mean_cert_acc_36}
326
+ \begingroup
327
+ \setlength{\tabcolsep}{4pt}
328
+ \begin{tabular}{ll r r r r r r r r r r r}
329
+ \toprule
330
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
331
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
332
+ \midrule
333
+ AOL & SLL & 121 & 4 & 117 & 0 & 0.0331 & -0.1998 & 27 & $2.7e-21^{***}$ & $4.0e-20^{***}$ & $2.0e-19^{***}$ & 0.8613 \\
334
+ AOL & Sandwich & 121 & 6 & 114 & 1 & 0.0537 & -0.2626 & 32 & $4.5e-21^{***}$ & $6.1e-20^{***}$ & $3.2e-19^{***}$ & 0.8601 \\
335
+ AOL & LDLT-R & 121 & 4 & 117 & 0 & 0.0331 & -0.2302 & 47 & $4.4e-21^{***}$ & $6.1e-20^{***}$ & $3.2e-19^{***}$ & 0.8566 \\
336
+ AOL & Orthogonal & 121 & 8 & 113 & 0 & 0.0661 & -0.2204 & 87 & $1.2e-20^{***}$ & $1.4e-19^{***}$ & $7.9e-19^{***}$ & 0.8472 \\
337
+ AOL & LDLT-L & 121 & 17 & 104 & 0 & 0.1405 & -0.1415 & 554 & $5.0e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7374 \\
338
+ LDLT-L & Sandwich & 121 & 31 & 89 & 1 & 0.2603 & -0.0387 & 998 & $0^{***}$ & $1.0e-10^{***}$ & $2.0e-10^{***}$ & 0.6291 \\
339
+ LDLT-L & LDLT-R & 121 & 40 & 81 & 0 & 0.3306 & -0.0297 & 1410 & $3.7e-09^{***}$ & $3.3e-08^{***}$ & $1.3e-07^{***}$ & 0.5361 \\
340
+ Orthogonal & Sandwich & 121 & 28 & 93 & 0 & 0.2314 & -0.0238 & 1424 & $4.6e-09^{***}$ & $3.7e-08^{***}$ & $1.6e-07^{***}$ & 0.5327 \\
341
+ Sandwich & SLL & 121 & 83 & 38 & 0 & 0.6860 & 0.0207 & 1530 & $2.3e-08^{***}$ & $1.6e-07^{***}$ & $7.4e-07^{***}$ & 0.5079 \\
342
+ LDLT-L & Orthogonal & 121 & 48 & 73 & 0 & 0.3967 & -0.0200 & 1957 & $7.4e-06^{***}$ & $4.4e-05^{***}$ & $1.8e-04^{***}$ & 0.4075 \\
343
+ LDLT-L & SLL & 121 & 47 & 73 & 1 & 0.3926 & -0.0085 & 2014 & $2.3e-05^{***}$ & $1.2e-04^{***}$ & $4.4e-04^{***}$ & 0.3862 \\
344
+ LDLT-R & SLL & 121 & 76 & 43 & 2 & 0.6364 & 0.0095 & 2285 & $6.6e-04^{***}$ & $2.6e-03^{**}$ & $9.2e-03^{**}$ & 0.3123 \\
345
+ LDLT-R & Sandwich & 121 & 44 & 77 & 0 & 0.3636 & -0.0089 & 2466 & $1.5e-03^{**}$ & $4.6e-03^{**}$ & $1.7e-02^{*}$ & 0.2878 \\
346
+ LDLT-R & Orthogonal & 121 & 78 & 42 & 1 & 0.6488 & 0.0084 & 2756 & $2.2e-02^{*}$ & $4.4e-02^{*}$ & $2.0e-01$ & 0.2088 \\
347
+ Orthogonal & SLL & 121 & 60 & 60 & 1 & 0.5000 & 0.0000 & 2916 & $6.2e-02$ & $6.2e-02$ & $4.9e-01$ & 0.1705 \\
348
+ \bottomrule
349
+ \end{tabular}
350
+ \begin{tablenotes}
351
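+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$). Entries printed as $0$ are nonzero $p$-values that were rounded to zero at the reporting precision.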
352
+ \end{tablenotes}
353
+ \endgroup
354
+ \end{threeparttable}
355
+ \end{table*}
356
+
357
+
358
+
359
+ \begin{table*}[t]
360
+ \centering
361
+ \begin{threeparttable}
362
+ \caption[Mean Certified Accuracy (72/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (72/255); $p$-values with Holm FWER corrections within-metric and global.}
363
+ \label{tab:wilcoxon:mean_cert_acc_72}
364
+ \begingroup
365
+ \setlength{\tabcolsep}{4pt}
366
+ \begin{tabular}{ll r r r r r r r r r r r}
367
+ \toprule
368
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
369
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
370
+ \midrule
371
+ AOL & Sandwich & 121 & 6 & 114 & 1 & 0.0537 & -0.2723 & 58 & $8.5e-21^{***}$ & $1.3e-19^{***}$ & $5.9e-19^{***}$ & 0.8538 \\
372
+ AOL & SLL & 121 & 3 & 116 & 2 & 0.0331 & -0.1967 & 59 & $1.3e-20^{***}$ & $1.8e-19^{***}$ & $8.6e-19^{***}$ & 0.8534 \\
373
+ AOL & LDLT-R & 121 & 5 & 116 & 0 & 0.0413 & -0.2325 & 103 & $1.7e-20^{***}$ & $2.2e-19^{***}$ & $1.1e-18^{***}$ & 0.8435 \\
374
+ AOL & Orthogonal & 121 & 8 & 113 & 0 & 0.0661 & -0.2085 & 149 & $5.2e-20^{***}$ & $6.3e-19^{***}$ & $3.3e-18^{***}$ & 0.8327 \\
375
+ AOL & LDLT-L & 121 & 16 & 102 & 3 & 0.1446 & -0.1155 & 460 & $2.6e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7539 \\
376
+ LDLT-L & Sandwich & 121 & 21 & 100 & 0 & 0.1736 & -0.0748 & 670 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7101 \\
377
+ Orthogonal & Sandwich & 121 & 18 & 103 & 0 & 0.1488 & -0.0370 & 698 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7037 \\
378
+ Sandwich & SLL & 121 & 91 & 28 & 2 & 0.7603 & 0.0396 & 823 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6676 \\
379
+ LDLT-L & LDLT-R & 121 & 30 & 90 & 1 & 0.2521 & -0.0625 & 988 & $0^{***}$ & $0^{***}$ & $2.0e-10^{***}$ & 0.6315 \\
380
+ LDLT-L & SLL & 121 & 42 & 79 & 0 & 0.3471 & -0.0231 & 1813 & $1.2e-06^{***}$ & $7.2e-06^{***}$ & $3.1e-05^{***}$ & 0.4414 \\
381
+ LDLT-L & Orthogonal & 121 & 44 & 77 & 0 & 0.3636 & -0.0192 & 1857 & $2.1e-06^{***}$ & $1.1e-05^{***}$ & $5.3e-05^{***}$ & 0.4310 \\
382
+ LDLT-R & SLL & 121 & 79 & 41 & 1 & 0.6570 & 0.0156 & 1982 & $1.6e-05^{***}$ & $6.4e-05^{***}$ & $3.5e-04^{***}$ & 0.3937 \\
383
+ LDLT-R & Sandwich & 121 & 44 & 77 & 0 & 0.3636 & -0.0238 & 2090 & $3.5e-05^{***}$ & $1.1e-04^{***}$ & $6.3e-04^{***}$ & 0.3761 \\
384
+ LDLT-R & Orthogonal & 121 & 77 & 42 & 2 & 0.6446 & 0.0106 & 2346 & $1.2e-03^{**}$ & $2.4e-03^{**}$ & $1.5e-02^{*}$ & 0.2974 \\
385
+ Orthogonal & SLL & 121 & 61 & 59 & 1 & 0.5083 & 0.0002 & 3188 & $2.5e-01$ & $2.5e-01$ & $9.9e-01$ & 0.1055 \\
386
+ \bottomrule
387
+ \end{tabular}
388
+ \begin{tablenotes}
389
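+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$). Entries printed as $0$ are nonzero $p$-values that were rounded to zero at the reporting precision.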
390
+ \end{tablenotes}
391
+ \endgroup
392
+ \end{threeparttable}
393
+ \end{table*}
394
+
395
+
396
+
397
+ \begin{table*}[t]
398
+ \centering
399
+ \begin{threeparttable}
400
+ \caption[Mean Certified Accuracy (108/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (108/255); $p$-values with Holm FWER corrections within-metric and global.}
401
+ \label{tab:wilcoxon:mean_cert_acc_108}
402
+ \begingroup
403
+ \setlength{\tabcolsep}{4pt}
404
+ \begin{tabular}{ll r r r r r r r r r r r}
405
+ \toprule
406
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
407
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
408
+ \midrule
409
+ AOL & LDLT-R & 121 & 1 & 119 & 1 & 0.0124 & -0.2179 & 1 & $2.0e-21^{***}$ & $3.1e-20^{***}$ & $1.5e-19^{***}$ & 0.8675 \\
410
+ AOL & SLL & 121 & 2 & 116 & 3 & 0.0289 & -0.1595 & 12 & $5.8e-21^{***}$ & $7.5e-20^{***}$ & $4.1e-19^{***}$ & 0.8648 \\
411
+ AOL & Sandwich & 121 & 4 & 116 & 1 & 0.0372 & -0.2402 & 32 & $4.5e-21^{***}$ & $6.2e-20^{***}$ & $3.2e-19^{***}$ & 0.8601 \\
412
+ AOL & Orthogonal & 121 & 6 & 113 & 2 & 0.0579 & -0.1817 & 72 & $1.8e-20^{***}$ & $2.1e-19^{***}$ & $1.2e-18^{***}$ & 0.8502 \\
413
+ AOL & LDLT-L & 121 & 12 & 99 & 10 & 0.1405 & -0.0785 & 158 & $4.0e-18^{***}$ & $4.4e-17^{***}$ & $2.5e-16^{***}$ & 0.8237 \\
414
+ LDLT-L & Sandwich & 121 & 17 & 104 & 0 & 0.1405 & -0.0905 & 492 & $1.3e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7520 \\
415
+ Orthogonal & Sandwich & 121 & 16 & 105 & 0 & 0.1322 & -0.0475 & 700 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7030 \\
416
+ Sandwich & SLL & 121 & 93 & 26 & 2 & 0.7769 & 0.0480 & 764 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6820 \\
417
+ LDLT-L & LDLT-R & 121 & 23 & 97 & 1 & 0.1942 & -0.0468 & 787 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6796 \\
418
+ LDLT-L & Orthogonal & 121 & 35 & 84 & 2 & 0.2975 & -0.0276 & 1497 & $3.9e-08^{***}$ & $2.3e-07^{***}$ & $1.2e-06^{***}$ & 0.5038 \\
419
+ LDLT-L & SLL & 121 & 37 & 82 & 2 & 0.3140 & -0.0208 & 1682 & $5.6e-07^{***}$ & $2.8e-06^{***}$ & $1.6e-05^{***}$ & 0.4588 \\
420
+ LDLT-R & SLL & 121 & 82 & 35 & 4 & 0.6942 & 0.0178 & 1875 & $1.8e-05^{***}$ & $5.4e-05^{***}$ & $3.8e-04^{***}$ & 0.3963 \\
421
+ LDLT-R & Sandwich & 121 & 41 & 79 & 1 & 0.3430 & -0.0213 & 1952 & $1.1e-05^{***}$ & $4.5e-05^{***}$ & $2.6e-04^{***}$ & 0.4010 \\
422
+ LDLT-R & Orthogonal & 121 & 77 & 42 & 2 & 0.6446 & 0.0191 & 2543 & $6.5e-03^{**}$ & $1.3e-02^{*}$ & $6.5e-02$ & 0.2495 \\
423
+ Orthogonal & SLL & 121 & 60 & 59 & 2 & 0.5041 & 0.0000 & 2941 & $9.6e-02$ & $9.6e-02$ & $6.7e-01$ & 0.1528 \\
424
+ \bottomrule
425
+ \end{tabular}
426
+ \begin{tablenotes}
427
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
428
+ \end{tablenotes}
429
+ \endgroup
430
+ \end{threeparttable}
431
+ \end{table*}
432
+
433
+
434
+
435
+ \begin{table*}[t]
436
+ \centering
437
+ \begin{threeparttable}
438
+ \caption[Mean Certified Accuracy (255/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (255/255); $p$-values with Holm FWER corrections within-metric and global.}
439
+ \label{tab:wilcoxon:mean_cert_acc_255}
440
+ \begingroup
441
+ \setlength{\tabcolsep}{4pt}
442
+ \begin{tabular}{ll r r r r r r r r r r r}
443
+ \toprule
444
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
445
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
446
+ \midrule
447
+ AOL & LDLT-R & 121 & 2 & 107 & 12 & 0.0661 & -0.0560 & 17 & $2.1e-19^{***}$ & $3.1e-18^{***}$ & $1.3e-17^{***}$ & 0.8629 \\
448
+ AOL & SLL & 121 & 2 & 99 & 20 & 0.0992 & -0.0407 & 24 & $5.5e-18^{***}$ & $7.2e-17^{***}$ & $3.3e-16^{***}$ & 0.8599 \\
449
+ AOL & Sandwich & 121 & 2 & 107 & 12 & 0.0661 & -0.0791 & 58 & $6.4e-19^{***}$ & $8.9e-18^{***}$ & $4.0e-17^{***}$ & 0.8511 \\
450
+ AOL & Orthogonal & 121 & 5 & 100 & 16 & 0.1074 & -0.0347 & 109 & $1.3e-17^{***}$ & $1.5e-16^{***}$ & $7.6e-16^{***}$ & 0.8339 \\
451
+ AOL & LDLT-L & 121 & 6 & 79 & 36 & 0.1983 & -0.0167 & 127 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.8080 \\
452
+ LDLT-L & Sandwich & 121 & 11 & 98 & 12 & 0.1405 & -0.0371 & 291 & $2.8e-16^{***}$ & $0^{***}$ & $0^{***}$ & 0.7836 \\
453
+ Orthogonal & Sandwich & 121 & 16 & 95 & 10 & 0.1736 & -0.0340 & 427 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7486 \\
454
+ Sandwich & SLL & 121 & 86 & 24 & 11 & 0.7562 & 0.0261 & 845 & $0^{***}$ & $4.0e-10^{***}$ & $1.8e-09^{***}$ & 0.6276 \\
455
+ LDLT-L & LDLT-R & 121 & 20 & 89 & 12 & 0.2149 & -0.0193 & 847 & $1.0e-10^{***}$ & $6.0e-10^{***}$ & $3.1e-09^{***}$ & 0.6226 \\
456
+ LDLT-L & SLL & 121 & 29 & 72 & 20 & 0.3223 & -0.0068 & 1312 & $1.9e-05^{***}$ & $9.4e-05^{***}$ & $3.8e-04^{***}$ & 0.4257 \\
457
+ LDLT-R & SLL & 121 & 80 & 29 & 12 & 0.7107 & 0.0184 & 1331 & $4.7e-07^{***}$ & $2.8e-06^{***}$ & $1.4e-05^{***}$ & 0.4824 \\
458
+ LDLT-L & Orthogonal & 121 & 34 & 71 & 16 & 0.3471 & -0.0067 & 1607 & $1.7e-04^{***}$ & $5.2e-04^{***}$ & $2.8e-03^{**}$ & 0.3666 \\
459
+ LDLT-R & Orthogonal & 121 & 74 & 38 & 9 & 0.6488 & 0.0104 & 1829 & $1.1e-04^{***}$ & $4.3e-04^{***}$ & $1.8e-03^{**}$ & 0.3661 \\
460
+ LDLT-R & Sandwich & 121 & 45 & 68 & 8 & 0.4050 & -0.0092 & 2100 & $1.3e-03^{**}$ & $2.7e-03^{**}$ & $1.6e-02^{*}$ & 0.3018 \\
461
+ Orthogonal & SLL & 121 & 57 & 52 & 12 & 0.5207 & 0.0000 & 2967 & $9.3e-01$ & $9.3e-01$ & $1.0e+00$ & 0.0087 \\
462
+ \bottomrule
463
+ \end{tabular}
464
+ \begin{tablenotes}
465
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
466
+ \end{tablenotes}
467
+ \endgroup
468
+ \end{threeparttable}
469
+ \end{table*}
UCI_N4/ldlt-resnet/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/ldlt/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/ortho/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/sandwich/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/sdp/runs/abalone/fold_0/result.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 52,
3
+ "best_val_acc": 0.6253968253968254,
4
+ "test_acc": 0.6360367558929285,
5
+ "train_size": 1044,
6
+ "val_size": 630,
7
+ "test_size": 2503,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.03759131666666678,
12
+ -0.0067216787931033565,
13
+ -0.00504821235632188,
14
+ -0.010079406034482869,
15
+ 0.0077948497126437005,
16
+ -0.0035954527720305413,
17
+ 0.011847337255747069,
18
+ 0.020808682452107305
19
+ ]
20
+ ],
21
+ "std": [
22
+ [
23
+ 0.9932562075552053,
24
+ 1.0067465043023525,
25
+ 0.9980809038500921,
26
+ 0.9297052233036605,
27
+ 1.0141436995589543,
28
+ 0.9931430828536596,
29
+ 1.017739933100054,
30
+ 1.0318462596531948
31
+ ]
32
+ ]
33
+ },
34
+ "width": 32,
35
+ "in_features": 8,
36
+ "out_features": 3,
37
+ "depth": 4,
38
+ "padding": 16,
39
+ "parameters": 2355,
40
+ "cert_evals": {
41
+ "36": 0.5,
42
+ "72": 0.3539682626724243,
43
+ "108": 0.26031747460365295,
44
+ "255": 0.13968254625797272
45
+ }
46
+ }
UCI_N4/sdp/runs/abalone/fold_1/result.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 38,
3
+ "best_val_acc": 0.6735668789808917,
4
+ "test_acc": 0.6463073852295409,
5
+ "train_size": 1044,
6
+ "val_size": 628,
7
+ "test_size": 2505,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.005192849233716447,
12
+ -0.0023747756321838803,
13
+ -0.004999904980842867,
14
+ -0.01065197068965531,
15
+ -0.001757506036398443,
16
+ -0.0004581268045977247,
17
+ -0.008801511695402298,
18
+ -0.0025385303256705034
19
+ ]
20
+ ],
21
+ "std": [
22
+ [
23
+ 0.9921988752896624,
24
+ 1.0113577078934743,
25
+ 1.0108378611135136,
26
+ 0.93746968476643,
27
+ 1.0135082046349184,
28
+ 1.0099861173658438,
29
+ 1.0142707677051552,
30
+ 1.019381711286177
31
+ ]
32
+ ]
33
+ },
34
+ "width": 32,
35
+ "in_features": 8,
36
+ "out_features": 3,
37
+ "depth": 4,
38
+ "padding": 16,
39
+ "parameters": 2355,
40
+ "cert_evals": {
41
+ "36": 0.5143312215805054,
42
+ "72": 0.3821656107902527,
43
+ "108": 0.3200637102127075,
44
+ "255": 0.18789809942245483
45
+ }
46
+ }
UCI_N4/sdp/runs/abalone/fold_2/result.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 28,
3
+ "best_val_acc": 0.6888519134775375,
4
+ "test_acc": 0.6291469194312796,
5
+ "train_size": 1044,
6
+ "val_size": 601,
7
+ "test_size": 2532,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.017948929501915466,
12
+ 0.023985624319923418,
13
+ 0.023087170114942556,
14
+ 0.018317038026819783,
15
+ 0.02778346245977014,
16
+ 0.025539904827586328,
17
+ 0.018261344003831434,
18
+ 0.034770174578544095
19
+ ]
20
+ ],
21
+ "std": [
22
+ [
23
+ 0.9978233519534647,
24
+ 1.0049712832060378,
25
+ 1.0100440980049294,
26
+ 0.9634042347353897,
27
+ 1.0033357823934823,
28
+ 1.0054816988393045,
29
+ 0.9890488354165379,
30
+ 1.0152622279378631
31
+ ]
32
+ ]
33
+ },
34
+ "width": 32,
35
+ "in_features": 8,
36
+ "out_features": 3,
37
+ "depth": 4,
38
+ "padding": 16,
39
+ "parameters": 2355,
40
+ "cert_evals": {
41
+ "36": 0.5207986831665039,
42
+ "72": 0.410981684923172,
43
+ "108": 0.3211314380168915,
44
+ "255": 0.19134774804115295
45
+ }
46
+ }
UCI_N4/sdp/runs/abalone/fold_3/result.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 80,
3
+ "best_val_acc": 0.6523887973640856,
4
+ "test_acc": 0.6361836896278702,
5
+ "train_size": 1044,
6
+ "val_size": 607,
7
+ "test_size": 2526,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.039933615229885006,
12
+ 0.033357397988505864,
13
+ 0.02810616465517236,
14
+ 0.015225409386973148,
15
+ 0.03982630053544057,
16
+ 0.03327093634674338,
17
+ 0.031858401652298855,
18
+ 0.04330609419540234
19
+ ]
20
+ ],
21
+ "std": [
22
+ [
23
+ 1.000898664612302,
24
+ 1.0028361176421674,
25
+ 1.0029617333979737,
26
+ 0.9244955132147792,
27
+ 1.020547570022181,
28
+ 1.016662196023235,
29
+ 1.0053994226175234,
30
+ 1.025123395710352
31
+ ]
32
+ ]
33
+ },
34
+ "width": 32,
35
+ "in_features": 8,
36
+ "out_features": 3,
37
+ "depth": 4,
38
+ "padding": 16,
39
+ "parameters": 2355,
40
+ "cert_evals": {
41
+ "36": 0.5107083916664124,
42
+ "72": 0.40197691321372986,
43
+ "108": 0.31630972027778625,
44
+ "255": 0.18121910095214844
45
+ }
46
+ }
UCI_N4/sdp/runs/acute-inflammation/fold_0/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 6,
3
+ "best_val_acc": 0.75,
4
+ "test_acc": 0.5945945945945946,
5
+ "train_size": 30,
6
+ "val_size": 16,
7
+ "test_size": 74,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.029776199999999933,
12
+ 0.05815319999999998,
13
+ 0.03366299999999992,
14
+ -0.07041613333333337,
15
+ 0.0829954666666666,
16
+ 0.3029878333333334
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 1.046299339147563,
22
+ 1.028676385077134,
23
+ 0.9895473157792913,
24
+ 1.0179845925601472,
25
+ 0.9937462864656396,
26
+ 1.0009348864350793
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.375,
38
+ "72": 0.0,
39
+ "108": 0.0,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-inflammation/fold_1/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 4,
3
+ "best_val_acc": 0.7222222222222222,
4
+ "test_acc": 0.6805555555555556,
5
+ "train_size": 30,
6
+ "val_size": 18,
7
+ "test_size": 72,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.2066000000000002,
12
+ 0.2132320000000001,
13
+ 0.16832333333333327,
14
+ -6.666666666858371e-07,
15
+ 0.08299546666666664,
16
+ -0.033663
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 1.073465583913181,
22
+ 1.0965727109827237,
23
+ 0.9521923485684088,
24
+ 0.9958250796083059,
25
+ 0.9937462864656397,
26
+ 0.9895473157792911
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.5,
38
+ "72": 0.1666666716337204,
39
+ "108": 0.0555555559694767,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-inflammation/fold_2/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 29,
3
+ "best_val_acc": 0.75,
4
+ "test_acc": 0.9142857142857143,
5
+ "train_size": 30,
6
+ "val_size": 20,
7
+ "test_size": 70,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.06825569999999999,
12
+ -0.09692560000000008,
13
+ 0.10099316666666662,
14
+ 0.07041479999999994,
15
+ -0.11619693333333347,
16
+ 0.16832750000000007
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 0.9390286569686838,
22
+ 0.9304728,
23
+ 0.9733809278809981,
24
+ 0.9680526182869189,
25
+ 0.9870693041144554,
26
+ 1.0099525000000003
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.5,
38
+ "72": 0.5,
39
+ "108": 0.5,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-inflammation/fold_3/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 22,
3
+ "best_val_acc": 0.9523809523809523,
4
+ "test_acc": 0.8985507246376812,
5
+ "train_size": 30,
6
+ "val_size": 21,
7
+ "test_size": 69,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.061842666666666594,
12
+ -0.01938619999999999,
13
+ -0.03366716666666666,
14
+ -0.14083160000000008,
15
+ -0.049799466666666695,
16
+ -0.3029836666666666
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 0.9526045937382531,
22
+ 0.9838646893399317,
23
+ 1.000934886435079,
24
+ 1.0348917799997448,
25
+ 0.9937462864656396,
26
+ 0.8932355996217098
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.6190476417541504,
38
+ "72": 0.380952388048172,
39
+ "108": 0.190476194024086,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-nephritis/fold_0/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 20,
3
+ "best_val_acc": 1.0,
4
+ "test_acc": 0.8767123287671232,
5
+ "train_size": 30,
6
+ "val_size": 17,
7
+ "test_size": 73,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.1415510333333333,
12
+ 0.21323200000000003,
13
+ -0.03366716666666671,
14
+ -6.666666667154431e-07,
15
+ 0.2821878666666666,
16
+ -0.1683233333333333
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 1.0909027516263303,
22
+ 1.0965727109827237,
23
+ 1.0009348864350789,
24
+ 0.9958250796083059,
25
+ 0.9598970403996372,
26
+ 0.9521923485684088
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.7647058963775635,
38
+ "72": 0.5882353186607361,
39
+ "108": 0.29411765933036804,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-nephritis/fold_1/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 29,
3
+ "best_val_acc": 0.9285714285714286,
4
+ "test_acc": 0.881578947368421,
5
+ "train_size": 30,
6
+ "val_size": 14,
7
+ "test_size": 76,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.012368109999999948,
12
+ -0.0969256,
13
+ 0.10099316666666665,
14
+ -0.21124706666666673,
15
+ -0.11619693333333339,
16
+ -0.033662999999999985
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 0.9970611705313925,
22
+ 0.9304727999999999,
23
+ 0.9733809278809981,
24
+ 1.0468011683411809,
25
+ 0.9870693041144555,
26
+ 0.9895473157792911
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.7142857313156128,
38
+ "72": 0.5,
39
+ "108": 0.1428571492433548,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-nephritis/fold_2/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 12,
3
+ "best_val_acc": 1.0,
4
+ "test_acc": 1.0,
5
+ "train_size": 30,
6
+ "val_size": 11,
7
+ "test_size": 79,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.03252466666666676,
12
+ 0.05815320000000001,
13
+ -0.10099733333333338,
14
+ -6.666666667154431e-07,
15
+ 0.1493929333333332,
16
+ -0.033662999999999985
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 0.9744119491152714,
22
+ 1.0286763850771339,
23
+ 1.0077056618442157,
24
+ 0.9958250796083059,
25
+ 0.9870693041144553,
26
+ 0.9895473157792911
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.6363636255264282,
38
+ "72": 0.5454545617103577,
39
+ "108": 0.1818181872367859,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/acute-nephritis/fold_3/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 49,
3
+ "best_val_acc": 0.8421052631578947,
4
+ "test_acc": 0.9295774647887324,
5
+ "train_size": 30,
6
+ "val_size": 19,
7
+ "test_size": 71,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.029776590000000006,
12
+ -0.01938619999999999,
13
+ -0.10099733333333341,
14
+ -6.666666667080416e-07,
15
+ 0.01659799999999996,
16
+ -0.10099316666666663
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 1.0535901730675965,
22
+ 0.9838646893399317,
23
+ 1.0077056618442157,
24
+ 0.9958250796083058,
25
+ 0.995962,
26
+ 0.9733809278809978
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 2,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1818,
36
+ "cert_evals": {
37
+ "36": 0.5789473652839661,
38
+ "72": 0.4736842215061188,
39
+ "108": 0.3684210479259491,
40
+ "255": 0.0
41
+ }
42
+ }
UCI_N4/sdp/runs/adult/fold_0/result.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 4,
3
+ "best_val_acc": 0.8133191100274306,
4
+ "test_acc": 0.8112619716142928,
5
+ "train_size": 16281,
6
+ "val_size": 6562,
7
+ "test_size": 25999,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 5.755174894932247e-09,
12
+ -1.5212824565593372e-07,
13
+ 1.9344708602300844e-08,
14
+ -5.868804126934776e-07,
15
+ 4.3847429484189405e-07,
16
+ -1.2794054493469234e-07,
17
+ -3.0931760979923667e-08,
18
+ 1.2424912468644162e-06,
19
+ 2.0428720567267194e-07,
20
+ -1.2898470607021481e-06,
21
+ 5.428255022845695e-07,
22
+ 2.9734045846837646e-07,
23
+ 9.031386283659057e-08,
24
+ 2.0421350090431894e-07
25
+ ]
26
+ ],
27
+ "std": [
28
+ [
29
+ 0.999969279768083,
30
+ 0.9999691631254963,
31
+ 0.9999692601356567,
32
+ 0.9999684455490998,
33
+ 0.9999701766278255,
34
+ 0.9999695789931851,
35
+ 0.9999697101647755,
36
+ 0.9999695985584383,
37
+ 0.9999687129297181,
38
+ 0.999967689659048,
39
+ 0.9999708394490064,
40
+ 0.9999690163307019,
41
+ 0.9999694763882633,
42
+ 0.9999692067843523
43
+ ]
44
+ ]
45
+ },
46
+ "width": 64,
47
+ "in_features": 14,
48
+ "out_features": 2,
49
+ "depth": 4,
50
+ "padding": 28,
51
+ "parameters": 7738,
52
+ "cert_evals": {
53
+ "36": 0.7572386264801025,
54
+ "72": 0.696891188621521,
55
+ "108": 0.6298384666442871,
56
+ "255": 0.3817433714866638
57
+ }
58
+ }
UCI_N4/sdp/runs/adult/fold_1/result.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 3,
3
+ "best_val_acc": 0.8076100244498777,
4
+ "test_acc": 0.8065880001537457,
5
+ "train_size": 16281,
6
+ "val_size": 6544,
7
+ "test_size": 26017,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 5.755174894932247e-09,
12
+ -1.5212824565593372e-07,
13
+ 1.9344708602300844e-08,
14
+ -5.868804126934776e-07,
15
+ 4.3847429484189405e-07,
16
+ -1.2794054493469234e-07,
17
+ -3.0931760979923667e-08,
18
+ 1.2424912468644162e-06,
19
+ 2.0428720567267194e-07,
20
+ -1.2898470607021481e-06,
21
+ 5.428255022845695e-07,
22
+ 2.9734045846837646e-07,
23
+ 9.031386283659057e-08,
24
+ 2.0421350090431894e-07
25
+ ]
26
+ ],
27
+ "std": [
28
+ [
29
+ 0.999969279768083,
30
+ 0.9999691631254963,
31
+ 0.9999692601356567,
32
+ 0.9999684455490998,
33
+ 0.9999701766278255,
34
+ 0.9999695789931851,
35
+ 0.9999697101647755,
36
+ 0.9999695985584383,
37
+ 0.9999687129297181,
38
+ 0.999967689659048,
39
+ 0.9999708394490064,
40
+ 0.9999690163307019,
41
+ 0.9999694763882633,
42
+ 0.9999692067843523
43
+ ]
44
+ ]
45
+ },
46
+ "width": 64,
47
+ "in_features": 14,
48
+ "out_features": 2,
49
+ "depth": 4,
50
+ "padding": 28,
51
+ "parameters": 7738,
52
+ "cert_evals": {
53
+ "36": 0.7496944069862366,
54
+ "72": 0.6919315457344055,
55
+ "108": 0.6314181089401245,
56
+ "255": 0.3694987893104553
57
+ }
58
+ }
UCI_N4/sdp/runs/adult/fold_2/result.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 2,
3
+ "best_val_acc": 0.804847923421337,
4
+ "test_acc": 0.8083116086489802,
5
+ "train_size": 16281,
6
+ "val_size": 6477,
7
+ "test_size": 26084,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 5.755174894932247e-09,
12
+ -1.5212824565593372e-07,
13
+ 1.9344708602300844e-08,
14
+ -5.868804126934776e-07,
15
+ 4.3847429484189405e-07,
16
+ -1.2794054493469234e-07,
17
+ -3.0931760979923667e-08,
18
+ 1.2424912468644162e-06,
19
+ 2.0428720567267194e-07,
20
+ -1.2898470607021481e-06,
21
+ 5.428255022845695e-07,
22
+ 2.9734045846837646e-07,
23
+ 9.031386283659057e-08,
24
+ 2.0421350090431894e-07
25
+ ]
26
+ ],
27
+ "std": [
28
+ [
29
+ 0.999969279768083,
30
+ 0.9999691631254963,
31
+ 0.9999692601356567,
32
+ 0.9999684455490998,
33
+ 0.9999701766278255,
34
+ 0.9999695789931851,
35
+ 0.9999697101647755,
36
+ 0.9999695985584383,
37
+ 0.9999687129297181,
38
+ 0.999967689659048,
39
+ 0.9999708394490064,
40
+ 0.9999690163307019,
41
+ 0.9999694763882633,
42
+ 0.9999692067843523
43
+ ]
44
+ ]
45
+ },
46
+ "width": 64,
47
+ "in_features": 14,
48
+ "out_features": 2,
49
+ "depth": 4,
50
+ "padding": 28,
51
+ "parameters": 7738,
52
+ "cert_evals": {
53
+ "36": 0.748803436756134,
54
+ "72": 0.6862744688987732,
55
+ "108": 0.6271421909332275,
56
+ "255": 0.3605063855648041
57
+ }
58
+ }
UCI_N4/sdp/runs/adult/fold_3/result.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 7,
3
+ "best_val_acc": 0.8011200242167398,
4
+ "test_acc": 0.8089311859443631,
5
+ "train_size": 16281,
6
+ "val_size": 6607,
7
+ "test_size": 25954,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 5.755174894932247e-09,
12
+ -1.5212824565593372e-07,
13
+ 1.9344708602300844e-08,
14
+ -5.868804126934776e-07,
15
+ 4.3847429484189405e-07,
16
+ -1.2794054493469234e-07,
17
+ -3.0931760979923667e-08,
18
+ 1.2424912468644162e-06,
19
+ 2.0428720567267194e-07,
20
+ -1.2898470607021481e-06,
21
+ 5.428255022845695e-07,
22
+ 2.9734045846837646e-07,
23
+ 9.031386283659057e-08,
24
+ 2.0421350090431894e-07
25
+ ]
26
+ ],
27
+ "std": [
28
+ [
29
+ 0.999969279768083,
30
+ 0.9999691631254963,
31
+ 0.9999692601356567,
32
+ 0.9999684455490998,
33
+ 0.9999701766278255,
34
+ 0.9999695789931851,
35
+ 0.9999697101647755,
36
+ 0.9999695985584383,
37
+ 0.9999687129297181,
38
+ 0.999967689659048,
39
+ 0.9999708394490064,
40
+ 0.9999690163307019,
41
+ 0.9999694763882633,
42
+ 0.9999692067843523
43
+ ]
44
+ ]
45
+ },
46
+ "width": 64,
47
+ "in_features": 14,
48
+ "out_features": 2,
49
+ "depth": 4,
50
+ "padding": 28,
51
+ "parameters": 7738,
52
+ "cert_evals": {
53
+ "36": 0.7470864653587341,
54
+ "72": 0.6932042241096497,
55
+ "108": 0.6344786286354065,
56
+ "255": 0.38141366839408875
57
+ }
58
+ }
UCI_N4/sdp/runs/annealing/fold_0/result.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 39,
3
+ "best_val_acc": 0.8154761904761905,
4
+ "test_acc": 0.7746031746031746,
5
+ "train_size": 100,
6
+ "val_size": 168,
7
+ "test_size": 630,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.07222222999999978,
12
+ -0.345,
13
+ 4.33,
14
+ 12.0,
15
+ 0.14,
16
+ -0.17333315999999985,
17
+ -0.07800000000000064,
18
+ 29.2,
19
+ 0.09999999999999996,
20
+ -0.010000000000000224,
21
+ 0.3,
22
+ -0.010000000000000111,
23
+ -4.132729999999996e-16,
24
+ -0.11000000000000007,
25
+ -0.11999999999999993,
26
+ -0.12999999999999998,
27
+ -0.13,
28
+ -0.029999999999999773,
29
+ -1.847940000000002e-16,
30
+ -0.05999999999999975,
31
+ -1.626729999999999e-16,
32
+ -0.03999999999999998,
33
+ -0.010000000000000222,
34
+ -0.06000000000000002,
35
+ 0.1,
36
+ 1.3318299999999998,
37
+ 771.9469999999998,
38
+ 1183.75,
39
+ 0.009999999999999986,
40
+ -0.9466666699999999,
41
+ -1.5582099999999978e-17
42
+ ]
43
+ ],
44
+ "std": [
45
+ [
46
+ 0.27504207913753365,
47
+ 0.41800119617053744,
48
+ 14.650634798533474,
49
+ 25.758493744782516,
50
+ 0.34698703145794935,
51
+ 0.2133331200000003,
52
+ 0.2543933961407015,
53
+ 110.08796482813175,
54
+ 0.29999999999999993,
55
+ 0.09949874371066192,
56
+ 0.47958315233127174,
57
+ 0.06557438524301994,
58
+ 1.0,
59
+ 0.31288975694324034,
60
+ 0.32496153618543855,
61
+ 0.3363034344160047,
62
+ 0.3363034344160045,
63
+ 0.17058722109231966,
64
+ 1.0,
65
+ 0.23748684174075815,
66
+ 1.0,
67
+ 0.19595917942265428,
68
+ 0.09949874371066192,
69
+ 0.2374868417407582,
70
+ 0.9949874371066199,
71
+ 0.9335979547428329,
72
+ 410.1759096911958,
73
+ 1742.0412703205398,
74
+ 0.09949874371066196,
75
+ 0.2436755226844934,
76
+ 1.0
77
+ ]
78
+ ]
79
+ },
80
+ "width": 128,
81
+ "in_features": 31,
82
+ "out_features": 5,
83
+ "depth": 4,
84
+ "padding": 62,
85
+ "parameters": 33083,
86
+ "cert_evals": {
87
+ "36": 0.7976190447807312,
88
+ "72": 0.785714328289032,
89
+ "108": 0.7797619104385376,
90
+ "255": 0.6190476417541504
91
+ }
92
+ }
UCI_N4/sdp/runs/annealing/fold_1/result.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 58,
3
+ "best_val_acc": 0.8136645962732919,
4
+ "test_acc": 0.7551020408163265,
5
+ "train_size": 100,
6
+ "val_size": 161,
7
+ "test_size": 637,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.07222222999999978,
12
+ -0.345,
13
+ 4.33,
14
+ 12.0,
15
+ 0.14,
16
+ -0.17333315999999985,
17
+ -0.07800000000000064,
18
+ 29.2,
19
+ 0.09999999999999996,
20
+ -0.010000000000000224,
21
+ 0.3,
22
+ -0.010000000000000111,
23
+ -4.132729999999996e-16,
24
+ -0.11000000000000007,
25
+ -0.11999999999999993,
26
+ -0.12999999999999998,
27
+ -0.13,
28
+ -0.029999999999999773,
29
+ -1.847940000000002e-16,
30
+ -0.05999999999999975,
31
+ -1.626729999999999e-16,
32
+ -0.03999999999999998,
33
+ -0.010000000000000222,
34
+ -0.06000000000000002,
35
+ 0.1,
36
+ 1.3318299999999998,
37
+ 771.9469999999998,
38
+ 1183.75,
39
+ 0.009999999999999986,
40
+ -0.9466666699999999,
41
+ -1.5582099999999978e-17
42
+ ]
43
+ ],
44
+ "std": [
45
+ [
46
+ 0.27504207913753365,
47
+ 0.41800119617053744,
48
+ 14.650634798533474,
49
+ 25.758493744782516,
50
+ 0.34698703145794935,
51
+ 0.2133331200000003,
52
+ 0.2543933961407015,
53
+ 110.08796482813175,
54
+ 0.29999999999999993,
55
+ 0.09949874371066192,
56
+ 0.47958315233127174,
57
+ 0.06557438524301994,
58
+ 1.0,
59
+ 0.31288975694324034,
60
+ 0.32496153618543855,
61
+ 0.3363034344160047,
62
+ 0.3363034344160045,
63
+ 0.17058722109231966,
64
+ 1.0,
65
+ 0.23748684174075815,
66
+ 1.0,
67
+ 0.19595917942265428,
68
+ 0.09949874371066192,
69
+ 0.2374868417407582,
70
+ 0.9949874371066199,
71
+ 0.9335979547428329,
72
+ 410.1759096911958,
73
+ 1742.0412703205398,
74
+ 0.09949874371066196,
75
+ 0.2436755226844934,
76
+ 1.0
77
+ ]
78
+ ]
79
+ },
80
+ "width": 128,
81
+ "in_features": 31,
82
+ "out_features": 5,
83
+ "depth": 4,
84
+ "padding": 62,
85
+ "parameters": 33083,
86
+ "cert_evals": {
87
+ "36": 0.7515528202056885,
88
+ "72": 0.739130437374115,
89
+ "108": 0.695652186870575,
90
+ "255": 0.52173912525177
91
+ }
92
+ }
UCI_N4/sdp/runs/annealing/fold_2/result.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 62,
3
+ "best_val_acc": 0.7309941520467836,
4
+ "test_acc": 0.7400318979266348,
5
+ "train_size": 100,
6
+ "val_size": 171,
7
+ "test_size": 627,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.07222222999999978,
12
+ -0.345,
13
+ 4.33,
14
+ 12.0,
15
+ 0.14,
16
+ -0.17333315999999985,
17
+ -0.07800000000000064,
18
+ 29.2,
19
+ 0.09999999999999996,
20
+ -0.010000000000000224,
21
+ 0.3,
22
+ -0.010000000000000111,
23
+ -4.132729999999996e-16,
24
+ -0.11000000000000007,
25
+ -0.11999999999999993,
26
+ -0.12999999999999998,
27
+ -0.13,
28
+ -0.029999999999999773,
29
+ -1.847940000000002e-16,
30
+ -0.05999999999999975,
31
+ -1.626729999999999e-16,
32
+ -0.03999999999999998,
33
+ -0.010000000000000222,
34
+ -0.06000000000000002,
35
+ 0.1,
36
+ 1.3318299999999998,
37
+ 771.9469999999998,
38
+ 1183.75,
39
+ 0.009999999999999986,
40
+ -0.9466666699999999,
41
+ -1.5582099999999978e-17
42
+ ]
43
+ ],
44
+ "std": [
45
+ [
46
+ 0.27504207913753365,
47
+ 0.41800119617053744,
48
+ 14.650634798533474,
49
+ 25.758493744782516,
50
+ 0.34698703145794935,
51
+ 0.2133331200000003,
52
+ 0.2543933961407015,
53
+ 110.08796482813175,
54
+ 0.29999999999999993,
55
+ 0.09949874371066192,
56
+ 0.47958315233127174,
57
+ 0.06557438524301994,
58
+ 1.0,
59
+ 0.31288975694324034,
60
+ 0.32496153618543855,
61
+ 0.3363034344160047,
62
+ 0.3363034344160045,
63
+ 0.17058722109231966,
64
+ 1.0,
65
+ 0.23748684174075815,
66
+ 1.0,
67
+ 0.19595917942265428,
68
+ 0.09949874371066192,
69
+ 0.2374868417407582,
70
+ 0.9949874371066199,
71
+ 0.9335979547428329,
72
+ 410.1759096911958,
73
+ 1742.0412703205398,
74
+ 0.09949874371066196,
75
+ 0.2436755226844934,
76
+ 1.0
77
+ ]
78
+ ]
79
+ },
80
+ "width": 128,
81
+ "in_features": 31,
82
+ "out_features": 5,
83
+ "depth": 4,
84
+ "padding": 62,
85
+ "parameters": 33083,
86
+ "cert_evals": {
87
+ "36": 0.6783626079559326,
88
+ "72": 0.6491228342056274,
89
+ "108": 0.6257309913635254,
90
+ "255": 0.5087719559669495
91
+ }
92
+ }
UCI_N4/sdp/runs/annealing/fold_3/result.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 58,
3
+ "best_val_acc": 0.7245508982035929,
4
+ "test_acc": 0.7321711568938193,
5
+ "train_size": 100,
6
+ "val_size": 167,
7
+ "test_size": 631,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.07222222999999978,
12
+ -0.345,
13
+ 4.33,
14
+ 12.0,
15
+ 0.14,
16
+ -0.17333315999999985,
17
+ -0.07800000000000064,
18
+ 29.2,
19
+ 0.09999999999999996,
20
+ -0.010000000000000224,
21
+ 0.3,
22
+ -0.010000000000000111,
23
+ -4.132729999999996e-16,
24
+ -0.11000000000000007,
25
+ -0.11999999999999993,
26
+ -0.12999999999999998,
27
+ -0.13,
28
+ -0.029999999999999773,
29
+ -1.847940000000002e-16,
30
+ -0.05999999999999975,
31
+ -1.626729999999999e-16,
32
+ -0.03999999999999998,
33
+ -0.010000000000000222,
34
+ -0.06000000000000002,
35
+ 0.1,
36
+ 1.3318299999999998,
37
+ 771.9469999999998,
38
+ 1183.75,
39
+ 0.009999999999999986,
40
+ -0.9466666699999999,
41
+ -1.5582099999999978e-17
42
+ ]
43
+ ],
44
+ "std": [
45
+ [
46
+ 0.27504207913753365,
47
+ 0.41800119617053744,
48
+ 14.650634798533474,
49
+ 25.758493744782516,
50
+ 0.34698703145794935,
51
+ 0.2133331200000003,
52
+ 0.2543933961407015,
53
+ 110.08796482813175,
54
+ 0.29999999999999993,
55
+ 0.09949874371066192,
56
+ 0.47958315233127174,
57
+ 0.06557438524301994,
58
+ 1.0,
59
+ 0.31288975694324034,
60
+ 0.32496153618543855,
61
+ 0.3363034344160047,
62
+ 0.3363034344160045,
63
+ 0.17058722109231966,
64
+ 1.0,
65
+ 0.23748684174075815,
66
+ 1.0,
67
+ 0.19595917942265428,
68
+ 0.09949874371066192,
69
+ 0.2374868417407582,
70
+ 0.9949874371066199,
71
+ 0.9335979547428329,
72
+ 410.1759096911958,
73
+ 1742.0412703205398,
74
+ 0.09949874371066196,
75
+ 0.2436755226844934,
76
+ 1.0
77
+ ]
78
+ ]
79
+ },
80
+ "width": 128,
81
+ "in_features": 31,
82
+ "out_features": 5,
83
+ "depth": 4,
84
+ "padding": 62,
85
+ "parameters": 33083,
86
+ "cert_evals": {
87
+ "36": 0.7005988359451294,
88
+ "72": 0.6706587076187134,
89
+ "108": 0.6347305774688721,
90
+ "255": 0.5389221906661987
91
+ }
92
+ }
UCI_N4/sdp/runs/arrhythmia/fold_0/result.json ADDED
@@ -0,0 +1,554 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 25,
3
+ "best_val_acc": 0.5949367088607594,
4
+ "test_acc": 0.5538461538461539,
5
+ "train_size": 113,
6
+ "val_size": 79,
7
+ "test_size": 260,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.05548900442477873,
12
+ 0.17327679646017674,
13
+ -0.09933938283185836,
14
+ -0.022536060176991165,
15
+ -0.05529378318584072,
16
+ -0.02827017327433631,
17
+ -0.005964132743362813,
18
+ 0.04588333831858407,
19
+ -0.06835887191150443,
20
+ -0.01879734327433625,
21
+ 0.08708691123893805,
22
+ -0.010227719469026567,
23
+ -0.05324860619469024,
24
+ 0.03857876283185871,
25
+ -0.0029412946902654486,
26
+ -0.14624673451327397,
27
+ 0.0106677238938053,
28
+ -0.09994685221238946,
29
+ -2.2654867242673962e-07,
30
+ -0.10041930088495568,
31
+ 0.14110856637168184,
32
+ -0.02112876106194691,
33
+ -0.021128761061946916,
34
+ -0.06659289999999989,
35
+ -0.06659289999999989,
36
+ -0.09438650000000005,
37
+ -0.024449619469026587,
38
+ -0.006156723893805307,
39
+ -0.03655609734513271,
40
+ -0.06008078761061956,
41
+ -0.05587280000000011,
42
+ -0.1535461769911505,
43
+ -2.9203539835147346e-07,
44
+ 0.1454482212389377,
45
+ -0.04703600000000003,
46
+ -0.06659289999999989,
47
+ 0.0665928778761063,
48
+ -0.053692424778761245,
49
+ 0.10382045292035355,
50
+ -0.045959752212389356,
51
+ -0.039423744247787586,
52
+ -0.042264867256637376,
53
+ -0.0339906548672566,
54
+ -0.10218601769911498,
55
+ -0.04703600000000003,
56
+ 0.04783872566371683,
57
+ 0.14110856637168165,
58
+ -2.920353982139237e-07,
59
+ -0.1056450000000003,
60
+ -0.06659289999999989,
61
+ 0.039230692920353964,
62
+ -0.048857433628318604,
63
+ -0.0949235044247789,
64
+ -0.0951867699115044,
65
+ -0.04703600000000003,
66
+ -0.07884043362831854,
67
+ -0.021128761061946947,
68
+ 0.0665928778761063,
69
+ 0.0665928778761063,
70
+ 0.06659287787610634,
71
+ 0.0665928778761063,
72
+ 1.0619469034296467e-07,
73
+ -0.14459542477876128,
74
+ 0.10166875221238943,
75
+ -0.0007696849557522316,
76
+ 0.08089214159292042,
77
+ 0.024555884070796462,
78
+ -0.06704164601769926,
79
+ -0.04703600000000003,
80
+ 0.1411085663716821,
81
+ 0.02721671504424786,
82
+ -0.04703600000000003,
83
+ 0.008643274336283235,
84
+ -0.03328283893805306,
85
+ -0.08280126353982296,
86
+ -0.04353061946902624,
87
+ 0.022193132743362702,
88
+ -0.07879264601769921,
89
+ 0.06659287787610634,
90
+ 0.07170867256637195,
91
+ 0.1411085663716824,
92
+ -0.04703600000000003,
93
+ 0.14110856637168173,
94
+ -0.05805589380530971,
95
+ 0.08516874884955755,
96
+ 0.043014315044247776,
97
+ -0.002110141592920556,
98
+ -0.07482919999999994,
99
+ 0.027698871681415955,
100
+ -0.08165009999999992,
101
+ -0.0536924247787612,
102
+ 1.0619469030955972e-07,
103
+ -0.09438650000000005,
104
+ 0.06338747787610613,
105
+ -0.0901489026548673,
106
+ -0.04849817699115047,
107
+ 0.07722033628318585,
108
+ 0.026260424778761074,
109
+ 0.0738569911504426,
110
+ 0.04712901946902665,
111
+ 0.16431531858407084,
112
+ 0.09438671238938037,
113
+ 0.09438671238938054,
114
+ -0.0386190796460177,
115
+ -0.09438650000000005,
116
+ 1.0619469029580476e-07,
117
+ 0.06704106194690244,
118
+ 0.00271023008849546,
119
+ 0.04821953097345133,
120
+ -0.022629159292035374,
121
+ 0.24075912389380558,
122
+ 0.19588278672566428,
123
+ 0.10636762831858415,
124
+ 0.07170867256637167,
125
+ 0.0665928778761063,
126
+ -0.08165009999999992,
127
+ 1.0619469029580476e-07,
128
+ 0.24495034513274322,
129
+ -0.02112876106194717,
130
+ -0.03837423008849555,
131
+ 0.0792644690265486,
132
+ -0.010963192920353986,
133
+ -0.13985853097345086,
134
+ -0.06118739999999991,
135
+ -0.05918213274336283,
136
+ -0.06659289999999989,
137
+ 0.19309768141592948,
138
+ 0.0665928778761063,
139
+ -2.920353984064934e-07,
140
+ -0.08791879646017699,
141
+ -0.009588667256637163,
142
+ 0.039876742477876134,
143
+ -0.04371391504424787,
144
+ -0.09472733274336269,
145
+ -0.08165009999999992,
146
+ -0.04703600000000003,
147
+ -0.08165009999999992,
148
+ -0.059833336283185844,
149
+ -0.07838458407079653,
150
+ -0.015475274336283125,
151
+ -0.0805356,
152
+ -0.13698139380530983,
153
+ 0.14110856637168137,
154
+ -0.04703600000000003,
155
+ 0.0665928778761063,
156
+ -0.021128761061947016,
157
+ 0.017010241592920368,
158
+ 0.09822180530973434,
159
+ 0.005761375398230098,
160
+ 0.0322361946902655,
161
+ -0.034939104424778704,
162
+ 0.06566965486725665,
163
+ 0.061632838053097376,
164
+ 0.0004023300884955741,
165
+ 0.07045262681415927,
166
+ 0.028733457522123865,
167
+ 0.02147898230088495,
168
+ -0.05026543539823011,
169
+ 0.060225181415929224,
170
+ -0.07029714159292026,
171
+ 0.06618380000000008,
172
+ 0.011594984955752213,
173
+ 0.040387401769911555,
174
+ -0.0058615916814159065,
175
+ 0.04742410654867257,
176
+ -0.015766054867256643,
177
+ -0.062290848053097175,
178
+ -0.05214830601769914,
179
+ 0.04644970973451337,
180
+ -0.05739616814159293,
181
+ 0.05439313274336291,
182
+ -0.0036409858407079588,
183
+ -0.009598277876106183,
184
+ -0.011235967256637188,
185
+ -0.002634908849557516,
186
+ -0.005508535398230053,
187
+ -0.05590965752212387,
188
+ -0.06772527787610619,
189
+ 0.08251315044247781,
190
+ -0.08976234513274321,
191
+ 0.04703600000000003,
192
+ -0.04274165486725669,
193
+ -0.05909215752212393,
194
+ 0.027935999115044265,
195
+ -0.036451818017699096,
196
+ 0.03197787610619467,
197
+ 0.1596792035398229,
198
+ 0.0024668168141592844,
199
+ -0.015842806194690306,
200
+ 0.07878208849557493,
201
+ 0.006463776548672604,
202
+ 0.06462291946902653,
203
+ 0.025483634513274327,
204
+ 0.06707996637168136,
205
+ -0.07861038619469025,
206
+ -0.0949829097345134,
207
+ -0.08679084778761066,
208
+ 0.09411216159292037,
209
+ -0.061483929203539976,
210
+ -0.03750280353982299,
211
+ 0.024982454867256657,
212
+ 0.010920844247787605,
213
+ -0.036973680442477924,
214
+ -0.00325765690265486,
215
+ -0.06706977168141595,
216
+ 0.054682415929203546,
217
+ 0.07233616902654867,
218
+ 0.024967183185840673,
219
+ 0.0201886814159292,
220
+ 0.0625599000000001,
221
+ 0.016163015929203547,
222
+ -0.19404511061946894,
223
+ 0.1314095771681416,
224
+ -0.02607840336283184,
225
+ -0.07232390353982299,
226
+ 0.06542182300884967,
227
+ 0.09097714132743363,
228
+ -0.0490932584955752,
229
+ 0.17395115044247766,
230
+ -0.08915754336283198,
231
+ 0.005843493805309704,
232
+ -0.1311985026548673,
233
+ 0.0822022767256637,
234
+ -0.0316962311504425,
235
+ -0.15503262123893807,
236
+ 0.050416203539823005,
237
+ 0.012278147787610633,
238
+ 0.0764223432743363,
239
+ 0.20117684424778776,
240
+ -0.15312840973451328,
241
+ -0.006850403539823016,
242
+ -0.22191862300884949,
243
+ 0.1207021007964602,
244
+ -0.08917110283185833,
245
+ -0.07690047646017703,
246
+ 0.030319972566371638,
247
+ -0.1126870734513274,
248
+ 0.06241866831858403,
249
+ -0.1273596991150443,
250
+ 0.06213639999999999,
251
+ -0.07254762831858405,
252
+ -0.08504349999999997,
253
+ 0.034207636283185856,
254
+ -0.02238689532743362,
255
+ 0.10946240796460185,
256
+ 0.021622823008849552,
257
+ -0.1487953611504425,
258
+ 0.02685327893805308,
259
+ -0.04490421946902649,
260
+ -0.04955592035398229,
261
+ 0.06734868938053096,
262
+ -0.08363668734513273,
263
+ 0.022693176017699095,
264
+ 0.09933861353982294,
265
+ -0.00604589380530972,
266
+ -0.10963647433628322,
267
+ 0.03259297079646029,
268
+ -0.07945840000000003,
269
+ -0.007002541592920362,
270
+ 0.10658185398230094,
271
+ -0.0866022876106194,
272
+ 0.06365430106194689
273
+ ]
274
+ ],
275
+ "std": [
276
+ [
277
+ 0.9732374444872444,
278
+ 0.9655808459932996,
279
+ 0.2507734231833244,
280
+ 0.85756632700396,
281
+ 0.9152499916483915,
282
+ 0.9319460220789437,
283
+ 0.9577523305438101,
284
+ 1.1527478213503135,
285
+ 0.9576681124104236,
286
+ 1.0097636409421697,
287
+ 0.9939501739346246,
288
+ 0.8077223719814682,
289
+ 0.9956881527950738,
290
+ 1.065832253077651,
291
+ 0.8648866626310105,
292
+ 0.7884428876814543,
293
+ 0.8846283104978594,
294
+ 1.0392968702844574,
295
+ 0.9547571784517959,
296
+ 0.830419971626617,
297
+ 1.9911349325902201,
298
+ 0.8944357999064113,
299
+ 0.8944357999064099,
300
+ 1.0,
301
+ 1.0,
302
+ 1.0,
303
+ 1.0288388455432311,
304
+ 1.0366372636701484,
305
+ 1.0104922342254585,
306
+ 0.6029602666961917,
307
+ 1.0,
308
+ 0.9119059418676891,
309
+ 0.9988936769842922,
310
+ 1.3401171108416883,
311
+ 1.0,
312
+ 1.0,
313
+ 1.409505785723462,
314
+ 0.7576328500006007,
315
+ 1.1142082921935355,
316
+ 1.100915710823559,
317
+ 0.9521761840451372,
318
+ 0.8352521125885086,
319
+ 0.7194469320515606,
320
+ 0.9886952789548065,
321
+ 1.0,
322
+ 1.111662684055426,
323
+ 1.9911349325902201,
324
+ 0.9988936769842919,
325
+ 1.0,
326
+ 1.0,
327
+ 0.9092993788613446,
328
+ 1.061138924056677,
329
+ 0.8860454459362529,
330
+ 0.77869888137794,
331
+ 1.0,
332
+ 0.9971658374137916,
333
+ 0.8944357999064098,
334
+ 1.4095057857234619,
335
+ 1.409505785723463,
336
+ 1.4095057857234636,
337
+ 1.4095057857234625,
338
+ 0.9988939483461562,
339
+ 0.8359429042688657,
340
+ 0.9455652546275832,
341
+ 1.047159553008427,
342
+ 1.2373317065584502,
343
+ 0.9367499049873408,
344
+ 0.7094990007768702,
345
+ 1.0,
346
+ 1.9911349325902201,
347
+ 1.152138074538977,
348
+ 1.0,
349
+ 1.076296523650441,
350
+ 1.0790204523971971,
351
+ 0.9278040585020654,
352
+ 0.6623289850929874,
353
+ 1.0736843273720698,
354
+ 1.059187675645061,
355
+ 1.4095057857234636,
356
+ 1.1978616378928757,
357
+ 1.9911349325902201,
358
+ 1.0,
359
+ 1.9911349325902201,
360
+ 0.9142231440920847,
361
+ 1.3486308966826843,
362
+ 0.9779239267203217,
363
+ 1.072217573812213,
364
+ 1.0,
365
+ 1.0670736267417575,
366
+ 1.0,
367
+ 0.7576328500006009,
368
+ 0.9988939483461562,
369
+ 1.0,
370
+ 1.2592635987036094,
371
+ 0.6360290623787335,
372
+ 0.8549033709264361,
373
+ 1.300841714365119,
374
+ 0.979322007928904,
375
+ 1.2296324368044147,
376
+ 1.3300447893255654,
377
+ 1.2339107860310472,
378
+ 1.4063287585864288,
379
+ 1.4063287585864277,
380
+ 0.817419899167048,
381
+ 1.0,
382
+ 0.9988939483461566,
383
+ 1.2178666747421332,
384
+ 0.9179155627028488,
385
+ 1.1674686384124506,
386
+ 0.937597875841375,
387
+ 1.9128860722576218,
388
+ 1.9849443701676805,
389
+ 1.2128492302504466,
390
+ 1.1978616378928766,
391
+ 1.409505785723462,
392
+ 1.0,
393
+ 0.9988939483461566,
394
+ 1.9776639067090993,
395
+ 0.8944357999064088,
396
+ 0.9089427774812973,
397
+ 1.1565813541259533,
398
+ 0.9312031818896745,
399
+ 0.37790291497240225,
400
+ 1.0,
401
+ 1.0103067336455187,
402
+ 1.0,
403
+ 1.612796005825811,
404
+ 1.4095057857234625,
405
+ 0.9988936769842919,
406
+ 0.9869575017654069,
407
+ 1.0625408223089012,
408
+ 0.8572543250334869,
409
+ 0.4626232154331089,
410
+ 0.8399894436428749,
411
+ 1.0,
412
+ 1.0,
413
+ 1.0,
414
+ 0.9949165069017805,
415
+ 0.9763809111647539,
416
+ 0.9886383527662114,
417
+ 1.0,
418
+ 0.8853802248708618,
419
+ 1.9911349325902201,
420
+ 1.0,
421
+ 1.4095057857234612,
422
+ 0.8944357999064094,
423
+ 0.8545082434186259,
424
+ 0.8796291945635648,
425
+ 0.9389113833926183,
426
+ 0.8861374760427413,
427
+ 0.39441056751713705,
428
+ 0.8648668783726172,
429
+ 0.9862191391833568,
430
+ 0.8481954658017612,
431
+ 0.9206020572467216,
432
+ 0.886517128434336,
433
+ 1.0192902215038742,
434
+ 0.956622629021229,
435
+ 0.8523688961466389,
436
+ 0.2992587051477164,
437
+ 1.0,
438
+ 0.8898404778961094,
439
+ 1.0071877733497892,
440
+ 0.950155747946548,
441
+ 1.0050918229648342,
442
+ 0.7815635141616576,
443
+ 0.9972744785704897,
444
+ 0.9594844360499902,
445
+ 0.9255046483391078,
446
+ 0.4876909595587591,
447
+ 0.5036861467715275,
448
+ 0.8566188861170654,
449
+ 0.7638467720219689,
450
+ 1.0032544884403838,
451
+ 1.0560420525550518,
452
+ 0.8986819691295396,
453
+ 0.9372189161919664,
454
+ 0.8101867430665612,
455
+ 0.8950623205358443,
456
+ 0.7725356624236849,
457
+ 1.0,
458
+ 0.872460731649835,
459
+ 1.045597205130584,
460
+ 0.881115812189619,
461
+ 0.9553256168269835,
462
+ 0.8848742890899297,
463
+ 0.5907365616618244,
464
+ 0.9525692591339604,
465
+ 0.9761188977078773,
466
+ 1.2163938242844157,
467
+ 0.9319895550002153,
468
+ 0.8335462617896103,
469
+ 0.9176414735582966,
470
+ 0.9775951517497435,
471
+ 0.8425042883529639,
472
+ 1.2598848541968266,
473
+ 0.949252647471748,
474
+ 0.838972165335258,
475
+ 0.23456841787874302,
476
+ 1.1642248030770597,
477
+ 0.8628119131177865,
478
+ 0.8751618803772816,
479
+ 0.9228296916565395,
480
+ 0.9809394578124714,
481
+ 0.5915262659968897,
482
+ 0.8563703331027254,
483
+ 1.223677024967222,
484
+ 0.9284798655045788,
485
+ 1.2965375076317172,
486
+ 1.0,
487
+ 0.9389878405072626,
488
+ 0.8540110671890598,
489
+ 1.316521539927867,
490
+ 1.4340416104694482,
491
+ 0.8735072262525767,
492
+ 0.676363014728904,
493
+ 1.1134658692256694,
494
+ 1.0134545560863548,
495
+ 1.7552329970203224,
496
+ 1.7155564074285294,
497
+ 0.873049365917997,
498
+ 1.030474558081803,
499
+ 1.0170344415415917,
500
+ 1.0766146909852692,
501
+ 0.7111765255105056,
502
+ 0.6923440560955865,
503
+ 1.0058025631570486,
504
+ 0.9240158601820535,
505
+ 1.9435205267323648,
506
+ 1.9899491083438348,
507
+ 0.8387690283436754,
508
+ 0.9708565551581373,
509
+ 0.8493149601758292,
510
+ 0.985055690803851,
511
+ 0.8279931417986857,
512
+ 0.9098729896957297,
513
+ 0.9370725829078755,
514
+ 0.8393620512490872,
515
+ 0.28080206241297245,
516
+ 1.0,
517
+ 0.8220194136548338,
518
+ 0.9761698379739507,
519
+ 0.7917031329595748,
520
+ 0.9270879739715543,
521
+ 0.847139011361557,
522
+ 1.0122054789755355,
523
+ 0.9745187015121873,
524
+ 0.8548335912371546,
525
+ 0.16972156566241,
526
+ 0.8245729285934237,
527
+ 1.06901211839648,
528
+ 0.8750748380574906,
529
+ 1.0605384058291198,
530
+ 0.814622435544981,
531
+ 1.1662691506968674,
532
+ 1.0027045465050628,
533
+ 0.707221379699125,
534
+ 1.0,
535
+ 0.8738904193642293,
536
+ 1.0307627522011051,
537
+ 0.9112504790758761,
538
+ 1.0340966211802813
539
+ ]
540
+ ]
541
+ },
542
+ "width": 512,
543
+ "in_features": 262,
544
+ "out_features": 13,
545
+ "depth": 4,
546
+ "padding": 524,
547
+ "parameters": 1084073,
548
+ "cert_evals": {
549
+ "36": 0.49367091059684753,
550
+ "72": 0.4556962251663208,
551
+ "108": 0.40506330132484436,
552
+ "255": 0.2405063360929489
553
+ }
554
+ }
UCI_N4/sdp/runs/arrhythmia/fold_1/result.json ADDED
@@ -0,0 +1,554 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 13,
3
+ "best_val_acc": 0.5263157894736842,
4
+ "test_acc": 0.4858156028368794,
5
+ "train_size": 113,
6
+ "val_size": 57,
7
+ "test_size": 282,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.08236052831858409,
12
+ 0.04887446902654869,
13
+ 0.0825547600000001,
14
+ 0.07080902389380533,
15
+ 0.06969351327433632,
16
+ -0.02017880672566372,
17
+ 0.0033134920353982203,
18
+ -0.0904622607964602,
19
+ 0.0008566455575221136,
20
+ 0.05502761778761062,
21
+ 0.0029605046017698983,
22
+ 0.16618478141592918,
23
+ 0.10348846991150445,
24
+ -0.12880789292035386,
25
+ 0.001393306194690269,
26
+ -0.009972053097345045,
27
+ -0.13480514867256632,
28
+ 0.15853807787610613,
29
+ -0.022554120353982243,
30
+ -0.17088875221238942,
31
+ -0.04703600000000003,
32
+ -0.02112876106194702,
33
+ 0.14790371681415893,
34
+ 0.0665928778761063,
35
+ 0.0665928778761063,
36
+ 0.09438671238938028,
37
+ -0.033913831858407135,
38
+ -0.05746374070796462,
39
+ 0.020589044247787618,
40
+ -0.08296883185840712,
41
+ -0.016433217699115002,
42
+ -0.02482472566371683,
43
+ -0.13408300000000029,
44
+ -0.0661125929203539,
45
+ 0.14110856637168206,
46
+ 0.19977865575221251,
47
+ 0.06659287787610634,
48
+ 0.16107630088495584,
49
+ -0.04968823575221234,
50
+ 0.16085886725663703,
51
+ -0.040819525663716834,
52
+ -0.04226484955752222,
53
+ 0.03399069026548677,
54
+ 0.08868894690265484,
55
+ 0.14110856637168143,
56
+ 0.1435154159292037,
57
+ -0.04703600000000003,
58
+ -2.920353984457933e-07,
59
+ -0.02112876106194691,
60
+ 0.1997786557522125,
61
+ -0.14194291681415921,
62
+ 0.11196102831858407,
63
+ 0.0592675752212388,
64
+ 0.09347194690265491,
65
+ -0.04703600000000003,
66
+ 0.13773737168141595,
67
+ -0.1056450000000003,
68
+ -0.06659289999999989,
69
+ 0.0665928778761063,
70
+ -0.06659289999999989,
71
+ 0.0665928778761063,
72
+ 0.09438671238938029,
73
+ -0.09931298230088502,
74
+ -0.11574543716814155,
75
+ 0.19007244637168158,
76
+ 0.006741415929203616,
77
+ -0.17417296814159283,
78
+ -2.920353982846636e-07,
79
+ -0.04703600000000003,
80
+ -0.04703600000000003,
81
+ 0.027216715044247736,
82
+ 0.14110856637168231,
83
+ -0.00288054867256639,
84
+ 0.04904841858407081,
85
+ 0.02098572858407086,
86
+ -0.1192364601769909,
87
+ -0.0031704955752213143,
88
+ 0.01358514159292034,
89
+ -0.06659289999999989,
90
+ 0.014341504424779012,
91
+ -0.04703600000000003,
92
+ -0.04703600000000003,
93
+ -0.04703600000000003,
94
+ 0.07784732743362836,
95
+ 0.10888657327433629,
96
+ -0.1186584123893806,
97
+ -0.02180679646017706,
98
+ -0.07482919999999994,
99
+ 0.08863622212389385,
100
+ 0.13608353008849555,
101
+ 0.08948672566371674,
102
+ 1.0619469028597977e-07,
103
+ -0.09438650000000005,
104
+ -0.02112876106194696,
105
+ 0.09014838938053121,
106
+ -0.048498132743362864,
107
+ 0.05329288938053096,
108
+ 0.07878135752212394,
109
+ 0.006330884955752202,
110
+ 0.04712901946902665,
111
+ 0.11292442477876118,
112
+ -0.09438650000000005,
113
+ 0.09438671238938054,
114
+ -0.03861907964601756,
115
+ 1.0619469029580476e-07,
116
+ -0.09438650000000005,
117
+ 0.06704106194690229,
118
+ -0.07101396460177,
119
+ 0.11338092035398238,
120
+ 0.022629575221239016,
121
+ 0.15994504424778788,
122
+ 0.039176644247788044,
123
+ 0.11334270796460184,
124
+ -0.100392831858407,
125
+ 0.0665928778761063,
126
+ -0.08165009999999992,
127
+ 1.0619469028597977e-07,
128
+ 0.027216715044247736,
129
+ -0.0211287610619469,
130
+ 0.007675044247787407,
131
+ 0.017898353982300903,
132
+ 0.022447520353982425,
133
+ -0.10415006194690236,
134
+ -0.06118739999999991,
135
+ -0.031867106194690256,
136
+ 0.0665928778761063,
137
+ 0.0386198407079645,
138
+ -0.06659289999999989,
139
+ 0.06704106194690229,
140
+ 0.03697516814159319,
141
+ -0.044993100884955714,
142
+ -0.005112693362831841,
143
+ -0.08742769999999993,
144
+ -0.04059785840707965,
145
+ 0.027216715044247736,
146
+ 0.1411085663716819,
147
+ 0.13608353008849491,
148
+ 0.03589945132743362,
149
+ -0.0453806460176991,
150
+ 0.003572176991150533,
151
+ 0.05211161769911493,
152
+ -0.012922732743362846,
153
+ 0.1411085663716814,
154
+ -0.04703600000000003,
155
+ 0.1997786557522125,
156
+ 0.14790371681415954,
157
+ 0.14316932831858414,
158
+ 0.03571657522123903,
159
+ -0.10441322884955753,
160
+ -0.23222040176991168,
161
+ -0.03493910442477871,
162
+ 0.05546864601769913,
163
+ 0.12581869469026555,
164
+ -0.18030577079646018,
165
+ -0.07161228646017702,
166
+ -0.03718444513274338,
167
+ 0.013523787610619589,
168
+ 0.10059417451327425,
169
+ 0.01624747876106193,
170
+ 0.05021323893805318,
171
+ -0.05147623362831883,
172
+ 0.1827229362831858,
173
+ 0.0034618557522124397,
174
+ 0.05241511327433623,
175
+ 0.030558143362831823,
176
+ -0.19202160176991148,
177
+ 0.11133997495575228,
178
+ 0.12129543628318586,
179
+ 0.060097776106194795,
180
+ 0.11579815929203502,
181
+ -0.027196398230088462,
182
+ 0.17599128230088495,
183
+ -0.1195051539823009,
184
+ 0.18247482389380532,
185
+ 0.06219380353982303,
186
+ -0.09025506017699113,
187
+ 0.08350311504424779,
188
+ 0.1271729522123894,
189
+ -0.0951591353982304,
190
+ 0.10388311504424796,
191
+ 0.04703600000000003,
192
+ -0.14397143362831855,
193
+ -0.056712807079646044,
194
+ 0.11911974769911506,
195
+ 0.07255731355752211,
196
+ 0.17956833628318594,
197
+ 0.03657456283185836,
198
+ -0.12767188938053103,
199
+ -0.21526490619469008,
200
+ 0.019409734513274046,
201
+ -0.20038580796460184,
202
+ 0.13453505858407078,
203
+ -0.20150050008849554,
204
+ -0.10956924336283183,
205
+ -0.1755137388495575,
206
+ 0.07771356637168146,
207
+ 0.1258815132743363,
208
+ 0.05789021663716825,
209
+ 0.059674265486725525,
210
+ 0.04250356814159293,
211
+ 0.18101372743362842,
212
+ -0.08988732212389382,
213
+ 0.148077411681416,
214
+ 0.041530495575221225,
215
+ -0.07796867964601775,
216
+ -0.08606286725663721,
217
+ 0.216610610619469,
218
+ 0.09511035132743359,
219
+ -0.05938040707964593,
220
+ 0.0625599000000001,
221
+ -0.09312924070796465,
222
+ -0.07196051769911511,
223
+ 0.13021555911504423,
224
+ 0.10358608645132746,
225
+ -0.0039450442477876055,
226
+ 0.015811640707964647,
227
+ 0.042050546725663725,
228
+ -0.11399942584070796,
229
+ 0.01275024778761036,
230
+ -0.012157897345132696,
231
+ -0.07146561415929208,
232
+ -0.03644905008849562,
233
+ -0.0460240963716814,
234
+ -0.04567296300884947,
235
+ -0.0159320159292035,
236
+ -0.020865886725663647,
237
+ 0.006243656991150445,
238
+ -0.04104453495575228,
239
+ 0.04250217699115046,
240
+ 0.034307366371681414,
241
+ -0.11968876460176998,
242
+ -0.0937977030973451,
243
+ -0.007898124601769923,
244
+ -0.06254813724778759,
245
+ 0.027666705132743385,
246
+ -0.0678103380530974,
247
+ 0.0033648314159292177,
248
+ 0.014861656991150381,
249
+ -0.08490639823008855,
250
+ 0.06213639999999999,
251
+ 0.10985744247787621,
252
+ -0.1141806185840708,
253
+ -0.0051085477876106,
254
+ -0.07652198922123891,
255
+ 0.1186390026548673,
256
+ -0.006018964601769793,
257
+ -0.03378361716814159,
258
+ 0.011641800000000063,
259
+ -0.06094139999999994,
260
+ 0.1415026725663717,
261
+ -0.08340849911504429,
262
+ -0.021807159292035423,
263
+ -0.08355237141592924,
264
+ 0.10080485079646004,
265
+ -0.0028213893805309528,
266
+ -0.039560768141592914,
267
+ -0.03811751592920355,
268
+ 0.06180052389380527,
269
+ 0.08721472743362838,
270
+ -0.045456217699115044,
271
+ -0.04452998026548677,
272
+ -0.08741183716814158
273
+ ]
274
+ ],
275
+ "std": [
276
+ [
277
+ 1.0288523625377175,
278
+ 0.9926765498781311,
279
+ 1.5821926864265932,
280
+ 1.2345480341843558,
281
+ 1.0919259987637373,
282
+ 0.8553411989728208,
283
+ 0.9770372253740158,
284
+ 1.0941619685910755,
285
+ 0.9070109264400832,
286
+ 1.1660151450666374,
287
+ 0.82811358045681,
288
+ 0.8585451804478106,
289
+ 0.9271539318095082,
290
+ 0.826139795075132,
291
+ 0.9407871254954377,
292
+ 1.1098127265333941,
293
+ 0.9673996715099642,
294
+ 1.0170784936919917,
295
+ 0.7160692020317576,
296
+ 0.8881539469849713,
297
+ 1.0,
298
+ 0.8944357999064094,
299
+ 1.5353137244867066,
300
+ 1.409505785723462,
301
+ 1.4095057857234625,
302
+ 1.4063287585864295,
303
+ 0.8810006273224485,
304
+ 0.9386543902953636,
305
+ 0.9544080465249254,
306
+ 0.605561339519823,
307
+ 0.41738930632162535,
308
+ 0.9435148318250272,
309
+ 1.0,
310
+ 0.7880462841530468,
311
+ 1.9911349325902201,
312
+ 1.9844233966366362,
313
+ 1.4095057857234636,
314
+ 1.494834216304884,
315
+ 0.8945327921343991,
316
+ 1.0465252306595956,
317
+ 0.9657902518204129,
318
+ 0.8818849232826983,
319
+ 1.01289922968906,
320
+ 0.9542609489006632,
321
+ 1.9911349325902201,
322
+ 1.303101066939662,
323
+ 1.0,
324
+ 0.9988936769842933,
325
+ 0.8944357999064099,
326
+ 1.9844233966366385,
327
+ 0.9721978598866062,
328
+ 0.9751070654641969,
329
+ 1.053405494669145,
330
+ 1.2277188687789828,
331
+ 1.0,
332
+ 0.9710532649972081,
333
+ 1.0,
334
+ 1.0,
335
+ 1.4095057857234625,
336
+ 1.0,
337
+ 1.409505785723463,
338
+ 1.4063287585864295,
339
+ 0.9944538524514821,
340
+ 1.0084398738408038,
341
+ 1.096956593110858,
342
+ 0.9848747659663566,
343
+ 1.0176485758563296,
344
+ 0.9988936769842915,
345
+ 1.0,
346
+ 1.0,
347
+ 1.1521380745389784,
348
+ 1.9911349325902201,
349
+ 0.8886796764360778,
350
+ 1.0626176220464763,
351
+ 0.9820129092696263,
352
+ 0.48071756015968203,
353
+ 0.8052609158630751,
354
+ 0.9014845427415126,
355
+ 1.0,
356
+ 1.0421263616247836,
357
+ 1.0,
358
+ 1.0,
359
+ 1.0,
360
+ 1.0603166366167238,
361
+ 1.3948018100222412,
362
+ 1.0002378777841179,
363
+ 1.0521891063258038,
364
+ 1.0,
365
+ 1.170667828978199,
366
+ 1.6220790112596297,
367
+ 1.3004892166096398,
368
+ 0.9988939483461562,
369
+ 1.0,
370
+ 0.8944357999064098,
371
+ 1.2549059943840741,
372
+ 0.9010506624821365,
373
+ 1.2640911636544077,
374
+ 0.947031285603356,
375
+ 0.991260918816901,
376
+ 1.3300447893255651,
377
+ 1.1497030038124454,
378
+ 1.0,
379
+ 1.4063287585864277,
380
+ 0.8174198991670485,
381
+ 0.9988939483461566,
382
+ 1.0,
383
+ 1.217866674742133,
384
+ 0.8282680988206665,
385
+ 1.073085103116072,
386
+ 0.9693454139903576,
387
+ 1.7234040703162494,
388
+ 1.1056144342459158,
389
+ 1.074119172644369,
390
+ 0.6071170412907283,
391
+ 1.409505785723462,
392
+ 1.0,
393
+ 0.9988939483461562,
394
+ 1.1521380745389787,
395
+ 0.8944357999064119,
396
+ 1.058370875443875,
397
+ 1.0846522644237848,
398
+ 1.0598613115637294,
399
+ 0.5613288969768316,
400
+ 1.0,
401
+ 1.077530223972941,
402
+ 1.4095057857234625,
403
+ 1.15083399388167,
404
+ 1.0,
405
+ 1.2178666747421318,
406
+ 1.0966395583377115,
407
+ 1.0389053330759344,
408
+ 1.0429545495698374,
409
+ 1.0,
410
+ 1.0244696199828591,
411
+ 1.152138074538978,
412
+ 1.9911349325902201,
413
+ 1.6220790112596353,
414
+ 1.1329428844818097,
415
+ 1.0304640926757396,
416
+ 1.0027828154445004,
417
+ 1.4038062005460157,
418
+ 1.0648539403871593,
419
+ 1.9911349325902201,
420
+ 1.0,
421
+ 1.9844233966366391,
422
+ 1.5353137244867094,
423
+ 0.6866407429573802,
424
+ 0.9470876233472572,
425
+ 0.8928451459276403,
426
+ 1.3503062413436946,
427
+ 0.39441056751713693,
428
+ 1.0739060999830787,
429
+ 0.8074286630470415,
430
+ 0.8622816943277237,
431
+ 0.9235511168325403,
432
+ 0.8884646840941383,
433
+ 0.9253177369109523,
434
+ 1.0067482855890655,
435
+ 0.8717444615689396,
436
+ 1.7004798113300974,
437
+ 1.2451967529281143,
438
+ 1.0189016467998342,
439
+ 0.9159576992318523,
440
+ 0.9716842292520014,
441
+ 0.8537203439878127,
442
+ 0.6934639134127168,
443
+ 0.6814900866218891,
444
+ 1.08628728041417,
445
+ 0.8695100152450093,
446
+ 1.7244969164094923,
447
+ 0.9957413253735008,
448
+ 0.886998298843266,
449
+ 1.0086098935045376,
450
+ 0.9474117590718318,
451
+ 0.9527864599550645,
452
+ 0.8622024829086022,
453
+ 0.928715896349544,
454
+ 1.165972778898159,
455
+ 1.1444020655792773,
456
+ 1.249832703644339,
457
+ 1.0,
458
+ 1.04414181114218,
459
+ 0.7888691092407913,
460
+ 0.8896110919230731,
461
+ 0.8385172959457787,
462
+ 0.6963004767756463,
463
+ 1.0524770129026086,
464
+ 0.8728215158868736,
465
+ 1.2422671085343606,
466
+ 1.0395955941659785,
467
+ 0.9729248895409327,
468
+ 0.942112878700215,
469
+ 0.9029124312015971,
470
+ 0.9945356002953412,
471
+ 0.9067257721352653,
472
+ 0.6559269963983796,
473
+ 1.0530222495928638,
474
+ 0.7742650861348659,
475
+ 1.7415209866320729,
476
+ 0.31751695199855035,
477
+ 0.9401556411866103,
478
+ 0.9925662855482592,
479
+ 0.9703437391049544,
480
+ 0.9315271035229352,
481
+ 0.76726349356305,
482
+ 1.113451820498087,
483
+ 1.5950728246019172,
484
+ 0.9108834606609704,
485
+ 0.6187680270209445,
486
+ 1.0,
487
+ 1.026218169309107,
488
+ 0.9226908311101232,
489
+ 1.3695879042350074,
490
+ 1.390915117042367,
491
+ 0.9165066682832561,
492
+ 1.0788295714407763,
493
+ 0.8648263176100378,
494
+ 0.9635758583333331,
495
+ 0.8878642706591297,
496
+ 0.9006687498171835,
497
+ 0.8634669309414519,
498
+ 1.0263681887473621,
499
+ 1.1035216758671196,
500
+ 0.9668823371087334,
501
+ 0.9093839574625667,
502
+ 1.2537251227686863,
503
+ 0.925393016008483,
504
+ 0.9198488449490679,
505
+ 0.9988290268424753,
506
+ 0.1771101235529094,
507
+ 1.05614751420039,
508
+ 0.9497863099739803,
509
+ 1.0994839009481026,
510
+ 0.92792429034674,
511
+ 0.9973731985207415,
512
+ 1.4008749618490997,
513
+ 0.9833759189369512,
514
+ 0.7900467121392818,
515
+ 0.5512800744398914,
516
+ 1.0,
517
+ 1.160435495736531,
518
+ 0.840523823247663,
519
+ 1.0569742675732663,
520
+ 0.8576934466322704,
521
+ 0.9349861286126709,
522
+ 0.8587290535040432,
523
+ 0.9574488028099564,
524
+ 0.8825111948837125,
525
+ 1.0,
526
+ 0.9946462418130932,
527
+ 0.8401625258336195,
528
+ 1.0609041780534152,
529
+ 0.8625411201961046,
530
+ 0.8578849236354916,
531
+ 0.9245113485505083,
532
+ 0.9397104471617286,
533
+ 0.949988633400937,
534
+ 1.4949439323664353,
535
+ 1.0752730715733643,
536
+ 0.854508526946672,
537
+ 1.0304209489391347,
538
+ 0.9286338973772724
539
+ ]
540
+ ]
541
+ },
542
+ "width": 512,
543
+ "in_features": 262,
544
+ "out_features": 13,
545
+ "depth": 4,
546
+ "padding": 524,
547
+ "parameters": 1084073,
548
+ "cert_evals": {
549
+ "36": 0.38596493005752563,
550
+ "72": 0.2982456088066101,
551
+ "108": 0.24561403691768646,
552
+ "255": 0.08771929889917374
553
+ }
554
+ }
UCI_N4/sdp/runs/arrhythmia/fold_2/result.json ADDED
@@ -0,0 +1,554 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 60,
3
+ "best_val_acc": 0.5538461538461539,
4
+ "test_acc": 0.6496350364963503,
5
+ "train_size": 113,
6
+ "val_size": 65,
7
+ "test_size": 274,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.003089986725663709,
12
+ -0.004440814159291977,
13
+ 0.06255539469026555,
14
+ 0.0030673203539822954,
15
+ 0.001728016814159293,
16
+ 0.11026861433628313,
17
+ 0.017892446017699123,
18
+ -0.06960080176991157,
19
+ 0.039233834283185866,
20
+ 0.15144875398230093,
21
+ 0.006497817787610628,
22
+ -0.01399969203539821,
23
+ 0.12535314601769912,
24
+ 0.032636741592920446,
25
+ -0.04566848761061949,
26
+ -0.12298024778761062,
27
+ -0.000969959292035392,
28
+ 0.11890371504424775,
29
+ -0.09021629999999985,
30
+ -0.11451322123893802,
31
+ -0.04703600000000003,
32
+ 0.06338747787610569,
33
+ -0.1056450000000003,
34
+ -0.06659289999999989,
35
+ 0.0665928778761063,
36
+ -0.09438650000000005,
37
+ -0.04968765486725668,
38
+ 0.10877121769911505,
39
+ -0.018068128318584065,
40
+ -0.08296883185840709,
41
+ -0.05587280000000011,
42
+ -0.06895776106194693,
43
+ -2.920353983278935e-07,
44
+ -0.013222389380530894,
45
+ -0.04703600000000003,
46
+ 0.06659287787610632,
47
+ -0.06659289999999989,
48
+ -0.1252820000000002,
49
+ 0.010099320973451271,
50
+ 0.07353538053097344,
51
+ -0.007326469911504469,
52
+ -0.07684545132743385,
53
+ -0.0339906548672566,
54
+ 0.05784047787610613,
55
+ 0.14110856637168143,
56
+ 3.805309734868323e-07,
57
+ -0.04703600000000003,
58
+ -0.06704164601769919,
59
+ -0.02112876106194691,
60
+ -0.06659289999999989,
61
+ 0.15620863893805323,
62
+ -0.03053643008849556,
63
+ -0.18165605309734498,
64
+ -0.11233752212389378,
65
+ -0.04703600000000003,
66
+ -0.016779973451327427,
67
+ -0.021128761061946985,
68
+ -0.06659289999999989,
69
+ 0.0665928778761063,
70
+ -0.06659289999999989,
71
+ -0.06659289999999989,
72
+ -0.09438650000000005,
73
+ -0.00463133628318579,
74
+ -0.07507774690265485,
75
+ -0.0007694676106195044,
76
+ -0.08089127433628311,
77
+ -0.10792991415929203,
78
+ -2.9203539847723323e-07,
79
+ -0.04703600000000003,
80
+ -0.04703600000000003,
81
+ 0.027216715044247893,
82
+ -0.04703600000000003,
83
+ -0.02592799999999999,
84
+ 0.08057962389380531,
85
+ 0.024038425752212503,
86
+ -0.16465999999999992,
87
+ -0.07926050000000014,
88
+ -0.09237758407079648,
89
+ -0.06659289999999989,
90
+ -0.043025663716814114,
91
+ 0.14110856637168245,
92
+ 0.1411085663716826,
93
+ -0.04703600000000003,
94
+ -0.023750336283185847,
95
+ 0.03126479168141594,
96
+ 0.008899934513274312,
97
+ -0.02743449557522126,
98
+ 0.06331698053097352,
99
+ 0.05539779646017699,
100
+ 0.027216715044247736,
101
+ 0.017897150442477798,
102
+ 1.0619469029187476e-07,
103
+ 1.061946903233147e-07,
104
+ -0.02112876106194691,
105
+ -0.1502479999999999,
106
+ -0.016447008849557545,
107
+ -0.0054378495575221125,
108
+ 0.07474130442477876,
109
+ -0.07807693805309734,
110
+ -0.07854839999999999,
111
+ -0.008790955752212368,
112
+ 1.0619469031152472e-07,
113
+ 1.0619469029973474e-07,
114
+ 0.038619840707964564,
115
+ 1.061946903233147e-07,
116
+ 1.0619469035868464e-07,
117
+ -2.920353983829134e-07,
118
+ -0.06884565486725683,
119
+ -0.043006230088495565,
120
+ 0.13900964601769922,
121
+ -0.06902842477876096,
122
+ -0.06529410000000001,
123
+ -0.07149334513274326,
124
+ -0.043025663716814044,
125
+ -0.06659289999999989,
126
+ 0.02721671504424799,
127
+ 1.0619469029187476e-07,
128
+ -0.08165009999999992,
129
+ -0.1056450000000003,
130
+ -0.0844234336283186,
131
+ 0.045172380530973465,
132
+ 0.08091592477876108,
133
+ -0.08034439823008824,
134
+ -0.06118739999999991,
135
+ 0.009105318584070807,
136
+ 0.0665928778761063,
137
+ 0.03861984070796471,
138
+ -0.06659289999999989,
139
+ -2.920353983475435e-07,
140
+ -0.01561157522123892,
141
+ 0.034667146902654884,
142
+ 0.04805644646017698,
143
+ 0.07649909380531038,
144
+ 0.0778107902654868,
145
+ -0.08165009999999992,
146
+ -0.04703600000000003,
147
+ 0.027216715044247736,
148
+ 0.003988389380530976,
149
+ 0.07484829203539822,
150
+ 0.06071553097345137,
151
+ 0.014212502654867237,
152
+ 0.06978295752212389,
153
+ -0.04703600000000003,
154
+ -0.04703600000000003,
155
+ -0.06659289999999989,
156
+ -0.1056450000000003,
157
+ -0.05670110707964598,
158
+ 0.09375696460176995,
159
+ -0.16628776973451334,
160
+ -0.004178826548672555,
161
+ -0.07220739999999994,
162
+ -0.06694404424778763,
163
+ -0.06819787345132745,
164
+ -0.049705195575221274,
165
+ -0.11667001238938055,
166
+ -0.12676487345132748,
167
+ 0.06602797345132745,
168
+ 0.0027255099115044237,
169
+ 0.08367987168141594,
170
+ -0.07531826548672561,
171
+ 0.06618380000000008,
172
+ -0.05077870088495575,
173
+ -0.03939802035398229,
174
+ 0.0725209725663717,
175
+ 0.018818907079646008,
176
+ -0.0012129309734513318,
177
+ 0.08232463584070795,
178
+ 0.06279675221238941,
179
+ 0.05451436991150446,
180
+ -0.09364632743362859,
181
+ -0.013597840707964663,
182
+ -0.02791582300884959,
183
+ 0.02277181946902653,
184
+ 0.09624579256637165,
185
+ 0.10685669557522126,
186
+ 0.05720445840707966,
187
+ -0.11690305221238939,
188
+ -0.07600262831858408,
189
+ 0.20486032743362856,
190
+ -0.11598514159292016,
191
+ 0.04703600000000003,
192
+ 0.12372530088495573,
193
+ 0.07733639557522128,
194
+ 0.009731815840707961,
195
+ 0.06515634630088495,
196
+ -0.004099914159292028,
197
+ -0.062444362831858426,
198
+ -0.14432490088495575,
199
+ 0.010303688495575204,
200
+ -0.03996258407079658,
201
+ -0.01723771946902648,
202
+ -0.03748595911504427,
203
+ -0.09338390796460176,
204
+ -0.12455748761061945,
205
+ -0.07069998663716814,
206
+ 0.09306433097345132,
207
+ 0.05574491150442479,
208
+ 0.05271592371681417,
209
+ -0.10488400000000016,
210
+ 0.0725061,
211
+ -0.06092212743362833,
212
+ -0.021001579646017662,
213
+ 0.08582514876106195,
214
+ 0.05783091212389381,
215
+ 0.07796875840707959,
216
+ -0.0484065486725664,
217
+ -0.06359218141592915,
218
+ 0.12465353274336273,
219
+ -0.03740971681415926,
220
+ -0.006256027433628239,
221
+ 0.02847770973451326,
222
+ 0.03523589380530972,
223
+ -0.007258076106194675,
224
+ 0.029468245840707955,
225
+ 0.07720809823008848,
226
+ -0.029801646017699017,
227
+ -0.07590199938053097,
228
+ -0.0023667877876106243,
229
+ -0.06193052212389384,
230
+ 0.0729473,
231
+ -0.08944441592920359,
232
+ -0.008905622654867247,
233
+ -0.09599750318584069,
234
+ -0.11731536725663715,
235
+ 0.03799221946902657,
236
+ 0.04264000707964609,
237
+ -0.05476776486725663,
238
+ -0.08099349336283189,
239
+ -0.06403644955752204,
240
+ 0.0510427,
241
+ -0.1728837920353984,
242
+ 0.04379192212389381,
243
+ -0.08503633221238939,
244
+ -0.04843164778761059,
245
+ -0.013288855929203541,
246
+ 0.05900416725663712,
247
+ 0.01502987168141596,
248
+ -0.028499033982300897,
249
+ -0.06898648672566376,
250
+ 0.06213639999999999,
251
+ -0.020727761061946872,
252
+ 0.056635334513274314,
253
+ -0.009026141592920364,
254
+ 0.03156841769911506,
255
+ -0.12126076106194686,
256
+ 0.06353122123893817,
257
+ 0.031937667522123854,
258
+ 0.029336698938053133,
259
+ 0.12508993982300817,
260
+ -0.07582650442477877,
261
+ 0.006734969026548675,
262
+ 0.06509837044247789,
263
+ 0.03657155663716816,
264
+ -0.13086254787610632,
265
+ -0.01249529203539823,
266
+ 0.041217141592920364,
267
+ 0.050712616814159305,
268
+ 0.008828665486725618,
269
+ -0.04774530973451326,
270
+ -0.06531424955752214,
271
+ 0.08627439557522125,
272
+ 0.019008834867256633
273
+ ]
274
+ ],
275
+ "std": [
276
+ [
277
+ 0.9244692810470073,
278
+ 0.9993356910018533,
279
+ 1.1547522998507793,
280
+ 0.9432810092169331,
281
+ 1.03584004279498,
282
+ 0.8753158130277445,
283
+ 1.0465755215467378,
284
+ 0.9102607240673849,
285
+ 1.023778543447583,
286
+ 0.9297280045159075,
287
+ 1.0069835198754635,
288
+ 0.9525566546794436,
289
+ 0.9399759480360307,
290
+ 0.9978150756585966,
291
+ 0.9862811329995884,
292
+ 0.9613244275752023,
293
+ 1.111865207612389,
294
+ 0.9715796850385696,
295
+ 1.0,
296
+ 1.0813226579822182,
297
+ 1.0,
298
+ 1.2592635987036094,
299
+ 1.0,
300
+ 1.0,
301
+ 1.4095057857234625,
302
+ 1.0,
303
+ 1.010538238524329,
304
+ 1.0722512669094082,
305
+ 1.0593646908068974,
306
+ 0.605561339519823,
307
+ 1.0,
308
+ 0.9556792785074675,
309
+ 0.9988936769842924,
310
+ 0.9607982608538026,
311
+ 1.0,
312
+ 1.4095057857234632,
313
+ 1.0,
314
+ 1.0,
315
+ 0.972373648410722,
316
+ 1.0584533172538098,
317
+ 1.0284056325027326,
318
+ 0.8751294762374062,
319
+ 0.7194469320515607,
320
+ 0.9753483226530357,
321
+ 1.9911349325902201,
322
+ 0.99889397212978,
323
+ 1.0,
324
+ 0.7094990007768706,
325
+ 0.8944357999064104,
326
+ 1.0,
327
+ 0.9004941973725803,
328
+ 1.0121581074927941,
329
+ 0.761525664661198,
330
+ 0.6638398438080123,
331
+ 1.0,
332
+ 1.0084273596642825,
333
+ 0.8944357999064123,
334
+ 1.0,
335
+ 1.4095057857234632,
336
+ 1.0,
337
+ 1.0,
338
+ 1.0,
339
+ 1.0674172345021198,
340
+ 1.0415595393603108,
341
+ 0.9952640371583976,
342
+ 0.7847375185646767,
343
+ 1.0253922671299165,
344
+ 0.9988936769842935,
345
+ 1.0,
346
+ 1.0,
347
+ 1.1521380745389769,
348
+ 1.0,
349
+ 0.9380600926852771,
350
+ 0.9688329579782285,
351
+ 1.0699750013871834,
352
+ 1.0,
353
+ 1.0,
354
+ 0.9022130416875166,
355
+ 1.0,
356
+ 0.8547515543653855,
357
+ 1.9911349325902201,
358
+ 1.9911349325902201,
359
+ 1.0,
360
+ 0.9833161542151768,
361
+ 0.9113836368578456,
362
+ 1.0154070458101938,
363
+ 0.8175726795277899,
364
+ 1.0291658658053822,
365
+ 1.0023879541161114,
366
+ 1.1521380745389784,
367
+ 1.0666606471785436,
368
+ 0.9988939483461562,
369
+ 0.9988939483461564,
370
+ 0.8944357999064111,
371
+ 1.0,
372
+ 1.0194849042181624,
373
+ 0.9377289254070391,
374
+ 0.9868393622488469,
375
+ 0.7115324821514019,
376
+ 1.0,
377
+ 0.9291878599599749,
378
+ 0.9988939483461571,
379
+ 0.9988939483461564,
380
+ 1.150833993881672,
381
+ 0.9988939483461564,
382
+ 0.9988939483461563,
383
+ 0.9988936769842928,
384
+ 0.8446756150368765,
385
+ 0.8840822390425243,
386
+ 0.879273891482901,
387
+ 0.356357040154056,
388
+ 1.0,
389
+ 0.8575361470050674,
390
+ 0.8547515543653872,
391
+ 1.0,
392
+ 1.1521380745389762,
393
+ 0.9988939483461562,
394
+ 1.0,
395
+ 1.0,
396
+ 0.7707096318942795,
397
+ 0.9479029615796615,
398
+ 0.8861435214681488,
399
+ 0.709392406059319,
400
+ 1.0,
401
+ 0.9648083778490988,
402
+ 1.4095057857234619,
403
+ 1.1508339938816696,
404
+ 1.0,
405
+ 0.9988936769842918,
406
+ 0.8265732991714976,
407
+ 1.0190844405952648,
408
+ 0.9459831021380053,
409
+ 1.7348381185160544,
410
+ 1.1517740759366022,
411
+ 1.0,
412
+ 1.0,
413
+ 1.152138074538978,
414
+ 0.912843060712004,
415
+ 1.1388119070973806,
416
+ 0.9915799039109703,
417
+ 1.002719667279991,
418
+ 1.085125621845705,
419
+ 1.0,
420
+ 1.0,
421
+ 1.0,
422
+ 1.0,
423
+ 1.5001714286910226,
424
+ 0.9966194693620798,
425
+ 0.9443805992812078,
426
+ 0.8655175815339226,
427
+ 1.0,
428
+ 0.7897012658620092,
429
+ 1.1164175335449071,
430
+ 1.264530190302258,
431
+ 0.8921583865445091,
432
+ 1.0648052330194941,
433
+ 0.8695758038727032,
434
+ 0.8660581580725691,
435
+ 0.8367831000825393,
436
+ 0.37197924168302665,
437
+ 1.0,
438
+ 0.9262178979224102,
439
+ 0.9242646117464632,
440
+ 0.973591105652927,
441
+ 0.9951600891998066,
442
+ 1.1111862475284577,
443
+ 0.6670563380647561,
444
+ 0.9442962334551489,
445
+ 0.990332316811185,
446
+ 0.480719441273429,
447
+ 1.223234975369157,
448
+ 0.940394811395897,
449
+ 0.9089632031900003,
450
+ 1.0458338698053655,
451
+ 0.9721165818563446,
452
+ 1.374767108546496,
453
+ 0.8594004341053223,
454
+ 0.7653673558229712,
455
+ 0.6670525311692612,
456
+ 0.645642563256581,
457
+ 1.0,
458
+ 0.891254315503885,
459
+ 1.0775980834755503,
460
+ 1.007431548670928,
461
+ 0.9530753484316439,
462
+ 1.4811962251096449,
463
+ 1.2176806384389702,
464
+ 0.9602107117788192,
465
+ 0.8795846242039457,
466
+ 1.1116750216535782,
467
+ 0.9501349187678776,
468
+ 1.0821885258200035,
469
+ 1.1407026156836266,
470
+ 0.9231893015164008,
471
+ 0.8990327480493145,
472
+ 0.6422405879838027,
473
+ 0.9092214790537131,
474
+ 0.9351958368508632,
475
+ 1.0,
476
+ 1.0,
477
+ 0.9288775753611616,
478
+ 0.8531876075690629,
479
+ 1.034017858801366,
480
+ 1.0285706599327553,
481
+ 1.5382840820664052,
482
+ 1.0793433921827003,
483
+ 0.7014984131399681,
484
+ 0.9478974831267535,
485
+ 0.8121083950620509,
486
+ 0.5317226069000799,
487
+ 0.877495299738119,
488
+ 1.105656776922663,
489
+ 0.9679617815757274,
490
+ 0.7155463726091819,
491
+ 1.108302722756925,
492
+ 1.0944778308312668,
493
+ 0.7749616919771513,
494
+ 0.8850563716056123,
495
+ 0.5693811287198752,
496
+ 1.0,
497
+ 0.9220528856937216,
498
+ 0.8553127512283658,
499
+ 0.9975197765961968,
500
+ 0.8796722204092665,
501
+ 1.1740947078133768,
502
+ 0.9516756586234943,
503
+ 0.9063555755946218,
504
+ 0.9537956983823893,
505
+ 0.21590336552059824,
506
+ 1.0,
507
+ 1.1291952185180558,
508
+ 1.0007499385498189,
509
+ 1.0111383561599954,
510
+ 0.9704983147288865,
511
+ 1.1385710361021162,
512
+ 0.7564588026775311,
513
+ 1.0046465692486821,
514
+ 0.9312841189336238,
515
+ 0.6375502285227569,
516
+ 1.0,
517
+ 0.829387189699574,
518
+ 1.0544363475675953,
519
+ 0.9771879250820691,
520
+ 1.0137760206245479,
521
+ 1.0423498864484522,
522
+ 0.43681029699877133,
523
+ 0.8991224001063718,
524
+ 0.8257144621838688,
525
+ 1.968770644943309,
526
+ 0.8856828178067617,
527
+ 1.0398871114616712,
528
+ 0.8345338516516961,
529
+ 0.9722595951185294,
530
+ 1.285772740124495,
531
+ 0.8915167876690523,
532
+ 0.8875667705363124,
533
+ 0.6453390579256484,
534
+ 0.9343424770462008,
535
+ 0.8887305596443167,
536
+ 1.0443061214405034,
537
+ 1.027608228431771,
538
+ 0.9189390661089004
539
+ ]
540
+ ]
541
+ },
542
+ "width": 512,
543
+ "in_features": 262,
544
+ "out_features": 13,
545
+ "depth": 4,
546
+ "padding": 524,
547
+ "parameters": 1084073,
548
+ "cert_evals": {
549
+ "36": 0.4923076927661896,
550
+ "72": 0.4769230782985687,
551
+ "108": 0.4615384638309479,
552
+ "255": 0.3076923191547394
553
+ }
554
+ }
UCI_N4/sdp/runs/arrhythmia/fold_3/result.json ADDED
@@ -0,0 +1,554 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 28,
3
+ "best_val_acc": 0.5373134328358209,
4
+ "test_acc": 0.5992647058823529,
5
+ "train_size": 113,
6
+ "val_size": 67,
7
+ "test_size": 272,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.04070993805309734,
12
+ 0.11996151327433617,
13
+ -0.07505505699115043,
14
+ -0.053473368141592904,
15
+ -0.0023036168141593112,
16
+ -0.04386066761061949,
17
+ 0.1000648973451327,
18
+ 0.21898467610619468,
19
+ 0.0844638663362832,
20
+ -0.21027526176991146,
21
+ 0.08278053309734511,
22
+ 0.02691175840707965,
23
+ -0.10311968407079651,
24
+ -0.019989650442477833,
25
+ -0.029568291150442447,
26
+ 0.06979861946902657,
27
+ -0.09989179115044242,
28
+ -0.0017227557522123856,
29
+ -2.2654867243656462e-07,
30
+ 0.06518417699115044,
31
+ -0.04703600000000003,
32
+ -0.1056450000000003,
33
+ -0.1056450000000003,
34
+ 0.19977865575221251,
35
+ 0.0665928778761063,
36
+ 0.09438671238938035,
37
+ -0.10331811504424784,
38
+ -0.11287559292035391,
39
+ 0.1063068938053097,
40
+ 0.04291548672566383,
41
+ -0.05587280000000011,
42
+ -0.032180318584070916,
43
+ 0.06704106194690261,
44
+ -0.1718930000000004,
45
+ -0.04703600000000003,
46
+ 0.0665928778761063,
47
+ -0.06659289999999989,
48
+ 0.08948672566371665,
49
+ -0.025450121504424723,
50
+ -0.17311484513274336,
51
+ 0.07640526460176993,
52
+ 0.11526853982300869,
53
+ 0.1133023008849558,
54
+ -0.07326554867256642,
55
+ -0.04703600000000003,
56
+ 0.047838725663716816,
57
+ -0.04703600000000003,
58
+ 0.06704106194690251,
59
+ -0.02112876106194691,
60
+ -0.06659289999999989,
61
+ -0.013552253982300916,
62
+ -0.020357922123893812,
63
+ -0.027464973451327517,
64
+ -0.006002522123893788,
65
+ -0.04703600000000003,
66
+ -0.04337743362831858,
67
+ 0.14790371681415934,
68
+ 0.0665928778761063,
69
+ -0.06659289999999989,
70
+ 0.06659287787610634,
71
+ -0.06659289999999989,
72
+ 1.0619469029580476e-07,
73
+ 0.044767823008849614,
74
+ 0.08289923362831852,
75
+ -0.12235442831858409,
76
+ -0.11459614159292028,
77
+ 0.14790476371681416,
78
+ -2.9203539830824354e-07,
79
+ -0.04703600000000003,
80
+ 0.14110856637168223,
81
+ 0.027216715044247736,
82
+ -0.04703600000000003,
83
+ -0.055889752212389385,
84
+ -0.12962760265486717,
85
+ 0.10187851619469035,
86
+ -0.01324823008849549,
87
+ 0.022193132743362702,
88
+ -0.07879260176991155,
89
+ 0.0665928778761063,
90
+ 0.12907584070796485,
91
+ -0.04703600000000003,
92
+ -0.04703600000000003,
93
+ -0.04703600000000003,
94
+ -0.002639044247787606,
95
+ 0.054982569292035384,
96
+ 0.05932991150442477,
97
+ -0.06964141592920373,
98
+ -0.07482919999999994,
99
+ -0.033238396460177,
100
+ 0.13608353008849555,
101
+ 0.0894867256637167,
102
+ -0.09438650000000005,
103
+ -0.09438650000000005,
104
+ -0.1056450000000003,
105
+ 0.030049292035398203,
106
+ 0.0004219557522123656,
107
+ 0.04024157522123887,
108
+ 0.01212035575221241,
109
+ -0.06541580530973452,
110
+ -0.07854839999999999,
111
+ 0.02907596460176992,
112
+ -0.09438650000000005,
113
+ 0.09438671238938048,
114
+ -0.03861907964601766,
115
+ 1.0619469030366473e-07,
116
+ 1.0619469029580476e-07,
117
+ -0.0670416460176993,
118
+ -0.04499362831858416,
119
+ 0.0430065663716814,
120
+ 0.05495734513274337,
121
+ 0.025254761061947018,
122
+ -0.06529410000000001,
123
+ 0.06800543362831867,
124
+ -0.15775999999999976,
125
+ 0.0665928778761063,
126
+ -0.08165009999999992,
127
+ 1.0619469029580476e-07,
128
+ -0.08165009999999992,
129
+ -0.021128761061946954,
130
+ 0.0199548849557522,
131
+ -0.04005870796460183,
132
+ 0.07256339026548671,
133
+ 0.0029753097345135682,
134
+ 0.008741072566371728,
135
+ -0.12291731858407075,
136
+ 0.0665928778761063,
137
+ -0.03861907964601771,
138
+ 0.0665928778761063,
139
+ -2.9203539835933345e-07,
140
+ -0.15365226548672545,
141
+ -0.02139016460176988,
142
+ 0.03374174115044254,
143
+ -0.03278541946902662,
144
+ -0.16577226814159277,
145
+ 0.027216715044247785,
146
+ 0.14110856637168206,
147
+ -0.08165009999999992,
148
+ -0.17471278761061948,
149
+ -0.05009553982300891,
150
+ 0.10357247787610621,
151
+ 0.01421250265486715,
152
+ -0.16799606460176988,
153
+ 0.1411085663716814,
154
+ -0.04703600000000003,
155
+ 0.1997786557522125,
156
+ -0.02112876106194691,
157
+ 0.10064383539823014,
158
+ -0.09822227433628321,
159
+ 0.010812114336283181,
160
+ -0.0005969424778760985,
161
+ -0.034939104424778704,
162
+ -0.021039132743362887,
163
+ 0.1549942769911504,
164
+ -0.05473569823008849,
165
+ 0.09371048247787614,
166
+ 0.1284547699115043,
167
+ 0.08193819469026561,
168
+ -0.1894623433628318,
169
+ -0.03994628938053097,
170
+ 0.005021592920354035,
171
+ 0.06618380000000008,
172
+ 0.046780255752212445,
173
+ 0.12412912743362833,
174
+ -0.15687404504424782,
175
+ -0.04040450761061948,
176
+ 0.01819149026548674,
177
+ 0.047322232477876085,
178
+ -0.1316860601769911,
179
+ -0.08258592566371675,
180
+ 0.05638880530973452,
181
+ -0.10198681415929205,
182
+ 0.1290602176991152,
183
+ -0.03669845398230087,
184
+ -0.10499076469026546,
185
+ -0.12757559911504432,
186
+ -0.06652606637168137,
187
+ 0.05155422566371681,
188
+ 0.031605256637168136,
189
+ 0.0629123805309736,
190
+ 0.023197380530973564,
191
+ 0.04703600000000003,
192
+ -0.03599286283185842,
193
+ -0.1574473318584071,
194
+ 0.10887992823008849,
195
+ -0.053605181415929175,
196
+ -0.012299078761061958,
197
+ -0.05887616991150452,
198
+ 0.07308711769911504,
199
+ 0.09051549646017694,
200
+ -0.10846913274336303,
201
+ -0.15513741725663718,
202
+ 0.12073644318584073,
203
+ 0.05041307504424779,
204
+ 0.1529646697345132,
205
+ 0.0776218637168141,
206
+ 0.057565741592920404,
207
+ -0.17276489823008853,
208
+ -0.014984845840707986,
209
+ -0.04701723008849572,
210
+ -0.03750280353982299,
211
+ 0.06355189203539817,
212
+ 0.06636549999999998,
213
+ -0.1410115592035399,
214
+ -0.08766313362831851,
215
+ -0.09892783274336285,
216
+ -0.013420267079645989,
217
+ 0.09777304070796461,
218
+ 0.07535415840707965,
219
+ -0.10688448672566354,
220
+ 0.0625599000000001,
221
+ -0.011544922123893811,
222
+ -0.09627820707964604,
223
+ 0.08584640530973452,
224
+ 0.007022314424778771,
225
+ -0.05128431504424778,
226
+ -0.06365885663716808,
227
+ 0.02538907345132746,
228
+ 0.071253879380531,
229
+ -0.032786734513274456,
230
+ 0.0729473,
231
+ 0.04719471592920353,
232
+ 0.014598110265486715,
233
+ 0.026159213575221246,
234
+ 0.059101831504424836,
235
+ -0.07843545663716811,
236
+ 0.0003891433628318023,
237
+ 0.014624393274336253,
238
+ 0.03384382522123893,
239
+ -0.07310352920353969,
240
+ 0.0510427,
241
+ 0.14306325132743355,
242
+ -0.011243908849557487,
243
+ 0.02559352380530976,
244
+ 0.03617407230973455,
245
+ -0.012417333274336301,
246
+ -0.10102372743362834,
247
+ -0.09638603628318594,
248
+ 0.02360371292035396,
249
+ -0.0742930973451328,
250
+ -0.014339143362831862,
251
+ 0.03523714159292039,
252
+ 0.03915302300884953,
253
+ -0.08945827723893807,
254
+ -0.02228378656637163,
255
+ 0.10421852477876106,
256
+ 0.0697730088495576,
257
+ -0.12811908238938052,
258
+ -0.10229047238938055,
259
+ -0.048111653097345074,
260
+ 0.041196920353982314,
261
+ 0.10879424867256633,
262
+ -0.10693692778761064,
263
+ 0.02704163566371678,
264
+ 0.12719723849557518,
265
+ 0.1358370884955751,
266
+ -0.11345866194690264,
267
+ -0.11236356814159291,
268
+ 0.008828665486725625,
269
+ 0.04901849557522122,
270
+ 0.10906433185840712,
271
+ -0.12028646725663718,
272
+ 0.005514894867256633
273
+ ]
274
+ ],
275
+ "std": [
276
+ [
277
+ 1.0502669179700934,
278
+ 0.9792224218294541,
279
+ 0.24305352147883325,
280
+ 1.043042266446498,
281
+ 1.0744571502175468,
282
+ 0.9508826739984755,
283
+ 0.9451555552883207,
284
+ 1.1810283789026603,
285
+ 1.0064552702700122,
286
+ 1.1190882010665817,
287
+ 0.9034793296608571,
288
+ 1.1336521923679663,
289
+ 0.9786491101919341,
290
+ 0.9206985848676537,
291
+ 0.8610889538505271,
292
+ 0.9619675032812017,
293
+ 0.9308084274399617,
294
+ 0.9863758024756076,
295
+ 0.9547571784517959,
296
+ 0.9496800506935921,
297
+ 1.0,
298
+ 1.0,
299
+ 1.0,
300
+ 1.9844233966366367,
301
+ 1.4095057857234627,
302
+ 1.40632875858643,
303
+ 0.892002130496044,
304
+ 1.0129634785032875,
305
+ 0.978487303853688,
306
+ 1.1394715296586964,
307
+ 1.0,
308
+ 1.0267988761241287,
309
+ 1.217866674742132,
310
+ 1.0,
311
+ 1.0,
312
+ 1.4095057857234627,
313
+ 1.0,
314
+ 1.30048921660964,
315
+ 1.101075351501756,
316
+ 0.9423320679555461,
317
+ 0.9745566669040967,
318
+ 1.0784150005489006,
319
+ 1.3072548131334407,
320
+ 1.020520797792866,
321
+ 1.0,
322
+ 1.1116626840554256,
323
+ 1.0,
324
+ 1.2178666747421323,
325
+ 0.8944357999064103,
326
+ 1.0,
327
+ 0.9763859814864452,
328
+ 0.9882312110151381,
329
+ 0.9941548135105892,
330
+ 1.0805382570058093,
331
+ 1.0,
332
+ 0.9455390825539804,
333
+ 1.5353137244867092,
334
+ 1.4095057857234619,
335
+ 1.0,
336
+ 1.4095057857234636,
337
+ 1.0,
338
+ 0.9988939483461567,
339
+ 0.9028116049768871,
340
+ 1.0263167291591377,
341
+ 0.9964436627027657,
342
+ 0.4280387316306564,
343
+ 1.0514551909197751,
344
+ 0.9988936769842915,
345
+ 1.0,
346
+ 1.9911349325902201,
347
+ 1.152138074538978,
348
+ 1.0,
349
+ 0.9644113662850948,
350
+ 0.9806946309645141,
351
+ 0.9930268680075975,
352
+ 0.8905664891946655,
353
+ 1.0736843273720693,
354
+ 1.0058668086951204,
355
+ 1.409505785723462,
356
+ 1.3330925209888196,
357
+ 1.0,
358
+ 1.0,
359
+ 1.0,
360
+ 1.0450036005861865,
361
+ 1.3244456183776097,
362
+ 0.932189980942975,
363
+ 0.9625014477361986,
364
+ 1.0,
365
+ 1.0074707737922228,
366
+ 1.62207901125963,
367
+ 1.3004892166096393,
368
+ 1.0,
369
+ 1.0,
370
+ 1.0,
371
+ 1.0917543201475843,
372
+ 1.0127130749629136,
373
+ 1.2877909824303606,
374
+ 0.9604994075919616,
375
+ 0.8657450013263874,
376
+ 1.0,
377
+ 1.0599660091906427,
378
+ 1.0,
379
+ 1.4063287585864277,
380
+ 0.8174198991670479,
381
+ 0.9988939483461567,
382
+ 0.9988939483461567,
383
+ 0.7094990007768708,
384
+ 0.8740833234525124,
385
+ 1.010657132912493,
386
+ 0.9328151962443406,
387
+ 1.3541564903516528,
388
+ 1.0,
389
+ 1.0437864539647888,
390
+ 1.0,
391
+ 1.409505785723462,
392
+ 1.0,
393
+ 0.9988939483461567,
394
+ 1.0,
395
+ 0.8944357999064098,
396
+ 1.2065791134004533,
397
+ 1.0500123468485083,
398
+ 0.9959504427215604,
399
+ 1.0958354145667224,
400
+ 0.7400533918928887,
401
+ 0.9943642075886404,
402
+ 1.4095057857234627,
403
+ 0.8174198991670482,
404
+ 1.4095057857234627,
405
+ 0.9988936769842922,
406
+ 0.9193790839730072,
407
+ 1.0436031910295362,
408
+ 0.9868834993023391,
409
+ 0.5782795414175284,
410
+ 0.9541173647907301,
411
+ 1.1521380745389775,
412
+ 1.9911349325902201,
413
+ 1.0,
414
+ 0.9325216486314452,
415
+ 1.0303184562115624,
416
+ 0.9698188611354921,
417
+ 1.0027196672799903,
418
+ 1.0327882823860284,
419
+ 1.9911349325902201,
420
+ 1.0,
421
+ 1.9844233966366391,
422
+ 0.8944357999064109,
423
+ 0.7112349595162911,
424
+ 1.0528496975740775,
425
+ 0.9693293962135208,
426
+ 1.098217436491506,
427
+ 0.39441056751713705,
428
+ 1.131185111941341,
429
+ 0.8933013668038887,
430
+ 0.8692841653701331,
431
+ 0.9535583303775852,
432
+ 0.9578421783922644,
433
+ 0.9351032690489206,
434
+ 0.9587912379925385,
435
+ 0.8874155629442673,
436
+ 0.7402206710271984,
437
+ 1.0,
438
+ 1.0688089329251667,
439
+ 0.997681462694144,
440
+ 0.9866601266296527,
441
+ 0.9496581319654654,
442
+ 0.9257831061652533,
443
+ 0.9073562336120353,
444
+ 0.9768579353882867,
445
+ 0.9602672008044747,
446
+ 0.7793988687883875,
447
+ 1.2643817992013762,
448
+ 0.8858997832358527,
449
+ 1.0783739453909889,
450
+ 0.9243425987503827,
451
+ 0.9894525958813807,
452
+ 0.8138319611992417,
453
+ 0.9527697944043735,
454
+ 1.1413505837251008,
455
+ 0.8792523651290115,
456
+ 1.0992317647014969,
457
+ 1.0,
458
+ 1.065433498566479,
459
+ 0.9150528093441637,
460
+ 1.0062463574228966,
461
+ 1.011250604668206,
462
+ 0.7913263564369651,
463
+ 0.9735543146496928,
464
+ 0.9610800849612564,
465
+ 0.9880567372837797,
466
+ 0.3866698577857632,
467
+ 0.9853949011817834,
468
+ 0.990227174214131,
469
+ 0.8869793376043191,
470
+ 1.0049463863071384,
471
+ 0.9992217219580515,
472
+ 0.9135057665522096,
473
+ 0.9794517412025064,
474
+ 0.8334338014885702,
475
+ 0.37518500497353446,
476
+ 1.1642248030770597,
477
+ 0.9506854878365382,
478
+ 1.1083600583283926,
479
+ 0.9361744720072924,
480
+ 1.0051395038183164,
481
+ 0.7234663786843327,
482
+ 1.1371317753211319,
483
+ 1.5356103741191347,
484
+ 0.8479920793399001,
485
+ 0.46656712729960265,
486
+ 1.0,
487
+ 1.0891589322731212,
488
+ 0.8545812844441173,
489
+ 1.3469557389840487,
490
+ 1.3298686360213214,
491
+ 0.8184103746992143,
492
+ 1.2426545134673366,
493
+ 0.9345647421429395,
494
+ 0.8739291157345797,
495
+ 0.7954155323258645,
496
+ 1.0,
497
+ 0.9396031266002715,
498
+ 0.8729340873197525,
499
+ 1.1022147706138496,
500
+ 0.9052007430680863,
501
+ 0.8002297286948205,
502
+ 1.1474637082252046,
503
+ 1.0050624674836923,
504
+ 0.8958786752659496,
505
+ 0.1199464140766847,
506
+ 1.0,
507
+ 0.9484606934407114,
508
+ 0.924743989986394,
509
+ 1.1045533858189263,
510
+ 0.9763355497679247,
511
+ 0.8775711016746042,
512
+ 1.4892483405130004,
513
+ 0.9479162196372228,
514
+ 0.824520740664537,
515
+ 0.48200134691826974,
516
+ 0.8093410764663572,
517
+ 1.0307538015892828,
518
+ 0.8557116942728363,
519
+ 0.9675781578595044,
520
+ 0.9316537658305905,
521
+ 0.961482671503125,
522
+ 0.9499524026348503,
523
+ 1.0156281171297905,
524
+ 0.9533815998673338,
525
+ 0.13577727875330386,
526
+ 1.0944930405696027,
527
+ 0.9984202119037168,
528
+ 1.0610893586418122,
529
+ 1.0416564535479678,
530
+ 0.953141207852886,
531
+ 0.9699518518482332,
532
+ 1.0661304370514315,
533
+ 0.9605383246803934,
534
+ 0.9343424770461999,
535
+ 1.1428421085341074,
536
+ 0.9995106529728873,
537
+ 1.0191031224939573,
538
+ 1.0275583030415119
539
+ ]
540
+ ]
541
+ },
542
+ "width": 512,
543
+ "in_features": 262,
544
+ "out_features": 13,
545
+ "depth": 4,
546
+ "padding": 524,
547
+ "parameters": 1084073,
548
+ "cert_evals": {
549
+ "36": 0.4925372898578644,
550
+ "72": 0.3731343150138855,
551
+ "108": 0.3432835638523102,
552
+ "255": 0.17910447716712952
553
+ }
554
+ }
UCI_N4/sdp/runs/audiology-std/fold_0/result.json ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 5,
3
+ "best_val_acc": 0.1935483870967742,
4
+ "test_acc": 0.1,
5
+ "train_size": 25,
6
+ "val_size": 31,
7
+ "test_size": 140,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -1.7763568394002505e-17,
12
+ -8.399999999486596e-07,
13
+ 7.99999999756551e-08,
14
+ -1.2800000001833566e-06,
15
+ -3.6000000007696543e-07,
16
+ -8.799999999986596e-07,
17
+ 0.0,
18
+ 0.0,
19
+ 0.0,
20
+ 0.0,
21
+ 0.0,
22
+ 0.0,
23
+ 0.0,
24
+ 0.0,
25
+ 0.0,
26
+ 0.0,
27
+ -8.000000002006402e-08,
28
+ 7.99999999756551e-08,
29
+ 0.0,
30
+ 0.0,
31
+ 0.0,
32
+ 0.0,
33
+ 7.99999999756551e-08,
34
+ 0.0,
35
+ -3.199999999159431e-07,
36
+ 0.0,
37
+ 0.0,
38
+ 0.0,
39
+ 0.0,
40
+ 0.0,
41
+ 0.0,
42
+ 0.0,
43
+ -3.3306690738754695e-17,
44
+ -3.999999999981796e-07,
45
+ 0.0,
46
+ 7.99999999756551e-08,
47
+ 0.0,
48
+ 0.0,
49
+ 0.0,
50
+ 0.0,
51
+ 0.0,
52
+ 0.0,
53
+ -8.659739592076221e-17,
54
+ 0.0,
55
+ -8.659739592076221e-17,
56
+ 0.0,
57
+ 0.0,
58
+ 0.0,
59
+ -7.199999999940587e-07,
60
+ -4.800000000759752e-07,
61
+ 2.799999999325564e-07,
62
+ 0.0,
63
+ 2.220446049250313e-18,
64
+ 0.0,
65
+ -1.5999999996907377e-07,
66
+ 0.0,
67
+ -4.0000000006479297e-07,
68
+ 0.0,
69
+ 0.0
70
+ ]
71
+ ],
72
+ "std": [
73
+ [
74
+ 0.9797958971132714,
75
+ 0.979795399156076,
76
+ 0.979796007645425,
77
+ 0.9797944438980055,
78
+ 0.979795825808005,
79
+ 0.9797970293219844,
80
+ 1.0,
81
+ 1.0,
82
+ 1.0,
83
+ 1.0,
84
+ 1.0,
85
+ 1.0,
86
+ 1.0,
87
+ 1.0,
88
+ 0.9797958971132714,
89
+ 1.0,
90
+ 0.9797961795409461,
91
+ 0.979796007645425,
92
+ 1.0,
93
+ 1.0,
94
+ 1.0,
95
+ 1.0,
96
+ 0.9797960076454252,
97
+ 1.0,
98
+ 0.9797960772142222,
99
+ 1.0,
100
+ 1.0,
101
+ 1.0,
102
+ 1.0,
103
+ 1.0,
104
+ 1.0,
105
+ 1.0,
106
+ 0.9797958971132711,
107
+ 0.9797952000000001,
108
+ 1.0,
109
+ 0.9797960076454251,
110
+ 1.0,
111
+ 1.0,
112
+ 1.0,
113
+ 1.0,
114
+ 1.0,
115
+ 1.0,
116
+ 0.9797958971132709,
117
+ 1.0,
118
+ 0.9797958971132709,
119
+ 1.0,
120
+ 1.0,
121
+ 1.0,
122
+ 0.9797942770355633,
123
+ 0.9797949007791427,
124
+ 0.9797958854236333,
125
+ 1.0,
126
+ 0.979795897113271,
127
+ 1.0,
128
+ 0.9797957933341287,
129
+ 1.0,
130
+ 0.9797952,
131
+ 1.0,
132
+ 1.0
133
+ ]
134
+ ]
135
+ },
136
+ "width": 256,
137
+ "in_features": 59,
138
+ "out_features": 18,
139
+ "depth": 4,
140
+ "padding": 118,
141
+ "parameters": 125022,
142
+ "cert_evals": {
143
+ "36": 0.09677419066429138,
144
+ "72": 0.0,
145
+ "108": 0.0,
146
+ "255": 0.0
147
+ }
148
+ }
UCI_N4/sdp/runs/audiology-std/fold_2/result.json ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 30,
3
+ "best_val_acc": 0.36,
4
+ "test_acc": 0.3561643835616438,
5
+ "train_size": 25,
6
+ "val_size": 25,
7
+ "test_size": 146,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -1.7763568394002505e-17,
12
+ -8.399999999486596e-07,
13
+ 7.99999999756551e-08,
14
+ -1.2800000001833566e-06,
15
+ -3.6000000007696543e-07,
16
+ -8.799999999986596e-07,
17
+ 0.0,
18
+ 0.0,
19
+ 0.0,
20
+ 0.0,
21
+ 0.0,
22
+ 0.0,
23
+ 0.0,
24
+ 0.0,
25
+ 0.0,
26
+ 0.0,
27
+ -8.000000002006402e-08,
28
+ 7.99999999756551e-08,
29
+ 0.0,
30
+ 0.0,
31
+ 0.0,
32
+ 0.0,
33
+ 7.99999999756551e-08,
34
+ 0.0,
35
+ -3.199999999159431e-07,
36
+ 0.0,
37
+ 0.0,
38
+ 0.0,
39
+ 0.0,
40
+ 0.0,
41
+ 0.0,
42
+ 0.0,
43
+ -3.3306690738754695e-17,
44
+ -3.999999999981796e-07,
45
+ 0.0,
46
+ 7.99999999756551e-08,
47
+ 0.0,
48
+ 0.0,
49
+ 0.0,
50
+ 0.0,
51
+ 0.0,
52
+ 0.0,
53
+ -8.659739592076221e-17,
54
+ 0.0,
55
+ -8.659739592076221e-17,
56
+ 0.0,
57
+ 0.0,
58
+ 0.0,
59
+ -7.199999999940587e-07,
60
+ -4.800000000759752e-07,
61
+ 2.799999999325564e-07,
62
+ 0.0,
63
+ 2.220446049250313e-18,
64
+ 0.0,
65
+ -1.5999999996907377e-07,
66
+ 0.0,
67
+ -4.0000000006479297e-07,
68
+ 0.0,
69
+ 0.0
70
+ ]
71
+ ],
72
+ "std": [
73
+ [
74
+ 0.9797958971132714,
75
+ 0.979795399156076,
76
+ 0.979796007645425,
77
+ 0.9797944438980055,
78
+ 0.979795825808005,
79
+ 0.9797970293219844,
80
+ 1.0,
81
+ 1.0,
82
+ 1.0,
83
+ 1.0,
84
+ 1.0,
85
+ 1.0,
86
+ 1.0,
87
+ 1.0,
88
+ 0.9797958971132714,
89
+ 1.0,
90
+ 0.9797961795409461,
91
+ 0.979796007645425,
92
+ 1.0,
93
+ 1.0,
94
+ 1.0,
95
+ 1.0,
96
+ 0.9797960076454252,
97
+ 1.0,
98
+ 0.9797960772142222,
99
+ 1.0,
100
+ 1.0,
101
+ 1.0,
102
+ 1.0,
103
+ 1.0,
104
+ 1.0,
105
+ 1.0,
106
+ 0.9797958971132711,
107
+ 0.9797952000000001,
108
+ 1.0,
109
+ 0.9797960076454251,
110
+ 1.0,
111
+ 1.0,
112
+ 1.0,
113
+ 1.0,
114
+ 1.0,
115
+ 1.0,
116
+ 0.9797958971132709,
117
+ 1.0,
118
+ 0.9797958971132709,
119
+ 1.0,
120
+ 1.0,
121
+ 1.0,
122
+ 0.9797942770355633,
123
+ 0.9797949007791427,
124
+ 0.9797958854236333,
125
+ 1.0,
126
+ 0.979795897113271,
127
+ 1.0,
128
+ 0.9797957933341287,
129
+ 1.0,
130
+ 0.9797952,
131
+ 1.0,
132
+ 1.0
133
+ ]
134
+ ]
135
+ },
136
+ "width": 256,
137
+ "in_features": 59,
138
+ "out_features": 18,
139
+ "depth": 4,
140
+ "padding": 118,
141
+ "parameters": 125022,
142
+ "cert_evals": {
143
+ "36": 0.2800000011920929,
144
+ "72": 0.23999999463558197,
145
+ "108": 0.23999999463558197,
146
+ "255": 0.07999999821186066
147
+ }
148
+ }
UCI_N4/sdp/runs/audiology-std/fold_3/result.json ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 45,
3
+ "best_val_acc": 0.5,
4
+ "test_acc": 0.3546099290780142,
5
+ "train_size": 25,
6
+ "val_size": 30,
7
+ "test_size": 141,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -1.7763568394002505e-17,
12
+ -8.399999999486596e-07,
13
+ 7.99999999756551e-08,
14
+ -1.2800000001833566e-06,
15
+ -3.6000000007696543e-07,
16
+ -8.799999999986596e-07,
17
+ 0.0,
18
+ 0.0,
19
+ 0.0,
20
+ 0.0,
21
+ 0.0,
22
+ 0.0,
23
+ 0.0,
24
+ 0.0,
25
+ 0.0,
26
+ 0.0,
27
+ -8.000000002006402e-08,
28
+ 7.99999999756551e-08,
29
+ 0.0,
30
+ 0.0,
31
+ 0.0,
32
+ 0.0,
33
+ 7.99999999756551e-08,
34
+ 0.0,
35
+ -3.199999999159431e-07,
36
+ 0.0,
37
+ 0.0,
38
+ 0.0,
39
+ 0.0,
40
+ 0.0,
41
+ 0.0,
42
+ 0.0,
43
+ -3.3306690738754695e-17,
44
+ -3.999999999981796e-07,
45
+ 0.0,
46
+ 7.99999999756551e-08,
47
+ 0.0,
48
+ 0.0,
49
+ 0.0,
50
+ 0.0,
51
+ 0.0,
52
+ 0.0,
53
+ -8.659739592076221e-17,
54
+ 0.0,
55
+ -8.659739592076221e-17,
56
+ 0.0,
57
+ 0.0,
58
+ 0.0,
59
+ -7.199999999940587e-07,
60
+ -4.800000000759752e-07,
61
+ 2.799999999325564e-07,
62
+ 0.0,
63
+ 2.220446049250313e-18,
64
+ 0.0,
65
+ -1.5999999996907377e-07,
66
+ 0.0,
67
+ -4.0000000006479297e-07,
68
+ 0.0,
69
+ 0.0
70
+ ]
71
+ ],
72
+ "std": [
73
+ [
74
+ 0.9797958971132714,
75
+ 0.979795399156076,
76
+ 0.979796007645425,
77
+ 0.9797944438980055,
78
+ 0.979795825808005,
79
+ 0.9797970293219844,
80
+ 1.0,
81
+ 1.0,
82
+ 1.0,
83
+ 1.0,
84
+ 1.0,
85
+ 1.0,
86
+ 1.0,
87
+ 1.0,
88
+ 0.9797958971132714,
89
+ 1.0,
90
+ 0.9797961795409461,
91
+ 0.979796007645425,
92
+ 1.0,
93
+ 1.0,
94
+ 1.0,
95
+ 1.0,
96
+ 0.9797960076454252,
97
+ 1.0,
98
+ 0.9797960772142222,
99
+ 1.0,
100
+ 1.0,
101
+ 1.0,
102
+ 1.0,
103
+ 1.0,
104
+ 1.0,
105
+ 1.0,
106
+ 0.9797958971132711,
107
+ 0.9797952000000001,
108
+ 1.0,
109
+ 0.9797960076454251,
110
+ 1.0,
111
+ 1.0,
112
+ 1.0,
113
+ 1.0,
114
+ 1.0,
115
+ 1.0,
116
+ 0.9797958971132709,
117
+ 1.0,
118
+ 0.9797958971132709,
119
+ 1.0,
120
+ 1.0,
121
+ 1.0,
122
+ 0.9797942770355633,
123
+ 0.9797949007791427,
124
+ 0.9797958854236333,
125
+ 1.0,
126
+ 0.979795897113271,
127
+ 1.0,
128
+ 0.9797957933341287,
129
+ 1.0,
130
+ 0.9797952,
131
+ 1.0,
132
+ 1.0
133
+ ]
134
+ ]
135
+ },
136
+ "width": 256,
137
+ "in_features": 59,
138
+ "out_features": 18,
139
+ "depth": 4,
140
+ "padding": 118,
141
+ "parameters": 125022,
142
+ "cert_evals": {
143
+ "36": 0.36666667461395264,
144
+ "72": 0.2666666805744171,
145
+ "108": 0.20000001788139343,
146
+ "255": 0.10000000894069672
147
+ }
148
+ }
UCI_N4/sdp/runs/balance-scale/fold_0/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 40,
3
+ "best_val_acc": 0.7108433734939759,
4
+ "test_acc": 0.694300518134715,
5
+ "train_size": 156,
6
+ "val_size": 83,
7
+ "test_size": 386,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.05887832692307693,
12
+ -2.5641025661690044e-08,
13
+ 0.09964028205128199,
14
+ -0.09058207692307692
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 0.9464310236223092,
20
+ 0.9765235538802873,
21
+ 0.9974316897506468,
22
+ 1.0391308031314608
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 3,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1569,
32
+ "cert_evals": {
33
+ "36": 0.6024096012115479,
34
+ "72": 0.40963852405548096,
35
+ "108": 0.3012048006057739,
36
+ "255": 0.048192769289016724
37
+ }
38
+ }
UCI_N4/sdp/runs/balance-scale/fold_1/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 54,
3
+ "best_val_acc": 0.8556701030927835,
4
+ "test_acc": 0.7688172043010753,
5
+ "train_size": 156,
6
+ "val_size": 97,
7
+ "test_size": 372,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.09511109615384612,
12
+ -3.416070845000482e-17,
13
+ 0.00905823076923074,
14
+ 0.08152388461538454
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 1.0090351712085057,
20
+ 1.0055834762270852,
21
+ 0.9532661180714023,
22
+ 1.002273371607005
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 3,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1569,
32
+ "cert_evals": {
33
+ "36": 0.6391752362251282,
34
+ "72": 0.3711340129375458,
35
+ "108": 0.22680412232875824,
36
+ "255": 0.0824742242693901
37
+ }
38
+ }
UCI_N4/sdp/runs/balance-scale/fold_2/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 70,
3
+ "best_val_acc": 0.7634408602150538,
4
+ "test_acc": 0.7207446808510638,
5
+ "train_size": 156,
6
+ "val_size": 93,
7
+ "test_size": 376,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.00452913461538464,
12
+ 0.06340748717948716,
13
+ -1.2820512825151571e-08,
14
+ 0.09964030769230771
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 0.9879158233594086,
20
+ 0.9907460042778667,
21
+ 1.027617579941566,
22
+ 0.9614936385801037
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 3,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1569,
32
+ "cert_evals": {
33
+ "36": 0.6236559152603149,
34
+ "72": 0.47311827540397644,
35
+ "108": 0.3333333432674408,
36
+ "255": 0.04301075264811516
37
+ }
38
+ }
UCI_N4/sdp/runs/balance-scale/fold_3/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 17,
3
+ "best_val_acc": 0.8260869565217391,
4
+ "test_acc": 0.8143236074270557,
5
+ "train_size": 156,
6
+ "val_size": 92,
7
+ "test_size": 377,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.05434929487179499,
12
+ -0.08605298076923085,
13
+ 0.06793655769230768,
14
+ -0.16757685256410257
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 1.0569029867956488,
20
+ 1.0161657906649941,
21
+ 0.9625917447832895,
22
+ 0.9469510608150327
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 3,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1569,
32
+ "cert_evals": {
33
+ "36": 0.5978261232376099,
34
+ "72": 0.3695652186870575,
35
+ "108": 0.260869562625885,
36
+ "255": 0.032608695328235626
37
+ }
38
+ }
UCI_N4/sdp/runs/blood/fold_0/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 10,
3
+ "best_val_acc": 0.7704918032786885,
4
+ "test_acc": 0.7015945330296127,
5
+ "train_size": 187,
6
+ "val_size": 122,
7
+ "test_size": 439,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.08207599251336908,
12
+ 0.07211877540106948,
13
+ 0.07211877540106948,
14
+ 0.12092969090909093
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 1.0915037898164763,
20
+ 0.9154190444987925,
21
+ 0.9154190444987925,
22
+ 1.0234960637376278
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 2,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1558,
32
+ "cert_evals": {
33
+ "36": 0.24590162932872772,
34
+ "72": 0.049180325120687485,
35
+ "108": 0.008196720853447914,
36
+ "255": 0.0
37
+ }
38
+ }
UCI_N4/sdp/runs/blood/fold_1/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 23,
3
+ "best_val_acc": 0.603448275862069,
4
+ "test_acc": 0.7056179775280899,
5
+ "train_size": 187,
6
+ "val_size": 116,
7
+ "test_size": 445,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ -0.0044589358288771265,
12
+ -0.03777642245989305,
13
+ -0.03777642245989305,
14
+ -0.04118699946524062
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 1.0355747128653376,
20
+ 1.0168425706533084,
21
+ 1.0168425706533084,
22
+ 0.9389071377082803
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 2,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1558,
32
+ "cert_evals": {
33
+ "36": 0.43103447556495667,
34
+ "72": 0.3448275923728943,
35
+ "108": 0.24137930572032928,
36
+ "255": 0.025862067937850952
37
+ }
38
+ }
UCI_N4/sdp/runs/blood/fold_2/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 1,
3
+ "best_val_acc": 0.7727272727272727,
4
+ "test_acc": 0.7450110864745011,
5
+ "train_size": 187,
6
+ "val_size": 110,
7
+ "test_size": 451,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.05565309197860972,
12
+ -0.04876601497326191,
13
+ -0.04876601497326191,
14
+ 0.022211831550802065
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 1.2081413746481122,
20
+ 0.9472357528176619,
21
+ 0.9472357528176619,
22
+ 0.9442482982599183
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 2,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1558,
32
+ "cert_evals": {
33
+ "36": 0.5181818008422852,
34
+ "72": 0.0181818176060915,
35
+ "108": 0.0181818176060915,
36
+ "255": 0.0
37
+ }
38
+ }
UCI_N4/sdp/runs/blood/fold_3/result.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 20,
3
+ "best_val_acc": 0.6864406779661016,
4
+ "test_acc": 0.672686230248307,
5
+ "train_size": 187,
6
+ "val_size": 118,
7
+ "test_size": 443,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.02856966417112282,
12
+ -0.11561878823529406,
13
+ -0.11561878823529406,
14
+ -0.0299989443850266
15
+ ]
16
+ ],
17
+ "std": [
18
+ [
19
+ 1.1041996654221626,
20
+ 0.9454192748690525,
21
+ 0.9454192748690525,
22
+ 0.9892882254644951
23
+ ]
24
+ ]
25
+ },
26
+ "width": 32,
27
+ "in_features": 4,
28
+ "out_features": 2,
29
+ "depth": 4,
30
+ "padding": 10,
31
+ "parameters": 1558,
32
+ "cert_evals": {
33
+ "36": 0.4406779706478119,
34
+ "72": 0.24576270580291748,
35
+ "108": 0.1355932205915451,
36
+ "255": 0.016949152573943138
37
+ }
38
+ }
UCI_N4/sdp/runs/car/fold_0/result.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 48,
3
+ "best_val_acc": 0.7481481481481481,
4
+ "test_acc": 0.7426900584795322,
5
+ "train_size": 432,
6
+ "val_size": 270,
7
+ "test_size": 1026,
8
+ "stats": {
9
+ "mean": [
10
+ [
11
+ 0.08486305092592587,
12
+ -0.024837976851851778,
13
+ -1.3287037036350012e-06,
14
+ 0.011336944444444445,
15
+ -0.03684506944444444,
16
+ -0.03401083333333333
17
+ ]
18
+ ],
19
+ "std": [
20
+ [
21
+ 1.0016589891278265,
22
+ 1.0231915721256846,
23
+ 0.9608720065155524,
24
+ 0.9785956932593036,
25
+ 0.9832757136677825,
26
+ 1.0299163223065575
27
+ ]
28
+ ]
29
+ },
30
+ "width": 32,
31
+ "in_features": 6,
32
+ "out_features": 4,
33
+ "depth": 4,
34
+ "padding": 12,
35
+ "parameters": 1844,
36
+ "cert_evals": {
37
+ "36": 0.67037034034729,
38
+ "72": 0.5629629492759705,
39
+ "108": 0.4444444477558136,
40
+ "255": 0.10370370000600815
41
+ }
42
+ }
UCI_N4/sdp/summary.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N4/wilcoxon_pairwise_all.csv ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ metric,alg_a,alg_b,n_common,n_nonzero,wins_a,wins_b,ties,win_rate_a_over_b,mean_diff_a_minus_b,median_diff_a_minus_b,W_stat,p_two_sided,z_equiv,effect_size_r,p_holm_global,p_holm_within_metric
2
+ mean_cert_acc_108,aol,ldlt-resnet,121,120,1,119,1,0.012396694214876033,-0.24023560125702478,-0.2178627868,1.0,2.047798018733893e-21,-9.502566527959253,0.8674616735928048,1.5358485140504197e-19,3.071697028100839e-20
3
+ mean_cert_acc_108,aol,sandwich,121,120,4,116,1,0.0371900826446281,-0.2791979140619835,-0.24018719700000002,32.0,4.451739109777974e-21,-9.421385624393324,0.8600509049058529,3.2052521590401414e-19,6.232434753689163e-20
4
+ mean_cert_acc_108,aol,sdp,121,118,2,116,3,0.028925619834710745,-0.20478923102975205,-0.159539476,12.0,5.792775287386205e-21,-9.393701780851549,0.8647603427558215,4.0549427011703434e-19,7.530607873602066e-20
5
+ mean_cert_acc_108,aol,ortho,121,119,6,113,2,0.05785123966942149,-0.2254036970661157,-0.1816607546,72.0,1.7810463144421207e-20,-9.274708948644408,0.8502111753596431,1.1576801043873786e-18,2.1372555773305449e-19
6
+ mean_cert_acc_108,aol,ldlt,121,111,12,99,10,0.14049586776859505,-0.14268145603305787,-0.07846696670000008,158.0,4.019802318228132e-18,-8.678228661432334,0.8237010122967007,2.4520794141191604e-16,4.421782550050945e-17
7
+ mean_cert_acc_108,ldlt,sandwich,121,121,17,104,0,0.14049586776859505,-0.13651645802892565,-0.0904583447,492.0,1.3177243514651385e-16,-8.271961883738362,0.7519965348853056,7.51102880335129e-15,1.3177243514651386e-15
8
+ mean_cert_acc_108,ortho,sandwich,121,121,16,105,0,0.1322314049586777,-0.05379421699586777,-0.047495976100000004,700.5,1.053266221565602e-14,-7.7326548003239015,0.7029686182112638,5.16100448567145e-13,9.479395994090418e-14
9
+ mean_cert_acc_108,ldlt,ldlt-resnet,121,120,23,97,1,0.19421487603305784,-0.09755414522396695,-0.046755802799999996,787.0,9.758136579089918e-14,-7.444135415660514,0.6795534813800599,4.488742826381363e-12,7.806509263271935e-13
10
+ mean_cert_acc_108,sandwich,sdp,121,119,93,26,2,0.7768595041322314,0.07440868303223143,0.04801563549999999,764.0,1.009480241756313e-13,7.439655741364371,0.6819921236516022,4.542661087903409e-12,7.806509263271935e-13
11
+ mean_cert_acc_108,ldlt,ortho,121,119,35,84,2,0.2975206611570248,-0.08272224103305786,-0.027626114000000004,1497.0,3.8877059773136556e-08,-5.495878283363984,0.503806336220975,1.2051888529672332e-06,2.3326235863881932e-07
12
+ mean_cert_acc_108,ldlt,sdp,121,119,37,82,2,0.3140495867768595,-0.06210777499669422,-0.0208054809,1682.0,5.577705136195286e-07,-5.005293249625825,0.45883447991174453,1.5617574381346803e-05,2.788852568097643e-06
13
+ mean_cert_acc_108,ldlt-resnet,sandwich,121,120,41,79,1,0.34297520661157027,-0.03896231280495868,-0.021271005300000034,1952.0,1.1171848825351552e-05,-4.393152914607039,0.4010381583166403,0.0002569525229830857,4.4687395301406206e-05
14
+ mean_cert_acc_108,ldlt-resnet,sdp,121,117,82,35,4,0.6942148760330579,0.03544637022727273,0.01778079570000002,1875.0,1.815816313643977e-05,4.286412555226042,0.39627898091436187,0.00038132142586523517,5.447448940931931e-05
15
+ mean_cert_acc_108,ldlt-resnet,ortho,121,119,77,42,2,0.6446280991735537,0.014831904190909085,0.019129688799999996,2543.0,0.006487165385754149,2.722083984498495,0.24953302973743355,0.06487165385754148,0.012974330771508297
16
+ mean_cert_acc_108,ortho,sdp,121,119,60,59,2,0.5041322314049587,0.020614466036363646,0.0,2941.0,0.09558139242277705,1.6666632092131553,0.15278276589379147,0.6690697469594393,0.09558139242277705
17
+ mean_cert_acc_255,aol,ldlt-resnet,121,109,2,107,12,0.06611570247933884,-0.11753305529173554,-0.05601204380000001,17.0,2.0740776437226692e-19,-9.009283140067824,0.8629328202556713,1.3066689155452815e-17,3.1111164655840036e-18
18
+ mean_cert_acc_255,aol,sandwich,121,109,2,107,12,0.06611570247933884,-0.14770040981735538,-0.0791132376,58.0,6.372844948293353e-19,-8.885334991426987,0.8510607407784022,3.951163867941879e-17,8.921982927610695e-18
19
+ mean_cert_acc_255,aol,sdp,121,101,2,99,20,0.09917355371900827,-0.08689903849586776,-0.04067984229999999,24.0,5.530458211785927e-18,-8.641861221158155,0.8598973307685877,3.3182749270715563e-16,7.189595675321704e-17
20
+ mean_cert_acc_255,aol,ortho,121,105,5,100,16,0.10743801652892562,-0.09676086119917354,-0.03474230319999999,109.0,1.2845521334047947e-17,-8.54507285389116,0.8339137221462913,7.578857587088289e-16,1.5414625600857537e-16
21
+ mean_cert_acc_255,ldlt,sandwich,121,109,11,98,12,0.14049586776859505,-0.08465275803801653,-0.0371107189,291.0,2.816907595311407e-16,-8.180917484450982,0.783589780383245,1.5211301014681596e-14,3.0985983548425475e-15
22
+ mean_cert_acc_255,ortho,sandwich,121,111,16,95,10,0.17355371900826447,-0.05093954861818182,-0.0340253412,427.0,3.1013866504941554e-15,-7.886757730791445,0.7485779160743535,1.6127210582569609e-13,3.101386650494156e-14
23
+ mean_cert_acc_255,aol,ldlt,121,85,6,79,36,0.19834710743801653,-0.06304765177933884,-0.0166666675,127.0,9.405252007994125e-14,-7.448996986141906,0.8079571632467769,4.420468443757239e-12,8.464726807194712e-13
24
+ mean_cert_acc_255,sandwich,sdp,121,110,86,24,11,0.756198347107438,0.060801371321487614,0.0260695191,845.0,4.6434585276704845e-11,6.581941003154479,0.6275634511129401,1.8109488257914889e-09,3.7147668221363876e-10
25
+ mean_cert_acc_255,ldlt,ldlt-resnet,121,109,20,89,12,0.21487603305785125,-0.05448540351239671,-0.019285964800000006,847.0,8.032740235539502e-11,-6.499986158102626,0.6225857595804342,3.0524412895050106e-09,5.622918164877651e-10
26
+ mean_cert_acc_255,ldlt-resnet,sdp,121,109,80,29,12,0.7107438016528925,0.030634016795867774,0.018369630000000026,1331.0,4.735434554374733e-07,5.036733460185569,0.48243156998186193,1.3732760207686725e-05,2.8412607326248398e-06
27
+ mean_cert_acc_255,ldlt,sdp,121,101,29,72,20,0.32231404958677684,-0.023851386716528936,-0.0067567569,1312.0,1.8808503646691013e-05,-4.278585151831732,0.42573513475528263,0.00038132142586523517,9.404251823345507e-05
28
+ mean_cert_acc_255,ldlt-resnet,ortho,121,112,74,38,9,0.6487603305785123,0.020772194092561983,0.010416667000000001,1829.0,0.0001069650723295461,3.874223818787645,0.366079740996967,0.0018184062296022836,0.0004278602893181844
29
+ mean_cert_acc_255,ldlt,ortho,121,105,34,71,16,0.34710743801652894,-0.03371320941983471,-0.006727611699999997,1607.0,0.00017247727930010974,-3.756251628627802,0.3665726238390919,0.002759636468801756,0.0005174318379003293
30
+ mean_cert_acc_255,ldlt-resnet,sandwich,121,113,45,68,8,0.4049586776859504,-0.030167354525619836,-0.0091719143,2100.0,0.001333709618315114,-3.2086257723300147,0.3018421222864282,0.016004515419781366,0.002667419236630228
31
+ mean_cert_acc_255,ortho,sdp,121,109,57,52,12,0.5206611570247934,0.009861822703305786,0.0,2967.0,0.9277329720348793,0.09069748127585056,0.008687243156936288,1.0,0.9277329720348793
32
+ mean_cert_acc_36,aol,sdp,121,121,4,117,0,0.03305785123966942,-0.22732832963305788,-0.19977375490000004,27.0,2.674537391703659e-21,-9.4747291150343,0.8613390104576637,1.9791576698607075e-19,4.011806087555488e-20
33
+ mean_cert_acc_36,aol,ldlt-resnet,121,121,4,117,0,0.03305785123966942,-0.24963761973471077,-0.2301754896,47.0,4.3839246911816975e-21,-9.42299704233414,0.8566360947576491,3.2002650245626393e-19,6.137494567654376e-20
34
+ mean_cert_acc_36,aol,sandwich,121,120,6,114,1,0.05371900826446281,-0.2737254626123968,-0.26255667769999996,32.0,4.451910362421393e-21,-9.421381585871135,0.8600505362409027,3.2052521590401414e-19,6.137494567654376e-20
35
+ mean_cert_acc_36,aol,ortho,121,121,8,113,0,0.06611570247933884,-0.241676944838843,-0.22040875259999992,87.0,1.168493059599824e-20,-9.319536793967892,0.8472306176334446,7.945752805278803e-19,1.402191671519789e-19
36
+ mean_cert_acc_36,aol,ldlt,121,121,17,104,0,0.14049586776859505,-0.16436359131074382,-0.14151147009999998,554.0,4.996204614399906e-16,-8.111588999385086,0.7374171817622805,2.64798844563195e-14,5.495825075839896e-15
37
+ mean_cert_acc_36,ldlt,sandwich,121,120,31,89,1,0.2603305785123967,-0.1093618713016529,-0.0386904776,998.0,5.518615109807926e-12,-6.891554035641388,0.6291099335977582,2.2074460439231703e-10,5.518615109807926e-11
38
+ mean_cert_acc_36,ldlt,ldlt-resnet,121,121,40,81,0,0.3305785123966942,-0.08527402842396696,-0.029671715599999995,1410.0,3.6914801764267954e-09,-5.8974562878182395,0.5361323898016581,1.2920180617493783e-07,3.3223321587841155e-08
39
+ mean_cert_acc_36,ortho,sandwich,121,121,28,93,0,0.23140495867768596,-0.03204851777355372,-0.023770898600000034,1424.5,4.629982341997365e-09,-5.859952985493828,0.532722998681257,1.5741939962791043e-07,3.703985873597892e-08
40
+ mean_cert_acc_36,sandwich,sdp,121,121,83,38,0,0.6859504132231405,0.04639713297933885,0.020703285900000035,1530.0,2.309408306793832e-08,5.587063851617279,0.5079148956015708,7.390106581740263e-07,1.6165858147556826e-07
41
+ mean_cert_acc_36,ldlt,ortho,121,121,48,73,0,0.39669421487603307,-0.07731335352809918,-0.020019561100000027,1957.0,7.374456547924547e-06,-4.4825840994688635,0.40750764540626033,0.00017698695715018912,4.424673928754728e-05
42
+ mean_cert_acc_36,ldlt,sdp,121,120,47,73,1,0.3925619834710744,-0.06296473832231406,-0.00853426749999997,2014.0,2.3287734119139806e-05,-4.230784843977044,0.3862160491662003,0.0004424669482636563,0.00011643867059569903
43
+ mean_cert_acc_36,ldlt-resnet,sdp,121,119,76,43,2,0.6363636363636364,0.022309290101652897,0.0094590336,2285.0,0.000658615446347901,3.406251220738739,0.31225053745517123,0.009220616248870614,0.002634461785391604
44
+ mean_cert_acc_36,ldlt-resnet,sandwich,121,121,44,77,0,0.36363636363636365,-0.02408784287768595,-0.008888855599999967,2466.0,0.0015454857645281082,-3.1660041731381345,0.2878185611943759,0.01700034340980919,0.0046364572935843245
45
+ mean_cert_acc_36,ldlt-resnet,ortho,121,120,78,42,1,0.6487603305785123,0.007960674895867772,0.008435804399999997,2756.0,0.022161865883233774,2.2875821585152014,0.20882672506085573,0.19945679294910396,0.04432373176646755
46
+ mean_cert_acc_36,ortho,sdp,121,120,60,60,1,0.5,0.014348615205785124,0.0,2916.5,0.06186606048113158,1.8672544684343122,0.17045623216063183,0.49492848384905264,0.06186606048113158
47
+ mean_cert_acc_72,aol,sandwich,121,120,6,114,1,0.05371900826446281,-0.2997736487107438,-0.27226908129999994,58.0,8.496209443695367e-21,-9.3532909892811,0.8538347436231781,5.862384516149803e-19,1.274431416554305e-19
48
+ mean_cert_acc_72,aol,sdp,121,119,3,116,2,0.03305785123966942,-0.23363383370082644,-0.1966586188,59.0,1.2882001582431401e-20,-9.309182491555736,0.8533713598570484,8.630941060229038e-19,1.8034802215403961e-19
49
+ mean_cert_acc_72,aol,ldlt-resnet,121,121,5,116,0,0.04132231404958678,-0.2667177943008265,-0.2325268835,103.0,1.7245108797059084e-20,-9.278147238773693,0.8434679307976084,1.1381771806058995e-18,2.241864143617681e-19
50
+ mean_cert_acc_72,aol,ortho,121,121,8,113,0,0.06611570247933884,-0.2485917486933885,-0.20847125350000006,149.0,5.230116370195061e-20,-9.159163471563327,0.8326512246875751,3.347274476924839e-18,6.276139644234073e-19
51
+ mean_cert_acc_72,aol,ldlt,121,118,16,102,3,0.1446280991735537,-0.16507800779917356,-0.11549707690000001,460.5,2.627903655908365e-16,-8.189281444338008,0.7538844636483291,1.445347010749601e-14,2.8906940214992015e-15
52
+ mean_cert_acc_72,ldlt,sandwich,121,121,21,100,0,0.17355371900826447,-0.13469564091157024,-0.07480691379999999,670.0,5.6490615474408414e-15,-7.8115462441806915,0.7101405676527901,2.881021389194829e-13,5.649061547440841e-14
53
+ mean_cert_acc_72,ortho,sandwich,121,121,18,103,0,0.1487603305785124,-0.05118190001735537,-0.03697755559999999,697.5,9.909313284775937e-15,-7.74041461447375,0.70367405586125,4.954656642387969e-13,8.918381956298343e-14
54
+ mean_cert_acc_72,sandwich,sdp,121,119,91,28,2,0.7603305785123967,0.06613981500991735,0.039577659200000004,823.0,3.259960550690419e-13,7.283198892766795,0.6676497478556854,1.4343826423037844e-11,2.6079684405523354e-12
55
+ mean_cert_acc_72,ldlt,ldlt-resnet,121,120,30,90,1,0.25206611570247933,-0.1016397865016529,-0.06253699959999992,988.0,4.5889669321993215e-12,-6.917742726637553,0.6315006230661137,1.881476442201722e-10,3.212276852539525e-11
56
+ mean_cert_acc_72,ldlt,sdp,121,121,42,79,0,0.34710743801652894,-0.06855582590165288,-0.02310658990000003,1813.0,1.203520876920646e-06,-4.855057053088463,0.4413688230080421,3.1291542799936796e-05,7.221125261523876e-06
57
+ mean_cert_acc_72,ldlt,ortho,121,121,44,77,0,0.36363636363636365,-0.08351374089421487,-0.019215077100000033,1857.0,2.124094459650997e-06,-4.741244462969663,0.431022223906333,5.310236149127492e-05,1.0620472298254984e-05
58
+ mean_cert_acc_72,ldlt-resnet,sdp,121,120,79,41,1,0.6570247933884298,0.0330839606,0.015625,1982.5,1.6085073523390747e-05,4.313279255976596,0.3937467242195802,0.00035387161751459644,6.434029409356299e-05
59
+ mean_cert_acc_72,ldlt-resnet,sandwich,121,121,44,77,0,0.36363636363636365,-0.03305585440991736,-0.0237561315,2090.5,3.514559575987584e-05,-4.1372742442274895,0.3761158403843172,0.0006326207236777651,0.00010543678727962753
60
+ mean_cert_acc_72,ldlt-resnet,ortho,121,119,77,42,2,0.6446280991735537,0.01812604560743802,0.010571103499999956,2346.0,0.0011766083878145118,3.244490750154806,0.2974219794288845,0.015295909041588654,0.0023532167756290237
61
+ mean_cert_acc_72,ortho,sdp,121,120,61,59,1,0.5082644628099173,0.01495791499256198,0.00017112490000004144,3188.0,0.24758680258859866,1.1562307074807803,0.10554894002789676,0.9903472103543947,0.24758680258859866
62
+ mean_test_acc,aol,ldlt,121,121,16,105,0,0.1322314049586777,-0.09281452340082647,-0.056798912199999996,412.0,2.273589154706615e-17,-8.478886715556222,0.7708078832323838,1.3186817097298367e-15,3.4103837320599226e-16
63
+ mean_test_acc,aol,sandwich,121,121,18,103,0,0.1487603305785124,-0.09203259326611571,-0.05946643780000005,518.0,2.311544436918459e-16,-8.204706730245373,0.7458824300223067,1.2944648846743371e-14,3.2361622116858428e-15
64
+ mean_test_acc,aol,sdp,121,121,22,99,0,0.18181818181818182,-0.06835675380991735,-0.03513440550000002,806.0,8.667701016468735e-14,-7.459764883363071,0.6781604439420974,4.1604964879049924e-12,1.1268011321409356e-12
65
+ mean_test_acc,aol,ortho,121,121,27,94,0,0.2231404958677686,-0.0674542894,-0.02649849470000004,971.0,2.0217519208624917e-12,-7.032975283586752,0.6393613894169774,8.693533259708715e-11,2.42610230503499e-11
66
+ mean_test_acc,aol,ldlt-resnet,121,121,25,96,0,0.2066115702479339,-0.07273327814214876,-0.031338923699999965,1013.0,4.3801917672420244e-12,-6.924337930916415,0.6294852664469468,1.8396805422416503e-10,4.818210943966227e-11
67
+ mean_test_acc,ortho,sandwich,121,120,31,89,1,0.2603305785123967,-0.024578303866115706,-0.012561727300000047,1269.0,6.335852078999485e-10,-6.181840509645258,0.5643222490053234,2.3442652692298095e-08,6.335852078999485e-09
68
+ mean_test_acc,ldlt,ortho,121,121,94,27,0,0.7768595041322314,0.02536023400082645,0.013893890999999992,1309.0,7.334300863478093e-10,6.158703254954046,0.5598821140867315,2.6403483108521137e-08,6.600870777130284e-09
69
+ mean_test_acc,ldlt,sdp,121,121,86,35,0,0.7107438016528925,0.024457769590909093,0.011069503199999942,1503.0,1.5412957513923103e-08,5.6569021497624945,0.5142638317965904,5.086275979594624e-07,1.2330366011138482e-07
70
+ mean_test_acc,ldlt,ldlt-resnet,121,120,87,33,1,0.7231404958677686,0.020081245258677688,0.01084393090000002,1689.0,3.7364765861695115e-07,5.081915487806236,0.46391329133439085,1.1209429758508535e-05,2.615533610318658e-06
71
+ mean_test_acc,sandwich,sdp,121,121,83,38,0,0.6859504132231405,0.02367583945619835,0.008980192799999953,1789.0,8.782065986480298e-07,4.917133510150208,0.44701213728638256,2.3711578163496805e-05,5.269239591888179e-06
72
+ mean_test_acc,ldlt-resnet,sandwich,121,121,43,78,0,0.35537190082644626,-0.019299315123966942,-0.006794625399999976,2364.0,0.0006039452283418727,-3.4298364200206075,0.3118033109109643,0.00905917842512809,0.0030197261417093633
73
+ mean_test_acc,ldlt-resnet,sdp,121,120,66,54,1,0.5495867768595041,0.004376524332231406,0.0019017287000000493,3070.0,0.14285074221929925,1.4652572612355523,0.133759075754492,0.8571044533157954,0.571402968877197
74
+ mean_test_acc,ldlt-resnet,ortho,121,121,71,50,0,0.5867768595041323,0.005278988742148763,0.002452642000000005,3138.0,0.15334793383215564,1.4278052065244156,0.12980047332040143,0.8571044533157954,0.571402968877197
75
+ mean_test_acc,ortho,sdp,121,121,60,61,0,0.49586776859504134,-0.0009024644099173576,-0.00036599980000007193,3623.0,0.862413703083493,-0.17330244354553592,0.01575476759504872,1.0,1.0
76
+ mean_test_acc,ldlt,sandwich,121,121,59,62,0,0.48760330578512395,0.000781930134710744,-0.00016415209999998126,3624.0,0.8644472072224189,0.170715839910528,0.015519621810048,1.0,1.0
UCI_N4/wilcoxon_pairwise_all.json ADDED
@@ -0,0 +1,1427 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metric":"mean_cert_acc_108",
4
+ "alg_a":"aol",
5
+ "alg_b":"ldlt-resnet",
6
+ "n_common":121,
7
+ "n_nonzero":120,
8
+ "wins_a":1,
9
+ "wins_b":119,
10
+ "ties":1,
11
+ "win_rate_a_over_b":0.0123966942,
12
+ "mean_diff_a_minus_b":-0.2402356013,
13
+ "median_diff_a_minus_b":-0.2178627868,
14
+ "W_stat":1.0,
15
+ "p_two_sided":2.047798019e-21,
16
+ "z_equiv":-9.502566528,
17
+ "effect_size_r":0.8674616736,
18
+ "p_holm_global":1.535848514e-19,
19
+ "p_holm_within_metric":3.071697028e-20
20
+ },
21
+ {
22
+ "metric":"mean_cert_acc_108",
23
+ "alg_a":"aol",
24
+ "alg_b":"sandwich",
25
+ "n_common":121,
26
+ "n_nonzero":120,
27
+ "wins_a":4,
28
+ "wins_b":116,
29
+ "ties":1,
30
+ "win_rate_a_over_b":0.0371900826,
31
+ "mean_diff_a_minus_b":-0.2791979141,
32
+ "median_diff_a_minus_b":-0.240187197,
33
+ "W_stat":32.0,
34
+ "p_two_sided":4.45173911e-21,
35
+ "z_equiv":-9.4213856244,
36
+ "effect_size_r":0.8600509049,
37
+ "p_holm_global":3.205252159e-19,
38
+ "p_holm_within_metric":6.232434754e-20
39
+ },
40
+ {
41
+ "metric":"mean_cert_acc_108",
42
+ "alg_a":"aol",
43
+ "alg_b":"sdp",
44
+ "n_common":121,
45
+ "n_nonzero":118,
46
+ "wins_a":2,
47
+ "wins_b":116,
48
+ "ties":3,
49
+ "win_rate_a_over_b":0.0289256198,
50
+ "mean_diff_a_minus_b":-0.204789231,
51
+ "median_diff_a_minus_b":-0.159539476,
52
+ "W_stat":12.0,
53
+ "p_two_sided":5.792775287e-21,
54
+ "z_equiv":-9.3937017809,
55
+ "effect_size_r":0.8647603428,
56
+ "p_holm_global":4.054942701e-19,
57
+ "p_holm_within_metric":7.530607874e-20
58
+ },
59
+ {
60
+ "metric":"mean_cert_acc_108",
61
+ "alg_a":"aol",
62
+ "alg_b":"ortho",
63
+ "n_common":121,
64
+ "n_nonzero":119,
65
+ "wins_a":6,
66
+ "wins_b":113,
67
+ "ties":2,
68
+ "win_rate_a_over_b":0.0578512397,
69
+ "mean_diff_a_minus_b":-0.2254036971,
70
+ "median_diff_a_minus_b":-0.1816607546,
71
+ "W_stat":72.0,
72
+ "p_two_sided":1.781046314e-20,
73
+ "z_equiv":-9.2747089486,
74
+ "effect_size_r":0.8502111754,
75
+ "p_holm_global":1.157680104e-18,
76
+ "p_holm_within_metric":2.137255577e-19
77
+ },
78
+ {
79
+ "metric":"mean_cert_acc_108",
80
+ "alg_a":"aol",
81
+ "alg_b":"ldlt",
82
+ "n_common":121,
83
+ "n_nonzero":111,
84
+ "wins_a":12,
85
+ "wins_b":99,
86
+ "ties":10,
87
+ "win_rate_a_over_b":0.1404958678,
88
+ "mean_diff_a_minus_b":-0.142681456,
89
+ "median_diff_a_minus_b":-0.0784669667,
90
+ "W_stat":158.0,
91
+ "p_two_sided":4.019802318e-18,
92
+ "z_equiv":-8.6782286614,
93
+ "effect_size_r":0.8237010123,
94
+ "p_holm_global":2.452079414e-16,
95
+ "p_holm_within_metric":4.42178255e-17
96
+ },
97
+ {
98
+ "metric":"mean_cert_acc_108",
99
+ "alg_a":"ldlt",
100
+ "alg_b":"sandwich",
101
+ "n_common":121,
102
+ "n_nonzero":121,
103
+ "wins_a":17,
104
+ "wins_b":104,
105
+ "ties":0,
106
+ "win_rate_a_over_b":0.1404958678,
107
+ "mean_diff_a_minus_b":-0.136516458,
108
+ "median_diff_a_minus_b":-0.0904583447,
109
+ "W_stat":492.0,
110
+ "p_two_sided":1.317724351e-16,
111
+ "z_equiv":-8.2719618837,
112
+ "effect_size_r":0.7519965349,
113
+ "p_holm_global":0.0,
114
+ "p_holm_within_metric":0.0
115
+ },
116
+ {
117
+ "metric":"mean_cert_acc_108",
118
+ "alg_a":"ortho",
119
+ "alg_b":"sandwich",
120
+ "n_common":121,
121
+ "n_nonzero":121,
122
+ "wins_a":16,
123
+ "wins_b":105,
124
+ "ties":0,
125
+ "win_rate_a_over_b":0.132231405,
126
+ "mean_diff_a_minus_b":-0.053794217,
127
+ "median_diff_a_minus_b":-0.0474959761,
128
+ "W_stat":700.5,
129
+ "p_two_sided":0.0,
130
+ "z_equiv":-7.7326548003,
131
+ "effect_size_r":0.7029686182,
132
+ "p_holm_global":0.0,
133
+ "p_holm_within_metric":0.0
134
+ },
135
+ {
136
+ "metric":"mean_cert_acc_108",
137
+ "alg_a":"ldlt",
138
+ "alg_b":"ldlt-resnet",
139
+ "n_common":121,
140
+ "n_nonzero":120,
141
+ "wins_a":23,
142
+ "wins_b":97,
143
+ "ties":1,
144
+ "win_rate_a_over_b":0.194214876,
145
+ "mean_diff_a_minus_b":-0.0975541452,
146
+ "median_diff_a_minus_b":-0.0467558028,
147
+ "W_stat":787.0,
148
+ "p_two_sided":0.0,
149
+ "z_equiv":-7.4441354157,
150
+ "effect_size_r":0.6795534814,
151
+ "p_holm_global":0.0,
152
+ "p_holm_within_metric":0.0
153
+ },
154
+ {
155
+ "metric":"mean_cert_acc_108",
156
+ "alg_a":"sandwich",
157
+ "alg_b":"sdp",
158
+ "n_common":121,
159
+ "n_nonzero":119,
160
+ "wins_a":93,
161
+ "wins_b":26,
162
+ "ties":2,
163
+ "win_rate_a_over_b":0.7768595041,
164
+ "mean_diff_a_minus_b":0.074408683,
165
+ "median_diff_a_minus_b":0.0480156355,
166
+ "W_stat":764.0,
167
+ "p_two_sided":0.0,
168
+ "z_equiv":7.4396557414,
169
+ "effect_size_r":0.6819921237,
170
+ "p_holm_global":0.0,
171
+ "p_holm_within_metric":0.0
172
+ },
173
+ {
174
+ "metric":"mean_cert_acc_108",
175
+ "alg_a":"ldlt",
176
+ "alg_b":"ortho",
177
+ "n_common":121,
178
+ "n_nonzero":119,
179
+ "wins_a":35,
180
+ "wins_b":84,
181
+ "ties":2,
182
+ "win_rate_a_over_b":0.2975206612,
183
+ "mean_diff_a_minus_b":-0.082722241,
184
+ "median_diff_a_minus_b":-0.027626114,
185
+ "W_stat":1497.0,
186
+ "p_two_sided":0.0000000389,
187
+ "z_equiv":-5.4958782834,
188
+ "effect_size_r":0.5038063362,
189
+ "p_holm_global":0.0000012052,
190
+ "p_holm_within_metric":0.0000002333
191
+ },
192
+ {
193
+ "metric":"mean_cert_acc_108",
194
+ "alg_a":"ldlt",
195
+ "alg_b":"sdp",
196
+ "n_common":121,
197
+ "n_nonzero":119,
198
+ "wins_a":37,
199
+ "wins_b":82,
200
+ "ties":2,
201
+ "win_rate_a_over_b":0.3140495868,
202
+ "mean_diff_a_minus_b":-0.062107775,
203
+ "median_diff_a_minus_b":-0.0208054809,
204
+ "W_stat":1682.0,
205
+ "p_two_sided":0.0000005578,
206
+ "z_equiv":-5.0052932496,
207
+ "effect_size_r":0.4588344799,
208
+ "p_holm_global":0.0000156176,
209
+ "p_holm_within_metric":0.0000027889
210
+ },
211
+ {
212
+ "metric":"mean_cert_acc_108",
213
+ "alg_a":"ldlt-resnet",
214
+ "alg_b":"sandwich",
215
+ "n_common":121,
216
+ "n_nonzero":120,
217
+ "wins_a":41,
218
+ "wins_b":79,
219
+ "ties":1,
220
+ "win_rate_a_over_b":0.3429752066,
221
+ "mean_diff_a_minus_b":-0.0389623128,
222
+ "median_diff_a_minus_b":-0.0212710053,
223
+ "W_stat":1952.0,
224
+ "p_two_sided":0.0000111718,
225
+ "z_equiv":-4.3931529146,
226
+ "effect_size_r":0.4010381583,
227
+ "p_holm_global":0.0002569525,
228
+ "p_holm_within_metric":0.0000446874
229
+ },
230
+ {
231
+ "metric":"mean_cert_acc_108",
232
+ "alg_a":"ldlt-resnet",
233
+ "alg_b":"sdp",
234
+ "n_common":121,
235
+ "n_nonzero":117,
236
+ "wins_a":82,
237
+ "wins_b":35,
238
+ "ties":4,
239
+ "win_rate_a_over_b":0.694214876,
240
+ "mean_diff_a_minus_b":0.0354463702,
241
+ "median_diff_a_minus_b":0.0177807957,
242
+ "W_stat":1875.0,
243
+ "p_two_sided":0.0000181582,
244
+ "z_equiv":4.2864125552,
245
+ "effect_size_r":0.3962789809,
246
+ "p_holm_global":0.0003813214,
247
+ "p_holm_within_metric":0.0000544745
248
+ },
249
+ {
250
+ "metric":"mean_cert_acc_108",
251
+ "alg_a":"ldlt-resnet",
252
+ "alg_b":"ortho",
253
+ "n_common":121,
254
+ "n_nonzero":119,
255
+ "wins_a":77,
256
+ "wins_b":42,
257
+ "ties":2,
258
+ "win_rate_a_over_b":0.6446280992,
259
+ "mean_diff_a_minus_b":0.0148319042,
260
+ "median_diff_a_minus_b":0.0191296888,
261
+ "W_stat":2543.0,
262
+ "p_two_sided":0.0064871654,
263
+ "z_equiv":2.7220839845,
264
+ "effect_size_r":0.2495330297,
265
+ "p_holm_global":0.0648716539,
266
+ "p_holm_within_metric":0.0129743308
267
+ },
268
+ {
269
+ "metric":"mean_cert_acc_108",
270
+ "alg_a":"ortho",
271
+ "alg_b":"sdp",
272
+ "n_common":121,
273
+ "n_nonzero":119,
274
+ "wins_a":60,
275
+ "wins_b":59,
276
+ "ties":2,
277
+ "win_rate_a_over_b":0.5041322314,
278
+ "mean_diff_a_minus_b":0.020614466,
279
+ "median_diff_a_minus_b":0.0,
280
+ "W_stat":2941.0,
281
+ "p_two_sided":0.0955813924,
282
+ "z_equiv":1.6666632092,
283
+ "effect_size_r":0.1527827659,
284
+ "p_holm_global":0.669069747,
285
+ "p_holm_within_metric":0.0955813924
286
+ },
287
+ {
288
+ "metric":"mean_cert_acc_255",
289
+ "alg_a":"aol",
290
+ "alg_b":"ldlt-resnet",
291
+ "n_common":121,
292
+ "n_nonzero":109,
293
+ "wins_a":2,
294
+ "wins_b":107,
295
+ "ties":12,
296
+ "win_rate_a_over_b":0.0661157025,
297
+ "mean_diff_a_minus_b":-0.1175330553,
298
+ "median_diff_a_minus_b":-0.0560120438,
299
+ "W_stat":17.0,
300
+ "p_two_sided":2.074077644e-19,
301
+ "z_equiv":-9.0092831401,
302
+ "effect_size_r":0.8629328203,
303
+ "p_holm_global":1.306668916e-17,
304
+ "p_holm_within_metric":3.111116466e-18
305
+ },
306
+ {
307
+ "metric":"mean_cert_acc_255",
308
+ "alg_a":"aol",
309
+ "alg_b":"sandwich",
310
+ "n_common":121,
311
+ "n_nonzero":109,
312
+ "wins_a":2,
313
+ "wins_b":107,
314
+ "ties":12,
315
+ "win_rate_a_over_b":0.0661157025,
316
+ "mean_diff_a_minus_b":-0.1477004098,
317
+ "median_diff_a_minus_b":-0.0791132376,
318
+ "W_stat":58.0,
319
+ "p_two_sided":6.372844948e-19,
320
+ "z_equiv":-8.8853349914,
321
+ "effect_size_r":0.8510607408,
322
+ "p_holm_global":3.951163868e-17,
323
+ "p_holm_within_metric":8.921982928e-18
324
+ },
325
+ {
326
+ "metric":"mean_cert_acc_255",
327
+ "alg_a":"aol",
328
+ "alg_b":"sdp",
329
+ "n_common":121,
330
+ "n_nonzero":101,
331
+ "wins_a":2,
332
+ "wins_b":99,
333
+ "ties":20,
334
+ "win_rate_a_over_b":0.0991735537,
335
+ "mean_diff_a_minus_b":-0.0868990385,
336
+ "median_diff_a_minus_b":-0.0406798423,
337
+ "W_stat":24.0,
338
+ "p_two_sided":5.530458212e-18,
339
+ "z_equiv":-8.6418612212,
340
+ "effect_size_r":0.8598973308,
341
+ "p_holm_global":3.318274927e-16,
342
+ "p_holm_within_metric":7.189595675e-17
343
+ },
344
+ {
345
+ "metric":"mean_cert_acc_255",
346
+ "alg_a":"aol",
347
+ "alg_b":"ortho",
348
+ "n_common":121,
349
+ "n_nonzero":105,
350
+ "wins_a":5,
351
+ "wins_b":100,
352
+ "ties":16,
353
+ "win_rate_a_over_b":0.1074380165,
354
+ "mean_diff_a_minus_b":-0.0967608612,
355
+ "median_diff_a_minus_b":-0.0347423032,
356
+ "W_stat":109.0,
357
+ "p_two_sided":1.284552133e-17,
358
+ "z_equiv":-8.5450728539,
359
+ "effect_size_r":0.8339137221,
360
+ "p_holm_global":7.578857587e-16,
361
+ "p_holm_within_metric":1.54146256e-16
362
+ },
363
+ {
364
+ "metric":"mean_cert_acc_255",
365
+ "alg_a":"ldlt",
366
+ "alg_b":"sandwich",
367
+ "n_common":121,
368
+ "n_nonzero":109,
369
+ "wins_a":11,
370
+ "wins_b":98,
371
+ "ties":12,
372
+ "win_rate_a_over_b":0.1404958678,
373
+ "mean_diff_a_minus_b":-0.084652758,
374
+ "median_diff_a_minus_b":-0.0371107189,
375
+ "W_stat":291.0,
376
+ "p_two_sided":2.816907595e-16,
377
+ "z_equiv":-8.1809174845,
378
+ "effect_size_r":0.7835897804,
379
+ "p_holm_global":0.0,
380
+ "p_holm_within_metric":0.0
381
+ },
382
+ {
383
+ "metric":"mean_cert_acc_255",
384
+ "alg_a":"ortho",
385
+ "alg_b":"sandwich",
386
+ "n_common":121,
387
+ "n_nonzero":111,
388
+ "wins_a":16,
389
+ "wins_b":95,
390
+ "ties":10,
391
+ "win_rate_a_over_b":0.173553719,
392
+ "mean_diff_a_minus_b":-0.0509395486,
393
+ "median_diff_a_minus_b":-0.0340253412,
394
+ "W_stat":427.0,
395
+ "p_two_sided":0.0,
396
+ "z_equiv":-7.8867577308,
397
+ "effect_size_r":0.7485779161,
398
+ "p_holm_global":0.0,
399
+ "p_holm_within_metric":0.0
400
+ },
401
+ {
402
+ "metric":"mean_cert_acc_255",
403
+ "alg_a":"aol",
404
+ "alg_b":"ldlt",
405
+ "n_common":121,
406
+ "n_nonzero":85,
407
+ "wins_a":6,
408
+ "wins_b":79,
409
+ "ties":36,
410
+ "win_rate_a_over_b":0.1983471074,
411
+ "mean_diff_a_minus_b":-0.0630476518,
412
+ "median_diff_a_minus_b":-0.0166666675,
413
+ "W_stat":127.0,
414
+ "p_two_sided":0.0,
415
+ "z_equiv":-7.4489969861,
416
+ "effect_size_r":0.8079571632,
417
+ "p_holm_global":0.0,
418
+ "p_holm_within_metric":0.0
419
+ },
420
+ {
421
+ "metric":"mean_cert_acc_255",
422
+ "alg_a":"sandwich",
423
+ "alg_b":"sdp",
424
+ "n_common":121,
425
+ "n_nonzero":110,
426
+ "wins_a":86,
427
+ "wins_b":24,
428
+ "ties":11,
429
+ "win_rate_a_over_b":0.7561983471,
430
+ "mean_diff_a_minus_b":0.0608013713,
431
+ "median_diff_a_minus_b":0.0260695191,
432
+ "W_stat":845.0,
433
+ "p_two_sided":0.0,
434
+ "z_equiv":6.5819410032,
435
+ "effect_size_r":0.6275634511,
436
+ "p_holm_global":0.0000000018,
437
+ "p_holm_within_metric":0.0000000004
438
+ },
439
+ {
440
+ "metric":"mean_cert_acc_255",
441
+ "alg_a":"ldlt",
442
+ "alg_b":"ldlt-resnet",
443
+ "n_common":121,
444
+ "n_nonzero":109,
445
+ "wins_a":20,
446
+ "wins_b":89,
447
+ "ties":12,
448
+ "win_rate_a_over_b":0.2148760331,
449
+ "mean_diff_a_minus_b":-0.0544854035,
450
+ "median_diff_a_minus_b":-0.0192859648,
451
+ "W_stat":847.0,
452
+ "p_two_sided":0.0000000001,
453
+ "z_equiv":-6.4999861581,
454
+ "effect_size_r":0.6225857596,
455
+ "p_holm_global":0.0000000031,
456
+ "p_holm_within_metric":0.0000000006
457
+ },
458
+ {
459
+ "metric":"mean_cert_acc_255",
460
+ "alg_a":"ldlt-resnet",
461
+ "alg_b":"sdp",
462
+ "n_common":121,
463
+ "n_nonzero":109,
464
+ "wins_a":80,
465
+ "wins_b":29,
466
+ "ties":12,
467
+ "win_rate_a_over_b":0.7107438017,
468
+ "mean_diff_a_minus_b":0.0306340168,
469
+ "median_diff_a_minus_b":0.01836963,
470
+ "W_stat":1331.0,
471
+ "p_two_sided":0.0000004735,
472
+ "z_equiv":5.0367334602,
473
+ "effect_size_r":0.48243157,
474
+ "p_holm_global":0.0000137328,
475
+ "p_holm_within_metric":0.0000028413
476
+ },
477
+ {
478
+ "metric":"mean_cert_acc_255",
479
+ "alg_a":"ldlt",
480
+ "alg_b":"sdp",
481
+ "n_common":121,
482
+ "n_nonzero":101,
483
+ "wins_a":29,
484
+ "wins_b":72,
485
+ "ties":20,
486
+ "win_rate_a_over_b":0.3223140496,
487
+ "mean_diff_a_minus_b":-0.0238513867,
488
+ "median_diff_a_minus_b":-0.0067567569,
489
+ "W_stat":1312.0,
490
+ "p_two_sided":0.0000188085,
491
+ "z_equiv":-4.2785851518,
492
+ "effect_size_r":0.4257351348,
493
+ "p_holm_global":0.0003813214,
494
+ "p_holm_within_metric":0.0000940425
495
+ },
496
+ {
497
+ "metric":"mean_cert_acc_255",
498
+ "alg_a":"ldlt-resnet",
499
+ "alg_b":"ortho",
500
+ "n_common":121,
501
+ "n_nonzero":112,
502
+ "wins_a":74,
503
+ "wins_b":38,
504
+ "ties":9,
505
+ "win_rate_a_over_b":0.6487603306,
506
+ "mean_diff_a_minus_b":0.0207721941,
507
+ "median_diff_a_minus_b":0.010416667,
508
+ "W_stat":1829.0,
509
+ "p_two_sided":0.0001069651,
510
+ "z_equiv":3.8742238188,
511
+ "effect_size_r":0.366079741,
512
+ "p_holm_global":0.0018184062,
513
+ "p_holm_within_metric":0.0004278603
514
+ },
515
+ {
516
+ "metric":"mean_cert_acc_255",
517
+ "alg_a":"ldlt",
518
+ "alg_b":"ortho",
519
+ "n_common":121,
520
+ "n_nonzero":105,
521
+ "wins_a":34,
522
+ "wins_b":71,
523
+ "ties":16,
524
+ "win_rate_a_over_b":0.347107438,
525
+ "mean_diff_a_minus_b":-0.0337132094,
526
+ "median_diff_a_minus_b":-0.0067276117,
527
+ "W_stat":1607.0,
528
+ "p_two_sided":0.0001724773,
529
+ "z_equiv":-3.7562516286,
530
+ "effect_size_r":0.3665726238,
531
+ "p_holm_global":0.0027596365,
532
+ "p_holm_within_metric":0.0005174318
533
+ },
534
+ {
535
+ "metric":"mean_cert_acc_255",
536
+ "alg_a":"ldlt-resnet",
537
+ "alg_b":"sandwich",
538
+ "n_common":121,
539
+ "n_nonzero":113,
540
+ "wins_a":45,
541
+ "wins_b":68,
542
+ "ties":8,
543
+ "win_rate_a_over_b":0.4049586777,
544
+ "mean_diff_a_minus_b":-0.0301673545,
545
+ "median_diff_a_minus_b":-0.0091719143,
546
+ "W_stat":2100.0,
547
+ "p_two_sided":0.0013337096,
548
+ "z_equiv":-3.2086257723,
549
+ "effect_size_r":0.3018421223,
550
+ "p_holm_global":0.0160045154,
551
+ "p_holm_within_metric":0.0026674192
552
+ },
553
+ {
554
+ "metric":"mean_cert_acc_255",
555
+ "alg_a":"ortho",
556
+ "alg_b":"sdp",
557
+ "n_common":121,
558
+ "n_nonzero":109,
559
+ "wins_a":57,
560
+ "wins_b":52,
561
+ "ties":12,
562
+ "win_rate_a_over_b":0.520661157,
563
+ "mean_diff_a_minus_b":0.0098618227,
564
+ "median_diff_a_minus_b":0.0,
565
+ "W_stat":2967.0,
566
+ "p_two_sided":0.927732972,
567
+ "z_equiv":0.0906974813,
568
+ "effect_size_r":0.0086872432,
569
+ "p_holm_global":1.0,
570
+ "p_holm_within_metric":0.927732972
571
+ },
572
+ {
573
+ "metric":"mean_cert_acc_36",
574
+ "alg_a":"aol",
575
+ "alg_b":"sdp",
576
+ "n_common":121,
577
+ "n_nonzero":121,
578
+ "wins_a":4,
579
+ "wins_b":117,
580
+ "ties":0,
581
+ "win_rate_a_over_b":0.0330578512,
582
+ "mean_diff_a_minus_b":-0.2273283296,
583
+ "median_diff_a_minus_b":-0.1997737549,
584
+ "W_stat":27.0,
585
+ "p_two_sided":2.674537392e-21,
586
+ "z_equiv":-9.474729115,
587
+ "effect_size_r":0.8613390105,
588
+ "p_holm_global":1.97915767e-19,
589
+ "p_holm_within_metric":4.011806088e-20
590
+ },
591
+ {
592
+ "metric":"mean_cert_acc_36",
593
+ "alg_a":"aol",
594
+ "alg_b":"ldlt-resnet",
595
+ "n_common":121,
596
+ "n_nonzero":121,
597
+ "wins_a":4,
598
+ "wins_b":117,
599
+ "ties":0,
600
+ "win_rate_a_over_b":0.0330578512,
601
+ "mean_diff_a_minus_b":-0.2496376197,
602
+ "median_diff_a_minus_b":-0.2301754896,
603
+ "W_stat":47.0,
604
+ "p_two_sided":4.383924691e-21,
605
+ "z_equiv":-9.4229970423,
606
+ "effect_size_r":0.8566360948,
607
+ "p_holm_global":3.200265025e-19,
608
+ "p_holm_within_metric":6.137494568e-20
609
+ },
610
+ {
611
+ "metric":"mean_cert_acc_36",
612
+ "alg_a":"aol",
613
+ "alg_b":"sandwich",
614
+ "n_common":121,
615
+ "n_nonzero":120,
616
+ "wins_a":6,
617
+ "wins_b":114,
618
+ "ties":1,
619
+ "win_rate_a_over_b":0.0537190083,
620
+ "mean_diff_a_minus_b":-0.2737254626,
621
+ "median_diff_a_minus_b":-0.2625566777,
622
+ "W_stat":32.0,
623
+ "p_two_sided":4.451910362e-21,
624
+ "z_equiv":-9.4213815859,
625
+ "effect_size_r":0.8600505362,
626
+ "p_holm_global":3.205252159e-19,
627
+ "p_holm_within_metric":6.137494568e-20
628
+ },
629
+ {
630
+ "metric":"mean_cert_acc_36",
631
+ "alg_a":"aol",
632
+ "alg_b":"ortho",
633
+ "n_common":121,
634
+ "n_nonzero":121,
635
+ "wins_a":8,
636
+ "wins_b":113,
637
+ "ties":0,
638
+ "win_rate_a_over_b":0.0661157025,
639
+ "mean_diff_a_minus_b":-0.2416769448,
640
+ "median_diff_a_minus_b":-0.2204087526,
641
+ "W_stat":87.0,
642
+ "p_two_sided":1.16849306e-20,
643
+ "z_equiv":-9.319536794,
644
+ "effect_size_r":0.8472306176,
645
+ "p_holm_global":7.945752805e-19,
646
+ "p_holm_within_metric":1.402191672e-19
647
+ },
648
+ {
649
+ "metric":"mean_cert_acc_36",
650
+ "alg_a":"aol",
651
+ "alg_b":"ldlt",
652
+ "n_common":121,
653
+ "n_nonzero":121,
654
+ "wins_a":17,
655
+ "wins_b":104,
656
+ "ties":0,
657
+ "win_rate_a_over_b":0.1404958678,
658
+ "mean_diff_a_minus_b":-0.1643635913,
659
+ "median_diff_a_minus_b":-0.1415114701,
660
+ "W_stat":554.0,
661
+ "p_two_sided":4.996204614e-16,
662
+ "z_equiv":-8.1115889994,
663
+ "effect_size_r":0.7374171818,
664
+ "p_holm_global":0.0,
665
+ "p_holm_within_metric":0.0
666
+ },
667
+ {
668
+ "metric":"mean_cert_acc_36",
669
+ "alg_a":"ldlt",
670
+ "alg_b":"sandwich",
671
+ "n_common":121,
672
+ "n_nonzero":120,
673
+ "wins_a":31,
674
+ "wins_b":89,
675
+ "ties":1,
676
+ "win_rate_a_over_b":0.2603305785,
677
+ "mean_diff_a_minus_b":-0.1093618713,
678
+ "median_diff_a_minus_b":-0.0386904776,
679
+ "W_stat":998.0,
680
+ "p_two_sided":0.0,
681
+ "z_equiv":-6.8915540356,
682
+ "effect_size_r":0.6291099336,
683
+ "p_holm_global":0.0000000002,
684
+ "p_holm_within_metric":0.0000000001
685
+ },
686
+ {
687
+ "metric":"mean_cert_acc_36",
688
+ "alg_a":"ldlt",
689
+ "alg_b":"ldlt-resnet",
690
+ "n_common":121,
691
+ "n_nonzero":121,
692
+ "wins_a":40,
693
+ "wins_b":81,
694
+ "ties":0,
695
+ "win_rate_a_over_b":0.3305785124,
696
+ "mean_diff_a_minus_b":-0.0852740284,
697
+ "median_diff_a_minus_b":-0.0296717156,
698
+ "W_stat":1410.0,
699
+ "p_two_sided":0.0000000037,
700
+ "z_equiv":-5.8974562878,
701
+ "effect_size_r":0.5361323898,
702
+ "p_holm_global":0.0000001292,
703
+ "p_holm_within_metric":0.0000000332
704
+ },
705
+ {
706
+ "metric":"mean_cert_acc_36",
707
+ "alg_a":"ortho",
708
+ "alg_b":"sandwich",
709
+ "n_common":121,
710
+ "n_nonzero":121,
711
+ "wins_a":28,
712
+ "wins_b":93,
713
+ "ties":0,
714
+ "win_rate_a_over_b":0.2314049587,
715
+ "mean_diff_a_minus_b":-0.0320485178,
716
+ "median_diff_a_minus_b":-0.0237708986,
717
+ "W_stat":1424.5,
718
+ "p_two_sided":0.0000000046,
719
+ "z_equiv":-5.8599529855,
720
+ "effect_size_r":0.5327229987,
721
+ "p_holm_global":0.0000001574,
722
+ "p_holm_within_metric":0.000000037
723
+ },
724
+ {
725
+ "metric":"mean_cert_acc_36",
726
+ "alg_a":"sandwich",
727
+ "alg_b":"sdp",
728
+ "n_common":121,
729
+ "n_nonzero":121,
730
+ "wins_a":83,
731
+ "wins_b":38,
732
+ "ties":0,
733
+ "win_rate_a_over_b":0.6859504132,
734
+ "mean_diff_a_minus_b":0.046397133,
735
+ "median_diff_a_minus_b":0.0207032859,
736
+ "W_stat":1530.0,
737
+ "p_two_sided":0.0000000231,
738
+ "z_equiv":5.5870638516,
739
+ "effect_size_r":0.5079148956,
740
+ "p_holm_global":0.000000739,
741
+ "p_holm_within_metric":0.0000001617
742
+ },
743
+ {
744
+ "metric":"mean_cert_acc_36",
745
+ "alg_a":"ldlt",
746
+ "alg_b":"ortho",
747
+ "n_common":121,
748
+ "n_nonzero":121,
749
+ "wins_a":48,
750
+ "wins_b":73,
751
+ "ties":0,
752
+ "win_rate_a_over_b":0.3966942149,
753
+ "mean_diff_a_minus_b":-0.0773133535,
754
+ "median_diff_a_minus_b":-0.0200195611,
755
+ "W_stat":1957.0,
756
+ "p_two_sided":0.0000073745,
757
+ "z_equiv":-4.4825840995,
758
+ "effect_size_r":0.4075076454,
759
+ "p_holm_global":0.000176987,
760
+ "p_holm_within_metric":0.0000442467
761
+ },
762
+ {
763
+ "metric":"mean_cert_acc_36",
764
+ "alg_a":"ldlt",
765
+ "alg_b":"sdp",
766
+ "n_common":121,
767
+ "n_nonzero":120,
768
+ "wins_a":47,
769
+ "wins_b":73,
770
+ "ties":1,
771
+ "win_rate_a_over_b":0.3925619835,
772
+ "mean_diff_a_minus_b":-0.0629647383,
773
+ "median_diff_a_minus_b":-0.0085342675,
774
+ "W_stat":2014.0,
775
+ "p_two_sided":0.0000232877,
776
+ "z_equiv":-4.230784844,
777
+ "effect_size_r":0.3862160492,
778
+ "p_holm_global":0.0004424669,
779
+ "p_holm_within_metric":0.0001164387
780
+ },
781
+ {
782
+ "metric":"mean_cert_acc_36",
783
+ "alg_a":"ldlt-resnet",
784
+ "alg_b":"sdp",
785
+ "n_common":121,
786
+ "n_nonzero":119,
787
+ "wins_a":76,
788
+ "wins_b":43,
789
+ "ties":2,
790
+ "win_rate_a_over_b":0.6363636364,
791
+ "mean_diff_a_minus_b":0.0223092901,
792
+ "median_diff_a_minus_b":0.0094590336,
793
+ "W_stat":2285.0,
794
+ "p_two_sided":0.0006586154,
795
+ "z_equiv":3.4062512207,
796
+ "effect_size_r":0.3122505375,
797
+ "p_holm_global":0.0092206162,
798
+ "p_holm_within_metric":0.0026344618
799
+ },
800
+ {
801
+ "metric":"mean_cert_acc_36",
802
+ "alg_a":"ldlt-resnet",
803
+ "alg_b":"sandwich",
804
+ "n_common":121,
805
+ "n_nonzero":121,
806
+ "wins_a":44,
807
+ "wins_b":77,
808
+ "ties":0,
809
+ "win_rate_a_over_b":0.3636363636,
810
+ "mean_diff_a_minus_b":-0.0240878429,
811
+ "median_diff_a_minus_b":-0.0088888556,
812
+ "W_stat":2466.0,
813
+ "p_two_sided":0.0015454858,
814
+ "z_equiv":-3.1660041731,
815
+ "effect_size_r":0.2878185612,
816
+ "p_holm_global":0.0170003434,
817
+ "p_holm_within_metric":0.0046364573
818
+ },
819
+ {
820
+ "metric":"mean_cert_acc_36",
821
+ "alg_a":"ldlt-resnet",
822
+ "alg_b":"ortho",
823
+ "n_common":121,
824
+ "n_nonzero":120,
825
+ "wins_a":78,
826
+ "wins_b":42,
827
+ "ties":1,
828
+ "win_rate_a_over_b":0.6487603306,
829
+ "mean_diff_a_minus_b":0.0079606749,
830
+ "median_diff_a_minus_b":0.0084358044,
831
+ "W_stat":2756.0,
832
+ "p_two_sided":0.0221618659,
833
+ "z_equiv":2.2875821585,
834
+ "effect_size_r":0.2088267251,
835
+ "p_holm_global":0.1994567929,
836
+ "p_holm_within_metric":0.0443237318
837
+ },
838
+ {
839
+ "metric":"mean_cert_acc_36",
840
+ "alg_a":"ortho",
841
+ "alg_b":"sdp",
842
+ "n_common":121,
843
+ "n_nonzero":120,
844
+ "wins_a":60,
845
+ "wins_b":60,
846
+ "ties":1,
847
+ "win_rate_a_over_b":0.5,
848
+ "mean_diff_a_minus_b":0.0143486152,
849
+ "median_diff_a_minus_b":0.0,
850
+ "W_stat":2916.5,
851
+ "p_two_sided":0.0618660605,
852
+ "z_equiv":1.8672544684,
853
+ "effect_size_r":0.1704562322,
854
+ "p_holm_global":0.4949284838,
855
+ "p_holm_within_metric":0.0618660605
856
+ },
857
+ {
858
+ "metric":"mean_cert_acc_72",
859
+ "alg_a":"aol",
860
+ "alg_b":"sandwich",
861
+ "n_common":121,
862
+ "n_nonzero":120,
863
+ "wins_a":6,
864
+ "wins_b":114,
865
+ "ties":1,
866
+ "win_rate_a_over_b":0.0537190083,
867
+ "mean_diff_a_minus_b":-0.2997736487,
868
+ "median_diff_a_minus_b":-0.2722690813,
869
+ "W_stat":58.0,
870
+ "p_two_sided":8.496209444e-21,
871
+ "z_equiv":-9.3532909893,
872
+ "effect_size_r":0.8538347436,
873
+ "p_holm_global":5.862384516e-19,
874
+ "p_holm_within_metric":1.274431417e-19
875
+ },
876
+ {
877
+ "metric":"mean_cert_acc_72",
878
+ "alg_a":"aol",
879
+ "alg_b":"sdp",
880
+ "n_common":121,
881
+ "n_nonzero":119,
882
+ "wins_a":3,
883
+ "wins_b":116,
884
+ "ties":2,
885
+ "win_rate_a_over_b":0.0330578512,
886
+ "mean_diff_a_minus_b":-0.2336338337,
887
+ "median_diff_a_minus_b":-0.1966586188,
888
+ "W_stat":59.0,
889
+ "p_two_sided":1.288200158e-20,
890
+ "z_equiv":-9.3091824916,
891
+ "effect_size_r":0.8533713599,
892
+ "p_holm_global":8.63094106e-19,
893
+ "p_holm_within_metric":1.803480222e-19
894
+ },
895
+ {
896
+ "metric":"mean_cert_acc_72",
897
+ "alg_a":"aol",
898
+ "alg_b":"ldlt-resnet",
899
+ "n_common":121,
900
+ "n_nonzero":121,
901
+ "wins_a":5,
902
+ "wins_b":116,
903
+ "ties":0,
904
+ "win_rate_a_over_b":0.041322314,
905
+ "mean_diff_a_minus_b":-0.2667177943,
906
+ "median_diff_a_minus_b":-0.2325268835,
907
+ "W_stat":103.0,
908
+ "p_two_sided":1.72451088e-20,
909
+ "z_equiv":-9.2781472388,
910
+ "effect_size_r":0.8434679308,
911
+ "p_holm_global":1.138177181e-18,
912
+ "p_holm_within_metric":2.241864144e-19
913
+ },
914
+ {
915
+ "metric":"mean_cert_acc_72",
916
+ "alg_a":"aol",
917
+ "alg_b":"ortho",
918
+ "n_common":121,
919
+ "n_nonzero":121,
920
+ "wins_a":8,
921
+ "wins_b":113,
922
+ "ties":0,
923
+ "win_rate_a_over_b":0.0661157025,
924
+ "mean_diff_a_minus_b":-0.2485917487,
925
+ "median_diff_a_minus_b":-0.2084712535,
926
+ "W_stat":149.0,
927
+ "p_two_sided":5.23011637e-20,
928
+ "z_equiv":-9.1591634716,
929
+ "effect_size_r":0.8326512247,
930
+ "p_holm_global":3.347274477e-18,
931
+ "p_holm_within_metric":6.276139644e-19
932
+ },
933
+ {
934
+ "metric":"mean_cert_acc_72",
935
+ "alg_a":"aol",
936
+ "alg_b":"ldlt",
937
+ "n_common":121,
938
+ "n_nonzero":118,
939
+ "wins_a":16,
940
+ "wins_b":102,
941
+ "ties":3,
942
+ "win_rate_a_over_b":0.1446280992,
943
+ "mean_diff_a_minus_b":-0.1650780078,
944
+ "median_diff_a_minus_b":-0.1154970769,
945
+ "W_stat":460.5,
946
+ "p_two_sided":2.627903656e-16,
947
+ "z_equiv":-8.1892814443,
948
+ "effect_size_r":0.7538844636,
949
+ "p_holm_global":0.0,
950
+ "p_holm_within_metric":0.0
951
+ },
952
+ {
953
+ "metric":"mean_cert_acc_72",
954
+ "alg_a":"ldlt",
955
+ "alg_b":"sandwich",
956
+ "n_common":121,
957
+ "n_nonzero":121,
958
+ "wins_a":21,
959
+ "wins_b":100,
960
+ "ties":0,
961
+ "win_rate_a_over_b":0.173553719,
962
+ "mean_diff_a_minus_b":-0.1346956409,
963
+ "median_diff_a_minus_b":-0.0748069138,
964
+ "W_stat":670.0,
965
+ "p_two_sided":0.0,
966
+ "z_equiv":-7.8115462442,
967
+ "effect_size_r":0.7101405677,
968
+ "p_holm_global":0.0,
969
+ "p_holm_within_metric":0.0
970
+ },
971
+ {
972
+ "metric":"mean_cert_acc_72",
973
+ "alg_a":"ortho",
974
+ "alg_b":"sandwich",
975
+ "n_common":121,
976
+ "n_nonzero":121,
977
+ "wins_a":18,
978
+ "wins_b":103,
979
+ "ties":0,
980
+ "win_rate_a_over_b":0.1487603306,
981
+ "mean_diff_a_minus_b":-0.0511819,
982
+ "median_diff_a_minus_b":-0.0369775556,
983
+ "W_stat":697.5,
984
+ "p_two_sided":0.0,
985
+ "z_equiv":-7.7404146145,
986
+ "effect_size_r":0.7036740559,
987
+ "p_holm_global":0.0,
988
+ "p_holm_within_metric":0.0
989
+ },
990
+ {
991
+ "metric":"mean_cert_acc_72",
992
+ "alg_a":"sandwich",
993
+ "alg_b":"sdp",
994
+ "n_common":121,
995
+ "n_nonzero":119,
996
+ "wins_a":91,
997
+ "wins_b":28,
998
+ "ties":2,
999
+ "win_rate_a_over_b":0.7603305785,
1000
+ "mean_diff_a_minus_b":0.066139815,
1001
+ "median_diff_a_minus_b":0.0395776592,
1002
+ "W_stat":823.0,
1003
+ "p_two_sided":0.0,
1004
+ "z_equiv":7.2831988928,
1005
+ "effect_size_r":0.6676497479,
1006
+ "p_holm_global":0.0,
1007
+ "p_holm_within_metric":0.0
1008
+ },
1009
+ {
1010
+ "metric":"mean_cert_acc_72",
1011
+ "alg_a":"ldlt",
1012
+ "alg_b":"ldlt-resnet",
1013
+ "n_common":121,
1014
+ "n_nonzero":120,
1015
+ "wins_a":30,
1016
+ "wins_b":90,
1017
+ "ties":1,
1018
+ "win_rate_a_over_b":0.2520661157,
1019
+ "mean_diff_a_minus_b":-0.1016397865,
1020
+ "median_diff_a_minus_b":-0.0625369996,
1021
+ "W_stat":988.0,
1022
+ "p_two_sided":0.0,
1023
+ "z_equiv":-6.9177427266,
1024
+ "effect_size_r":0.6315006231,
1025
+ "p_holm_global":0.0000000002,
1026
+ "p_holm_within_metric":0.0
1027
+ },
1028
+ {
1029
+ "metric":"mean_cert_acc_72",
1030
+ "alg_a":"ldlt",
1031
+ "alg_b":"sdp",
1032
+ "n_common":121,
1033
+ "n_nonzero":121,
1034
+ "wins_a":42,
1035
+ "wins_b":79,
1036
+ "ties":0,
1037
+ "win_rate_a_over_b":0.347107438,
1038
+ "mean_diff_a_minus_b":-0.0685558259,
1039
+ "median_diff_a_minus_b":-0.0231065899,
1040
+ "W_stat":1813.0,
1041
+ "p_two_sided":0.0000012035,
1042
+ "z_equiv":-4.8550570531,
1043
+ "effect_size_r":0.441368823,
1044
+ "p_holm_global":0.0000312915,
1045
+ "p_holm_within_metric":0.0000072211
1046
+ },
1047
+ {
1048
+ "metric":"mean_cert_acc_72",
1049
+ "alg_a":"ldlt",
1050
+ "alg_b":"ortho",
1051
+ "n_common":121,
1052
+ "n_nonzero":121,
1053
+ "wins_a":44,
1054
+ "wins_b":77,
1055
+ "ties":0,
1056
+ "win_rate_a_over_b":0.3636363636,
1057
+ "mean_diff_a_minus_b":-0.0835137409,
1058
+ "median_diff_a_minus_b":-0.0192150771,
1059
+ "W_stat":1857.0,
1060
+ "p_two_sided":0.0000021241,
1061
+ "z_equiv":-4.741244463,
1062
+ "effect_size_r":0.4310222239,
1063
+ "p_holm_global":0.0000531024,
1064
+ "p_holm_within_metric":0.0000106205
1065
+ },
1066
+ {
1067
+ "metric":"mean_cert_acc_72",
1068
+ "alg_a":"ldlt-resnet",
1069
+ "alg_b":"sdp",
1070
+ "n_common":121,
1071
+ "n_nonzero":120,
1072
+ "wins_a":79,
1073
+ "wins_b":41,
1074
+ "ties":1,
1075
+ "win_rate_a_over_b":0.6570247934,
1076
+ "mean_diff_a_minus_b":0.0330839606,
1077
+ "median_diff_a_minus_b":0.015625,
1078
+ "W_stat":1982.5,
1079
+ "p_two_sided":0.0000160851,
1080
+ "z_equiv":4.313279256,
1081
+ "effect_size_r":0.3937467242,
1082
+ "p_holm_global":0.0003538716,
1083
+ "p_holm_within_metric":0.0000643403
1084
+ },
1085
+ {
1086
+ "metric":"mean_cert_acc_72",
1087
+ "alg_a":"ldlt-resnet",
1088
+ "alg_b":"sandwich",
1089
+ "n_common":121,
1090
+ "n_nonzero":121,
1091
+ "wins_a":44,
1092
+ "wins_b":77,
1093
+ "ties":0,
1094
+ "win_rate_a_over_b":0.3636363636,
1095
+ "mean_diff_a_minus_b":-0.0330558544,
1096
+ "median_diff_a_minus_b":-0.0237561315,
1097
+ "W_stat":2090.5,
1098
+ "p_two_sided":0.0000351456,
1099
+ "z_equiv":-4.1372742442,
1100
+ "effect_size_r":0.3761158404,
1101
+ "p_holm_global":0.0006326207,
1102
+ "p_holm_within_metric":0.0001054368
1103
+ },
1104
+ {
1105
+ "metric":"mean_cert_acc_72",
1106
+ "alg_a":"ldlt-resnet",
1107
+ "alg_b":"ortho",
1108
+ "n_common":121,
1109
+ "n_nonzero":119,
1110
+ "wins_a":77,
1111
+ "wins_b":42,
1112
+ "ties":2,
1113
+ "win_rate_a_over_b":0.6446280992,
1114
+ "mean_diff_a_minus_b":0.0181260456,
1115
+ "median_diff_a_minus_b":0.0105711035,
1116
+ "W_stat":2346.0,
1117
+ "p_two_sided":0.0011766084,
1118
+ "z_equiv":3.2444907502,
1119
+ "effect_size_r":0.2974219794,
1120
+ "p_holm_global":0.015295909,
1121
+ "p_holm_within_metric":0.0023532168
1122
+ },
1123
+ {
1124
+ "metric":"mean_cert_acc_72",
1125
+ "alg_a":"ortho",
1126
+ "alg_b":"sdp",
1127
+ "n_common":121,
1128
+ "n_nonzero":120,
1129
+ "wins_a":61,
1130
+ "wins_b":59,
1131
+ "ties":1,
1132
+ "win_rate_a_over_b":0.5082644628,
1133
+ "mean_diff_a_minus_b":0.014957915,
1134
+ "median_diff_a_minus_b":0.0001711249,
1135
+ "W_stat":3188.0,
1136
+ "p_two_sided":0.2475868026,
1137
+ "z_equiv":1.1562307075,
1138
+ "effect_size_r":0.10554894,
1139
+ "p_holm_global":0.9903472104,
1140
+ "p_holm_within_metric":0.2475868026
1141
+ },
1142
+ {
1143
+ "metric":"mean_test_acc",
1144
+ "alg_a":"aol",
1145
+ "alg_b":"ldlt",
1146
+ "n_common":121,
1147
+ "n_nonzero":121,
1148
+ "wins_a":16,
1149
+ "wins_b":105,
1150
+ "ties":0,
1151
+ "win_rate_a_over_b":0.132231405,
1152
+ "mean_diff_a_minus_b":-0.0928145234,
1153
+ "median_diff_a_minus_b":-0.0567989122,
1154
+ "W_stat":412.0,
1155
+ "p_two_sided":2.273589155e-17,
1156
+ "z_equiv":-8.4788867156,
1157
+ "effect_size_r":0.7708078832,
1158
+ "p_holm_global":0.0,
1159
+ "p_holm_within_metric":3.410383732e-16
1160
+ },
1161
+ {
1162
+ "metric":"mean_test_acc",
1163
+ "alg_a":"aol",
1164
+ "alg_b":"sandwich",
1165
+ "n_common":121,
1166
+ "n_nonzero":121,
1167
+ "wins_a":18,
1168
+ "wins_b":103,
1169
+ "ties":0,
1170
+ "win_rate_a_over_b":0.1487603306,
1171
+ "mean_diff_a_minus_b":-0.0920325933,
1172
+ "median_diff_a_minus_b":-0.0594664378,
1173
+ "W_stat":518.0,
1174
+ "p_two_sided":2.311544437e-16,
1175
+ "z_equiv":-8.2047067302,
1176
+ "effect_size_r":0.74588243,
1177
+ "p_holm_global":0.0,
1178
+ "p_holm_within_metric":0.0
1179
+ },
1180
+ {
1181
+ "metric":"mean_test_acc",
1182
+ "alg_a":"aol",
1183
+ "alg_b":"sdp",
1184
+ "n_common":121,
1185
+ "n_nonzero":121,
1186
+ "wins_a":22,
1187
+ "wins_b":99,
1188
+ "ties":0,
1189
+ "win_rate_a_over_b":0.1818181818,
1190
+ "mean_diff_a_minus_b":-0.0683567538,
1191
+ "median_diff_a_minus_b":-0.0351344055,
1192
+ "W_stat":806.0,
1193
+ "p_two_sided":0.0,
1194
+ "z_equiv":-7.4597648834,
1195
+ "effect_size_r":0.6781604439,
1196
+ "p_holm_global":0.0,
1197
+ "p_holm_within_metric":0.0
1198
+ },
1199
+ {
1200
+ "metric":"mean_test_acc",
1201
+ "alg_a":"aol",
1202
+ "alg_b":"ortho",
1203
+ "n_common":121,
1204
+ "n_nonzero":121,
1205
+ "wins_a":27,
1206
+ "wins_b":94,
1207
+ "ties":0,
1208
+ "win_rate_a_over_b":0.2231404959,
1209
+ "mean_diff_a_minus_b":-0.0674542894,
1210
+ "median_diff_a_minus_b":-0.0264984947,
1211
+ "W_stat":971.0,
1212
+ "p_two_sided":0.0,
1213
+ "z_equiv":-7.0329752836,
1214
+ "effect_size_r":0.6393613894,
1215
+ "p_holm_global":0.0000000001,
1216
+ "p_holm_within_metric":0.0
1217
+ },
1218
+ {
1219
+ "metric":"mean_test_acc",
1220
+ "alg_a":"aol",
1221
+ "alg_b":"ldlt-resnet",
1222
+ "n_common":121,
1223
+ "n_nonzero":121,
1224
+ "wins_a":25,
1225
+ "wins_b":96,
1226
+ "ties":0,
1227
+ "win_rate_a_over_b":0.2066115702,
1228
+ "mean_diff_a_minus_b":-0.0727332781,
1229
+ "median_diff_a_minus_b":-0.0313389237,
1230
+ "W_stat":1013.0,
1231
+ "p_two_sided":0.0,
1232
+ "z_equiv":-6.9243379309,
1233
+ "effect_size_r":0.6294852664,
1234
+ "p_holm_global":0.0000000002,
1235
+ "p_holm_within_metric":0.0
1236
+ },
1237
+ {
1238
+ "metric":"mean_test_acc",
1239
+ "alg_a":"ortho",
1240
+ "alg_b":"sandwich",
1241
+ "n_common":121,
1242
+ "n_nonzero":120,
1243
+ "wins_a":31,
1244
+ "wins_b":89,
1245
+ "ties":1,
1246
+ "win_rate_a_over_b":0.2603305785,
1247
+ "mean_diff_a_minus_b":-0.0245783039,
1248
+ "median_diff_a_minus_b":-0.0125617273,
1249
+ "W_stat":1269.0,
1250
+ "p_two_sided":0.0000000006,
1251
+ "z_equiv":-6.1818405096,
1252
+ "effect_size_r":0.564322249,
1253
+ "p_holm_global":0.0000000234,
1254
+ "p_holm_within_metric":0.0000000063
1255
+ },
1256
+ {
1257
+ "metric":"mean_test_acc",
1258
+ "alg_a":"ldlt",
1259
+ "alg_b":"ortho",
1260
+ "n_common":121,
1261
+ "n_nonzero":121,
1262
+ "wins_a":94,
1263
+ "wins_b":27,
1264
+ "ties":0,
1265
+ "win_rate_a_over_b":0.7768595041,
1266
+ "mean_diff_a_minus_b":0.025360234,
1267
+ "median_diff_a_minus_b":0.013893891,
1268
+ "W_stat":1309.0,
1269
+ "p_two_sided":0.0000000007,
1270
+ "z_equiv":6.158703255,
1271
+ "effect_size_r":0.5598821141,
1272
+ "p_holm_global":0.0000000264,
1273
+ "p_holm_within_metric":0.0000000066
1274
+ },
1275
+ {
1276
+ "metric":"mean_test_acc",
1277
+ "alg_a":"ldlt",
1278
+ "alg_b":"sdp",
1279
+ "n_common":121,
1280
+ "n_nonzero":121,
1281
+ "wins_a":86,
1282
+ "wins_b":35,
1283
+ "ties":0,
1284
+ "win_rate_a_over_b":0.7107438017,
1285
+ "mean_diff_a_minus_b":0.0244577696,
1286
+ "median_diff_a_minus_b":0.0110695032,
1287
+ "W_stat":1503.0,
1288
+ "p_two_sided":0.0000000154,
1289
+ "z_equiv":5.6569021498,
1290
+ "effect_size_r":0.5142638318,
1291
+ "p_holm_global":0.0000005086,
1292
+ "p_holm_within_metric":0.0000001233
1293
+ },
1294
+ {
1295
+ "metric":"mean_test_acc",
1296
+ "alg_a":"ldlt",
1297
+ "alg_b":"ldlt-resnet",
1298
+ "n_common":121,
1299
+ "n_nonzero":120,
1300
+ "wins_a":87,
1301
+ "wins_b":33,
1302
+ "ties":1,
1303
+ "win_rate_a_over_b":0.7231404959,
1304
+ "mean_diff_a_minus_b":0.0200812453,
1305
+ "median_diff_a_minus_b":0.0108439309,
1306
+ "W_stat":1689.0,
1307
+ "p_two_sided":0.0000003736,
1308
+ "z_equiv":5.0819154878,
1309
+ "effect_size_r":0.4639132913,
1310
+ "p_holm_global":0.0000112094,
1311
+ "p_holm_within_metric":0.0000026155
1312
+ },
1313
+ {
1314
+ "metric":"mean_test_acc",
1315
+ "alg_a":"sandwich",
1316
+ "alg_b":"sdp",
1317
+ "n_common":121,
1318
+ "n_nonzero":121,
1319
+ "wins_a":83,
1320
+ "wins_b":38,
1321
+ "ties":0,
1322
+ "win_rate_a_over_b":0.6859504132,
1323
+ "mean_diff_a_minus_b":0.0236758395,
1324
+ "median_diff_a_minus_b":0.0089801928,
1325
+ "W_stat":1789.0,
1326
+ "p_two_sided":0.0000008782,
1327
+ "z_equiv":4.9171335102,
1328
+ "effect_size_r":0.4470121373,
1329
+ "p_holm_global":0.0000237116,
1330
+ "p_holm_within_metric":0.0000052692
1331
+ },
1332
+ {
1333
+ "metric":"mean_test_acc",
1334
+ "alg_a":"ldlt-resnet",
1335
+ "alg_b":"sandwich",
1336
+ "n_common":121,
1337
+ "n_nonzero":121,
1338
+ "wins_a":43,
1339
+ "wins_b":78,
1340
+ "ties":0,
1341
+ "win_rate_a_over_b":0.3553719008,
1342
+ "mean_diff_a_minus_b":-0.0192993151,
1343
+ "median_diff_a_minus_b":-0.0067946254,
1344
+ "W_stat":2364.0,
1345
+ "p_two_sided":0.0006039452,
1346
+ "z_equiv":-3.42983642,
1347
+ "effect_size_r":0.3118033109,
1348
+ "p_holm_global":0.0090591784,
1349
+ "p_holm_within_metric":0.0030197261
1350
+ },
1351
+ {
1352
+ "metric":"mean_test_acc",
1353
+ "alg_a":"ldlt-resnet",
1354
+ "alg_b":"sdp",
1355
+ "n_common":121,
1356
+ "n_nonzero":120,
1357
+ "wins_a":66,
1358
+ "wins_b":54,
1359
+ "ties":1,
1360
+ "win_rate_a_over_b":0.5495867769,
1361
+ "mean_diff_a_minus_b":0.0043765243,
1362
+ "median_diff_a_minus_b":0.0019017287,
1363
+ "W_stat":3070.0,
1364
+ "p_two_sided":0.1428507422,
1365
+ "z_equiv":1.4652572612,
1366
+ "effect_size_r":0.1337590758,
1367
+ "p_holm_global":0.8571044533,
1368
+ "p_holm_within_metric":0.5714029689
1369
+ },
1370
+ {
1371
+ "metric":"mean_test_acc",
1372
+ "alg_a":"ldlt-resnet",
1373
+ "alg_b":"ortho",
1374
+ "n_common":121,
1375
+ "n_nonzero":121,
1376
+ "wins_a":71,
1377
+ "wins_b":50,
1378
+ "ties":0,
1379
+ "win_rate_a_over_b":0.5867768595,
1380
+ "mean_diff_a_minus_b":0.0052789887,
1381
+ "median_diff_a_minus_b":0.002452642,
1382
+ "W_stat":3138.0,
1383
+ "p_two_sided":0.1533479338,
1384
+ "z_equiv":1.4278052065,
1385
+ "effect_size_r":0.1298004733,
1386
+ "p_holm_global":0.8571044533,
1387
+ "p_holm_within_metric":0.5714029689
1388
+ },
1389
+ {
1390
+ "metric":"mean_test_acc",
1391
+ "alg_a":"ortho",
1392
+ "alg_b":"sdp",
1393
+ "n_common":121,
1394
+ "n_nonzero":121,
1395
+ "wins_a":60,
1396
+ "wins_b":61,
1397
+ "ties":0,
1398
+ "win_rate_a_over_b":0.4958677686,
1399
+ "mean_diff_a_minus_b":-0.0009024644,
1400
+ "median_diff_a_minus_b":-0.0003659998,
1401
+ "W_stat":3623.0,
1402
+ "p_two_sided":0.8624137031,
1403
+ "z_equiv":-0.1733024435,
1404
+ "effect_size_r":0.0157547676,
1405
+ "p_holm_global":1.0,
1406
+ "p_holm_within_metric":1.0
1407
+ },
1408
+ {
1409
+ "metric":"mean_test_acc",
1410
+ "alg_a":"ldlt",
1411
+ "alg_b":"sandwich",
1412
+ "n_common":121,
1413
+ "n_nonzero":121,
1414
+ "wins_a":59,
1415
+ "wins_b":62,
1416
+ "ties":0,
1417
+ "win_rate_a_over_b":0.4876033058,
1418
+ "mean_diff_a_minus_b":0.0007819301,
1419
+ "median_diff_a_minus_b":-0.0001641521,
1420
+ "W_stat":3624.0,
1421
+ "p_two_sided":0.8644472072,
1422
+ "z_equiv":0.1707158399,
1423
+ "effect_size_r":0.0155196218,
1424
+ "p_holm_global":1.0,
1425
+ "p_holm_within_metric":1.0
1426
+ }
1427
+ ]
UCI_N4/wilcoxon_prep_all.json ADDED
The diff for this file is too large to render. See raw diff
 
UCI_N6/jmlr_tables.tex ADDED
@@ -0,0 +1,469 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ % JMLR-ready tables for two-column papers
2
+ % Required packages (no siunitx):
3
+ % \usepackage{booktabs}
4
+ % \usepackage{threeparttable}
5
+ % \usepackage{threeparttablex} % for TableNotes + longtable
6
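+ % \usepackage{longtable}
+ % \usepackage{xcolor} % \textcolor in the pairwise-outcome tables
+ % \usepackage{amssymb} % \blacktriangle, \blacktriangledown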
7
+ % Optional for landscape: \usepackage{pdflscape}
8
+
9
+ \begin{table*}[t]
10
+ \centering
11
+ \begin{threeparttable}
12
+ \caption{Model dimension ranges (min--max across all datasets and folds). Input and output dimensions follow each dataset's feature and label spaces, respectively.}
13
+ \label{tab:model-ranges}
14
+ \begin{tabular}{l r r r r r r}
15
+ \toprule
16
+ Algorithm & Width & Depth & Parameters & Padding & Input dim & Output dim \\
17
+ \midrule
18
+ AOL & 32--512 & 6--6 & 502--1245037 & 10--524 & 3--262 & 2--100 \\
19
+ Orthogonal & 32--512 & 6--6 & 507--1245042 & 10--524 & 3--262 & 2--100 \\
20
+ Sandwich & 32--512 & 6--6 & 1057--2620542 & 10--524 & 3--262 & 2--100 \\
21
+ SLL & 32--512 & 6--6 & 2326--1622697 & 10--524 & 3--262 & 2--100 \\
22
+ LDLT-L & 32--512 & 6--6 & 5480--1454611 & 10--524 & 3--262 & 2--100 \\
23
+ LDLT-R & 32--512 & 6--6 & 5577--1588756 & 10--524 & 3--262 & 2--100 \\
24
+ \bottomrule
25
+ \end{tabular}
26
+ \end{threeparttable}
27
+ \end{table*}
28
+
29
+ \begin{table*}[t]
30
+ \centering
31
+ \begin{threeparttable}
32
+ \caption{Mean$\pm$std across $N$ datasets for each algorithm; the best mean in each column is shown in bold.}
33
+ \label{tab:metric_summary}
34
+ \begin{tabular}{l r lllll}
35
+ \toprule
36
+ & & & \multicolumn{4}{c}{Certified Accuracy} \\
37
+ \cmidrule(lr){4-7}
38
+ Algorithm & $N$ & Accuracy & 36/255 & 72/255 & 108/255 & 255/255 \\
39
+ \midrule
40
+ AOL & 121 & 0.6049\,\tiny$\pm$0.2396 & 0.2918\,\tiny$\pm$0.3122 & 0.2161\,\tiny$\pm$0.2949 & 0.1740\,\tiny$\pm$0.2722 & 0.0837\,\tiny$\pm$0.1782 \\
41
+ Orthogonal & 121 & 0.7036\,\tiny$\pm$0.1911 & 0.6071\,\tiny$\pm$0.2396 & 0.5068\,\tiny$\pm$0.2668 & 0.4233\,\tiny$\pm$0.2781 & 0.1983\,\tiny$\pm$0.2361 \\
42
+ Sandwich & 121 & 0.7163\,\tiny$\pm$0.1879 & \textbf{0.6284\,\tiny$\pm$0.2414} & \textbf{0.5525\,\tiny$\pm$0.2633} & \textbf{0.4743\,\tiny$\pm$0.2773} & \textbf{0.2476\,\tiny$\pm$0.2509} \\
43
+ SLL & 121 & 0.7011\,\tiny$\pm$0.1939 & 0.5866\,\tiny$\pm$0.2459 & 0.4810\,\tiny$\pm$0.2741 & 0.3932\,\tiny$\pm$0.2829 & 0.1882\,\tiny$\pm$0.2325 \\
44
+ \midrule
45
+ LDLT-L & 121 & \textbf{0.7245\,\tiny$\pm$0.1908} & 0.4665\,\tiny$\pm$0.3341 & 0.3863\,\tiny$\pm$0.3235 & 0.3226\,\tiny$\pm$0.3084 & 0.1562\,\tiny$\pm$0.2269 \\
46
+ LDLT-R & 121 & 0.6970\,\tiny$\pm$0.2021 & 0.6114\,\tiny$\pm$0.2325 & 0.5253\,\tiny$\pm$0.2552 & 0.4516\,\tiny$\pm$0.2645 & 0.2138\,\tiny$\pm$0.2275 \\
47
+ \bottomrule
48
+ \end{tabular}
49
+ \end{threeparttable}
50
+ \end{table*}
51
+
52
+ \begin{table}[t]
53
+ \centering
54
+ \begin{threeparttable}
55
+ {\small
56
+ \caption{Overall comparison on Mean Accuracy: average rank (lower is better) with Iman--Davenport $F=34.41$ ($\mathrm{df}=(5,\,600)$), $p=1.11\times10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
57
+ \label{tab:overall:mean_test_acc}
58
+ \setlength{\tabcolsep}{4pt}
59
+ \begin{tabular}{@{}l r r r r r r@{}}
60
+ \toprule
61
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
62
+ \midrule
63
+ LDLT-L & 2.525 & 4 & 0 & 4 & 0.800 & 0.533 \\
64
+ Sandwich & 2.773 & 4 & 0 & 4 & 0.800 & 0.421 \\
65
+ Orthogonal & 3.479 & 1 & 2 & -1 & 0.200 & 0.654 \\
66
+ SLL & 3.545 & 1 & 2 & -1 & 0.200 & 0.621 \\
67
+ LDLT-R & 3.628 & 1 & 2 & -1 & 0.200 & 0.560 \\
68
+ AOL & 5.050 & 0 & 5 & -5 & 0.000 & 0.000 \\
69
+ \bottomrule
70
+ \end{tabular}
71
+ }
72
+ \end{threeparttable}
73
+ \end{table}
74
+
75
+ \begin{table}[t]
76
+ \centering
77
+ \begin{threeparttable}
78
+ {\small
79
+ \caption{Overall comparison on Mean Certified Accuracy (36/255): average rank (lower is better) with Iman--Davenport $F=71.33$ ($\mathrm{df}=(5,\,600)$), $p=1.11\times10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
80
+ \label{tab:overall:mean_cert_acc_36}
81
+ \setlength{\tabcolsep}{4pt}
82
+ \begin{tabular}{@{}l r r r r r r@{}}
83
+ \toprule
84
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
85
+ \midrule
86
+ Sandwich & 2.380 & 4 & 0 & 4 & 0.800 & 0.574 \\
87
+ LDLT-R & 2.694 & 3 & 0 & 3 & 0.600 & 0.580 \\
88
+ SLL & 3.128 & 2 & 2 & 0 & 0.400 & 0.696 \\
89
+ Orthogonal & 3.252 & 2 & 1 & 1 & 0.400 & 0.671 \\
90
+ LDLT-L & 4.004 & 1 & 4 & -3 & 0.200 & 0.645 \\
91
+ AOL & 5.541 & 0 & 5 & -5 & 0.000 & 0.000 \\
92
+ \bottomrule
93
+ \end{tabular}
94
+ }
95
+ \end{threeparttable}
96
+ \end{table}
97
+
98
+ \begin{table}[t]
99
+ \centering
100
+ \begin{threeparttable}
101
+ {\small
102
+ \caption{Overall comparison on Mean Certified Accuracy (72/255): average rank (lower is better) with Iman--Davenport $F=111.54$ ($\mathrm{df}=(5,\,600)$), $p=1.11\times10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
103
+ \label{tab:overall:mean_cert_acc_72}
104
+ \setlength{\tabcolsep}{4pt}
105
+ \begin{tabular}{@{}l r r r r r r@{}}
106
+ \toprule
107
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
108
+ \midrule
109
+ Sandwich & 2.041 & 5 & 0 & 5 & 1.000 & 0.599 \\
110
+ LDLT-R & 2.562 & 4 & 1 & 3 & 0.800 & 0.540 \\
111
+ SLL & 3.260 & 2 & 2 & 0 & 0.400 & 0.729 \\
112
+ Orthogonal & 3.273 & 2 & 2 & 0 & 0.400 & 0.707 \\
113
+ LDLT-L & 4.153 & 1 & 4 & -3 & 0.200 & 0.776 \\
114
+ AOL & 5.711 & 0 & 5 & -5 & 0.000 & 0.000 \\
115
+ \bottomrule
116
+ \end{tabular}
117
+ }
118
+ \end{threeparttable}
119
+ \end{table}
120
+
121
+ \begin{table}[t]
122
+ \centering
123
+ \begin{threeparttable}
124
+ {\small
125
+ \caption{Overall comparison on Mean Certified Accuracy (108/255): average rank (lower is better) with Iman--Davenport $F=129.26$ ($\mathrm{df}=(5,\,600)$), $p=1.11\times10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
126
+ \label{tab:overall:mean_cert_acc_108}
127
+ \setlength{\tabcolsep}{4pt}
128
+ \begin{tabular}{@{}l r r r r r r@{}}
129
+ \toprule
130
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
131
+ \midrule
132
+ Sandwich & 2.083 & 4 & 0 & 4 & 0.800 & 0.704 \\
133
+ LDLT-R & 2.277 & 4 & 0 & 4 & 0.800 & 0.605 \\
134
+ Orthogonal & 3.248 & 3 & 2 & 1 & 0.600 & 0.546 \\
135
+ SLL & 3.430 & 2 & 3 & -1 & 0.400 & 0.702 \\
136
+ LDLT-L & 4.236 & 1 & 4 & -3 & 0.200 & 0.828 \\
137
+ AOL & 5.727 & 0 & 5 & -5 & 0.000 & 0.000 \\
138
+ \bottomrule
139
+ \end{tabular}
140
+ }
141
+ \end{threeparttable}
142
+ \end{table}
143
+
144
+ \begin{table}[t]
145
+ \centering
146
+ \begin{threeparttable}
147
+ {\small
148
+ \caption{Overall comparison on Mean Certified Accuracy (255/255): average rank (lower is better) with Iman--Davenport $F=91.19$ ($\mathrm{df}=(5,\,600)$), $p=1.11\times10^{-16}$; Nemenyi CD$=0.969$. Counts are significant wins/losses after Holm within-metric at $\alpha=0.05$.}
149
+ \label{tab:overall:mean_cert_acc_255}
150
+ \setlength{\tabcolsep}{4pt}
151
+ \begin{tabular}{@{}l r r r r r r@{}}
152
+ \toprule
153
+ Algorithm & \shortstack{Avg \\ rank} $\downarrow$ & \shortstack{sig \\ wins} & \shortstack{sig \\ losses} & \shortstack{net \\ wins} & \shortstack{win \\ share} & mean $r$ \\
154
+ \midrule
155
+ Sandwich & 2.037 & 5 & 0 & 5 & 1.000 & 0.652 \\
156
+ LDLT-R & 2.508 & 4 & 1 & 3 & 0.800 & 0.597 \\
157
+ SLL & 3.322 & 2 & 2 & 0 & 0.400 & 0.679 \\
158
+ Orthogonal & 3.459 & 2 & 2 & 0 & 0.400 & 0.653 \\
159
+ LDLT-L & 4.194 & 1 & 4 & -3 & 0.200 & 0.850 \\
160
+ AOL & 5.479 & 0 & 5 & -5 & 0.000 & 0.000 \\
161
+ \bottomrule
162
+ \end{tabular}
163
+ }
164
+ \end{threeparttable}
165
+ \end{table}
166
+
167
+ \begin{table}[t]
168
+ \centering
169
+ \begin{threeparttable}
170
+ {
171
+ \caption{Pairwise Wilcoxon outcomes for Mean Accuracy (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
172
+ \label{tab:signif:mean_test_acc}
173
+ \setlength{\tabcolsep}{3pt}
174
+ \begin{tabular}{@{}l c c c c c c @{}}
175
+ \toprule
176
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
177
+ \midrule
178
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
179
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
180
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
181
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
182
+ Sandwich & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
183
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
184
+ \bottomrule
185
+ \end{tabular}
186
+ }
187
+ \end{threeparttable}
188
+ \end{table}
189
+
190
+ \begin{table}[t]
191
+ \centering
192
+ \begin{threeparttable}
193
+ {
194
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (36/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
195
+ \label{tab:signif:mean_cert_acc_36}
196
+ \setlength{\tabcolsep}{3pt}
197
+ \begin{tabular}{@{}l c c c c c c @{}}
198
+ \toprule
199
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
200
+ \midrule
201
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
202
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
203
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & $\cdot$ & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
204
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
205
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
206
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
207
+ \bottomrule
208
+ \end{tabular}
209
+ }
210
+ \end{threeparttable}
211
+ \end{table}
212
+
213
+ \begin{table}[t]
214
+ \centering
215
+ \begin{threeparttable}
216
+ {
217
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (72/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
218
+ \label{tab:signif:mean_cert_acc_72}
219
+ \setlength{\tabcolsep}{3pt}
220
+ \begin{tabular}{@{}l c c c c c c @{}}
221
+ \toprule
222
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
223
+ \midrule
224
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
225
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
226
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
227
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
228
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
229
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
230
+ \bottomrule
231
+ \end{tabular}
232
+ }
233
+ \end{threeparttable}
234
+ \end{table}
235
+
236
+ \begin{table}[t]
237
+ \centering
238
+ \begin{threeparttable}
239
+ {
240
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (108/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
241
+ \label{tab:signif:mean_cert_acc_108}
242
+ \setlength{\tabcolsep}{3pt}
243
+ \begin{tabular}{@{}l c c c c c c @{}}
244
+ \toprule
245
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
246
+ \midrule
247
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
248
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
249
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
250
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
251
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
252
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
253
+ \bottomrule
254
+ \end{tabular}
255
+ }
256
+ \end{threeparttable}
257
+ \end{table}
258
+
259
+ \begin{table}[t]
260
+ \centering
261
+ \begin{threeparttable}
262
+ {
263
+ \caption{Pairwise Wilcoxon outcomes for Mean Certified Accuracy (255/255) (Holm within-metric at $\alpha=0.05$): row vs. column (\textcolor{green}{$\blacktriangle$} win, \textcolor{red}{$\blacktriangledown$} loss, $\cdot$ none).}
264
+ \label{tab:signif:mean_cert_acc_255}
265
+ \setlength{\tabcolsep}{3pt}
266
+ \begin{tabular}{@{}l c c c c c c @{}}
267
+ \toprule
268
+ & AOL & LDLT-L & LDLT-R & Orthogonal & Sandwich & SLL \\
269
+ \midrule
270
+ AOL & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
271
+ LDLT-L & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{red}{$\blacktriangledown$} \\
272
+ LDLT-R & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & \textcolor{green}{$\blacktriangle$} \\
273
+ Orthogonal & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
274
+ Sandwich & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & $\cdot$ & \textcolor{green}{$\blacktriangle$} \\
275
+ SLL & \textcolor{green}{$\blacktriangle$} & \textcolor{green}{$\blacktriangle$} & \textcolor{red}{$\blacktriangledown$} & $\cdot$ & \textcolor{red}{$\blacktriangledown$} & $\cdot$ \\
276
+ \bottomrule
277
+ \end{tabular}
278
+ }
279
+ \end{threeparttable}
280
+ \end{table}
281
+
282
+
283
+ \begin{table*}[t]
284
+ \centering
285
+ \begin{threeparttable}
286
+ \caption[Mean Accuracy]{Wilcoxon signed-rank tests (two-sided) for Mean Accuracy; $p$-values with Holm FWER corrections within-metric and global.}
287
+ \label{tab:wilcoxon:mean_test_acc}
288
+ \begingroup
289
+ \setlength{\tabcolsep}{4pt}
290
+ \begin{tabular}{ll r r r r r r r r r r r}
291
+ \toprule
292
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
293
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
294
+ \midrule
295
+ AOL & LDLT-L & 121 & 16 & 105 & 0 & 0.1322 & -0.0632 & 409 & $2.1e-17^{***}$ & $3.2e-16^{***}$ & $0^{***}$ & 0.7715 \\
296
+ AOL & Sandwich & 121 & 23 & 98 & 0 & 0.1901 & -0.0656 & 698 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.7036 \\
297
+ AOL & Orthogonal & 121 & 25 & 96 & 0 & 0.2066 & -0.0525 & 908 & $0^{***}$ & $0^{***}$ & $0^{***}$ & 0.6542 \\
298
+ AOL & SLL & 121 & 24 & 97 & 0 & 0.1983 & -0.0445 & 1047 & $0^{***}$ & $1.0e-10^{***}$ & $4.0e-10^{***}$ & 0.6215 \\
299
+ AOL & LDLT-R & 121 & 27 & 94 & 0 & 0.2231 & -0.0357 & 1307 & $7.0e-10^{***}$ & $7.8e-09^{***}$ & $2.4e-08^{***}$ & 0.5604 \\
300
+ LDLT-L & SLL & 121 & 86 & 35 & 0 & 0.7107 & 0.0103 & 1511 & $1.7e-08^{***}$ & $1.7e-07^{***}$ & $5.0e-07^{***}$ & 0.5124 \\
301
+ LDLT-L & LDLT-R & 121 & 87 & 34 & 0 & 0.7190 & 0.0125 & 1779 & $7.7e-07^{***}$ & $6.9e-06^{***}$ & $2.1e-05^{***}$ & 0.4494 \\
302
+ LDLT-L & Orthogonal & 121 & 78 & 43 & 0 & 0.6446 & 0.0104 & 2002 & $1.3e-05^{***}$ & $1.0e-04^{***}$ & $2.8e-04^{***}$ & 0.3969 \\
303
+ Orthogonal & Sandwich & 121 & 39 & 81 & 1 & 0.3264 & -0.0079 & 2171 & $1.3e-04^{***}$ & $9.4e-04^{***}$ & $2.5e-03^{**}$ & 0.3487 \\
304
+ Sandwich & SLL & 121 & 80 & 41 & 0 & 0.6612 & 0.0063 & 2279 & $2.6e-04^{***}$ & $1.6e-03^{**}$ & $4.5e-03^{**}$ & 0.3318 \\
305
+ LDLT-R & Sandwich & 121 & 47 & 74 & 0 & 0.3884 & -0.0101 & 2411 & $9.4e-04^{***}$ & $4.7e-03^{**}$ & $1.4e-02^{*}$ & 0.3008 \\
306
+ LDLT-L & Sandwich & 121 & 64 & 56 & 1 & 0.5331 & 0.0008 & 3145 & $2.0e-01$ & $8.2e-01$ & $1.0e+00$ & 0.1158 \\
307
+ LDLT-R & Orthogonal & 121 & 54 & 67 & 0 & 0.4463 & -0.0024 & 3206 & $2.1e-01$ & $8.2e-01$ & $1.0e+00$ & 0.1138 \\
308
+ Orthogonal & SLL & 121 & 60 & 61 & 0 & 0.4959 & -0.0000 & 3382 & $4.3e-01$ & $8.5e-01$ & $1.0e+00$ & 0.0724 \\
309
+ LDLT-R & SLL & 121 & 58 & 63 & 0 & 0.4793 & -0.0010 & 3627 & $8.7e-01$ & $8.7e-01$ & $1.0e+00$ & 0.0148 \\
310
+ \bottomrule
311
+ \end{tabular}
312
+ \begin{tablenotes}
313
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
314
+ \end{tablenotes}
315
+ \endgroup
316
+ \end{threeparttable}
317
+ \end{table*}
318
+
319
+
320
+
321
+ \begin{table*}[t]
322
+ \centering
323
+ \begin{threeparttable}
324
+ \caption[Mean Certified Accuracy (36/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (36/255); $p$-values with Holm FWER corrections within-metric and global.}
325
+ \label{tab:wilcoxon:mean_cert_acc_36}
326
+ \begingroup
327
+ \setlength{\tabcolsep}{4pt}
328
+ \begin{tabular}{ll r r r r r r r r r r r}
329
+ \toprule
330
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
331
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
332
+ \midrule
333
+ AOL & LDLT-R & 121 & 6 & 115 & 0 & 0.0496 & -0.2928 & 93 & $1.4e-20^{***}$ & $2.0e-19^{***}$ & $9.5e-19^{***}$ & 0.8458 \\
334
+ AOL & SLL & 121 & 7 & 114 & 0 & 0.0579 & -0.2868 & 156 & $6.2e-20^{***}$ & $8.7e-19^{***}$ & $4.1e-18^{***}$ & 0.8310 \\
335
+ AOL & Sandwich & 121 & 9 & 112 & 0 & 0.0744 & -0.3563 & 174 & $9.5e-20^{***}$ & $1.2e-18^{***}$ & $6.2e-18^{***}$ & 0.8268 \\
336
+ AOL & Orthogonal & 121 & 9 & 112 & 0 & 0.0744 & -0.2985 & 184 & $1.2e-19^{***}$ & $1.4e-18^{***}$ & $7.6e-18^{***}$ & 0.8245 \\
337
+ AOL & LDLT-L & 121 & 21 & 93 & 7 & 0.2025 & -0.1185 & 843 & $5.9e-12^{***}$ & $5.9e-11^{***}$ & $2.7e-10^{***}$ & 0.6445 \\
338
+ LDLT-L & Sandwich & 121 & 31 & 90 & 0 & 0.2562 & -0.0772 & 975 & $2.2e-12^{***}$ & $2.4e-11^{***}$ & $1.0e-10^{***}$ & 0.6384 \\
339
+ LDLT-L & LDLT-R & 121 & 36 & 85 & 0 & 0.2975 & -0.0605 & 1205 & $1.3e-10^{***}$ & $1.2e-09^{***}$ & $5.1e-09^{***}$ & 0.5843 \\
340
+ LDLT-L & SLL & 121 & 36 & 85 & 0 & 0.2975 & -0.0489 & 1305 & $6.9e-10^{***}$ & $5.5e-09^{***}$ & $2.4e-08^{***}$ & 0.5608 \\
341
+ LDLT-L & Orthogonal & 121 & 42 & 79 & 0 & 0.3471 & -0.0531 & 1489 & $1.2e-08^{***}$ & $8.7e-08^{***}$ & $3.7e-07^{***}$ & 0.5176 \\
342
+ Sandwich & SLL & 121 & 84 & 35 & 2 & 0.7025 & 0.0174 & 1683 & $5.7e-07^{***}$ & $3.4e-06^{***}$ & $1.6e-05^{***}$ & 0.4586 \\
343
+ Orthogonal & Sandwich & 121 & 38 & 82 & 1 & 0.3182 & -0.0130 & 2067 & $4.3e-05^{***}$ & $2.1e-04^{***}$ & $9.0e-04^{***}$ & 0.3735 \\
344
+ LDLT-R & SLL & 121 & 71 & 49 & 1 & 0.5909 & 0.0081 & 2331 & $6.7e-04^{***}$ & $2.7e-03^{**}$ & $1.1e-02^{*}$ & 0.3104 \\
345
+ LDLT-R & Sandwich & 121 & 52 & 68 & 1 & 0.4339 & -0.0088 & 2802 & $3.0e-02^{*}$ & $9.1e-02$ & $3.0e-01$ & 0.1978 \\
346
+ Orthogonal & SLL & 121 & 58 & 63 & 0 & 0.4793 & -0.0016 & 3123 & $1.4e-01$ & $2.8e-01$ & $1.0e+00$ & 0.1333 \\
347
+ LDLT-R & Orthogonal & 121 & 76 & 45 & 0 & 0.6281 & 0.0060 & 3225 & $2.3e-01$ & $2.8e-01$ & $1.0e+00$ & 0.1093 \\
348
+ \bottomrule
349
+ \end{tabular}
350
+ \begin{tablenotes}
351
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
352
+ \end{tablenotes}
353
+ \endgroup
354
+ \end{threeparttable}
355
+ \end{table*}
356
+
357
+
358
+
359
+ \begin{table*}[t]
360
+ \centering
361
+ \begin{threeparttable}
362
+ \caption[Mean Certified Accuracy (72/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (72/255); $p$-values with Holm FWER corrections within-metric and global.}
363
+ \label{tab:wilcoxon:mean_cert_acc_72}
364
+ \begingroup
365
+ \setlength{\tabcolsep}{4pt}
366
+ \begin{tabular}{ll r r r r r r r r r r r}
367
+ \toprule
368
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
369
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
370
+ \midrule
371
+ AOL & SLL & 121 & 1 & 118 & 2 & 0.0165 & -0.2343 & 2 & $3.1e-21^{***}$ & $4.3e-20^{***}$ & $2.3e-19^{***}$ & 0.8672 \\
372
+ AOL & LDLT-R & 121 & 1 & 120 & 0 & 0.0083 & -0.2920 & 21 & $2.3e-21^{***}$ & $3.5e-20^{***}$ & $1.7e-19^{***}$ & 0.8628 \\
373
+ AOL & Orthogonal & 121 & 6 & 115 & 0 & 0.0496 & -0.2589 & 86 & $1.2e-20^{***}$ & $1.5e-19^{***}$ & $8.3e-19^{***}$ & 0.8473 \\
374
+ AOL & Sandwich & 121 & 7 & 114 & 0 & 0.0579 & -0.3205 & 90 & $1.3e-20^{***}$ & $1.5e-19^{***}$ & $8.9e-19^{***}$ & 0.8465 \\
375
+ AOL & LDLT-L & 121 & 10 & 93 & 18 & 0.1570 & -0.1040 & 284 & $3.4e-15^{***}$ & $3.4e-14^{***}$ & $1.8e-13^{***}$ & 0.7759 \\
376
+ LDLT-L & Sandwich & 121 & 21 & 99 & 1 & 0.1777 & -0.0916 & 608 & $2.5e-15^{***}$ & $2.8e-14^{***}$ & $1.4e-13^{***}$ & 0.7223 \\
377
+ LDLT-L & LDLT-R & 121 & 30 & 91 & 0 & 0.2479 & -0.0704 & 922 & $8.1e-13^{***}$ & $7.3e-12^{***}$ & $3.9e-11^{***}$ & 0.6509 \\
378
+ Orthogonal & Sandwich & 121 & 19 & 99 & 3 & 0.1694 & -0.0301 & 1122 & $1.4e-10^{***}$ & $8.5e-10^{***}$ & $5.4e-09^{***}$ & 0.5905 \\
379
+ LDLT-L & SLL & 121 & 34 & 86 & 1 & 0.2851 & -0.0486 & 1161 & $1.0e-10^{***}$ & $7.8e-10^{***}$ & $4.1e-09^{***}$ & 0.5901 \\
380
+ Sandwich & SLL & 121 & 93 & 28 & 0 & 0.7686 & 0.0368 & 1188 & $9.7e-11^{***}$ & $7.8e-10^{***}$ & $4.0e-09^{***}$ & 0.5883 \\
381
+ LDLT-L & Orthogonal & 121 & 35 & 85 & 1 & 0.2934 & -0.0477 & 1257 & $5.2e-10^{***}$ & $2.6e-09^{***}$ & $1.9e-08^{***}$ & 0.5672 \\
382
+ LDLT-R & SLL & 121 & 82 & 39 & 0 & 0.6777 & 0.0152 & 1961 & $7.7e-06^{***}$ & $3.1e-05^{***}$ & $1.8e-04^{***}$ & 0.4066 \\
383
+ LDLT-R & Sandwich & 121 & 49 & 72 & 0 & 0.4050 & -0.0105 & 2635 & $6.4e-03^{**}$ & $1.9e-02^{*}$ & $8.3e-02$ & 0.2481 \\
384
+ LDLT-R & Orthogonal & 121 & 74 & 47 & 0 & 0.6116 & 0.0114 & 2675 & $8.7e-03^{**}$ & $1.9e-02^{*}$ & $1.0e-01$ & 0.2387 \\
385
+ Orthogonal & SLL & 121 & 62 & 59 & 0 & 0.5124 & 0.0025 & 2936 & $5.1e-02$ & $5.1e-02$ & $4.6e-01$ & 0.1774 \\
386
+ \bottomrule
387
+ \end{tabular}
388
+ \begin{tablenotes}
389
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
390
+ \end{tablenotes}
391
+ \endgroup
392
+ \end{threeparttable}
393
+ \end{table*}
394
+
395
+
396
+
397
+ \begin{table*}[t]
398
+ \centering
399
+ \begin{threeparttable}
400
+ \caption[Mean Certified Accuracy (108/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (108/255); $p$-values with Holm FWER corrections within-metric and global.}
401
+ \label{tab:wilcoxon:mean_cert_acc_108}
402
+ \begingroup
403
+ \setlength{\tabcolsep}{4pt}
404
+ \begin{tabular}{ll r r r r r r r r r r r}
405
+ \toprule
406
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
407
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
408
+ \midrule
409
+ AOL & SLL & 121 & 1 & 113 & 7 & 0.0372 & -0.1619 & 31 & $4.4e-20^{***}$ & $5.3e-19^{***}$ & $2.9e-18^{***}$ & 0.8596 \\
410
+ AOL & LDLT-R & 121 & 1 & 120 & 0 & 0.0083 & -0.2368 & 43 & $4.0e-21^{***}$ & $6.0e-20^{***}$ & $2.9e-19^{***}$ & 0.8576 \\
411
+ AOL & Orthogonal & 121 & 3 & 114 & 4 & 0.0413 & -0.1930 & 53 & $2.4e-20^{***}$ & $3.2e-19^{***}$ & $1.6e-18^{***}$ & 0.8544 \\
412
+ AOL & Sandwich & 121 & 4 & 115 & 2 & 0.0413 & -0.2776 & 82 & $2.3e-20^{***}$ & $3.2e-19^{***}$ & $1.6e-18^{***}$ & 0.8478 \\
413
+ AOL & LDLT-L & 121 & 5 & 91 & 25 & 0.1446 & -0.0716 & 108 & $5.0e-16^{***}$ & $5.5e-15^{***}$ & $2.9e-14^{***}$ & 0.8278 \\
414
+ LDLT-L & Sandwich & 121 & 16 & 103 & 2 & 0.1405 & -0.0699 & 532 & $8.0e-16^{***}$ & $8.0e-15^{***}$ & $4.5e-14^{***}$ & 0.7384 \\
415
+ LDLT-L & LDLT-R & 121 & 25 & 95 & 1 & 0.2107 & -0.0751 & 711 & $2.1e-14^{***}$ & $1.9e-13^{***}$ & $1.1e-12^{***}$ & 0.6977 \\
416
+ Orthogonal & Sandwich & 121 & 20 & 97 & 4 & 0.1818 & -0.0322 & 1002 & $2.7e-11^{***}$ & $1.9e-10^{***}$ & $1.1e-09^{***}$ & 0.6159 \\
417
+ Sandwich & SLL & 121 & 92 & 27 & 2 & 0.7686 & 0.0456 & 1046 & $2.2e-11^{***}$ & $1.8e-10^{***}$ & $9.5e-10^{***}$ & 0.6134 \\
418
+ LDLT-L & Orthogonal & 121 & 31 & 86 & 4 & 0.2727 & -0.0380 & 1169 & $5.4e-10^{***}$ & $3.2e-09^{***}$ & $1.9e-08^{***}$ & 0.5738 \\
419
+ LDLT-L & SLL & 121 & 31 & 83 & 7 & 0.2851 & -0.0308 & 1220 & $6.0e-09^{***}$ & $3.0e-08^{***}$ & $1.9e-07^{***}$ & 0.5447 \\
420
+ LDLT-R & SLL & 121 & 92 & 29 & 0 & 0.7603 & 0.0294 & 1470 & $9.3e-09^{***}$ & $3.7e-08^{***}$ & $2.9e-07^{***}$ & 0.5220 \\
421
+ LDLT-R & Orthogonal & 121 & 84 & 37 & 0 & 0.6942 & 0.0207 & 2239 & $1.7e-04^{***}$ & $5.2e-04^{***}$ & $3.1e-03^{**}$ & 0.3412 \\
422
+ Orthogonal & SLL & 121 & 69 & 50 & 2 & 0.5785 & 0.0077 & 2708 & $2.2e-02^{*}$ & $4.5e-02^{*}$ & $2.4e-01$ & 0.2095 \\
423
+ LDLT-R & Sandwich & 121 & 59 & 62 & 0 & 0.4876 & -0.0023 & 3035 & $9.0e-02$ & $9.0e-02$ & $7.2e-01$ & 0.1540 \\
424
+ \bottomrule
425
+ \end{tabular}
426
+ \begin{tablenotes}
427
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
428
+ \end{tablenotes}
429
+ \endgroup
430
+ \end{threeparttable}
431
+ \end{table*}
432
+
433
+
434
+
435
+ \begin{table*}[t]
436
+ \centering
437
+ \begin{threeparttable}
438
+ \caption[Mean Certified Accuracy (255/255)]{Wilcoxon signed-rank tests (two-sided) for Mean Certified Accuracy (255/255); $p$-values with Holm FWER corrections within-metric and global.}
439
+ \label{tab:wilcoxon:mean_cert_acc_255}
440
+ \begingroup
441
+ \setlength{\tabcolsep}{4pt}
442
+ \begin{tabular}{ll r r r r r r r r r r r}
443
+ \toprule
444
+ \multicolumn{2}{c}{Algorithms} & \multicolumn{6}{c}{Run Statistics} & \multicolumn{5}{c}{Wilcoxon pairwise Statistics} \\\cmidrule(lr){1-2} \cmidrule(lr){3-8} \cmidrule(lr){9-13}
445
+ Alg A & Alg B & $n$ & wins$_A$ & wins$_B$ & ties & WinRate A & \shortstack{Median \\ $\Delta$ (A--B)} & $W$ & $p$ & $p_{\text{Holm,within}}$ & $p_{\text{Holm,global}}$ & $r$ \\
446
+ \midrule
447
+ AOL & LDLT-R & 121 & 0 & 107 & 14 & 0.0579 & -0.0753 & 0 & $2.8e-19^{***}$ & $4.2e-18^{***}$ & $1.7e-17^{***}$ & 0.8679 \\
448
+ AOL & SLL & 121 & 1 & 99 & 21 & 0.0950 & -0.0435 & 4 & $4.5e-18^{***}$ & $5.8e-17^{***}$ & $2.7e-16^{***}$ & 0.8666 \\
449
+ AOL & LDLT-L & 121 & 3 & 78 & 40 & 0.1901 & -0.0180 & 36 & $2.1e-14^{***}$ & $1.9e-13^{***}$ & $1.1e-12^{***}$ & 0.8496 \\
450
+ AOL & Orthogonal & 121 & 2 & 97 & 22 & 0.1074 & -0.0518 & 61 & $3.6e-17^{***}$ & $4.4e-16^{***}$ & $2.2e-15^{***}$ & 0.8466 \\
451
+ AOL & Sandwich & 121 & 3 & 107 & 11 & 0.0702 & -0.0914 & 67 & $5.5e-19^{***}$ & $7.7e-18^{***}$ & $3.4e-17^{***}$ & 0.8488 \\
452
+ Orthogonal & Sandwich & 121 & 12 & 97 & 12 & 0.1488 & -0.0259 & 367 & $1.8e-15^{***}$ & $2.0e-14^{***}$ & $1.0e-13^{***}$ & 0.7616 \\
453
+ LDLT-L & Sandwich & 121 & 12 & 98 & 11 & 0.1446 & -0.0363 & 385 & $1.8e-15^{***}$ & $2.0e-14^{***}$ & $1.0e-13^{***}$ & 0.7584 \\
454
+ LDLT-L & LDLT-R & 121 & 22 & 86 & 13 & 0.2355 & -0.0305 & 669 & $3.2e-12^{***}$ & $2.6e-11^{***}$ & $1.5e-10^{***}$ & 0.6706 \\
455
+ Sandwich & SLL & 121 & 83 & 28 & 10 & 0.7273 & 0.0187 & 1014 & $7.3e-10^{***}$ & $5.1e-09^{***}$ & $2.4e-08^{***}$ & 0.5846 \\
456
+ LDLT-L & SLL & 121 & 24 & 77 & 20 & 0.2810 & -0.0083 & 1120 & $8.3e-07^{***}$ & $5.0e-06^{***}$ & $2.1e-05^{***}$ & 0.4905 \\
457
+ LDLT-L & Orthogonal & 121 & 30 & 70 & 21 & 0.3347 & -0.0077 & 1191 & $4.5e-06^{***}$ & $1.8e-05^{***}$ & $1.1e-04^{***}$ & 0.4585 \\
458
+ LDLT-R & SLL & 121 & 80 & 29 & 12 & 0.7107 & 0.0156 & 1368 & $8.5e-07^{***}$ & $5.0e-06^{***}$ & $2.1e-05^{***}$ & 0.4716 \\
459
+ LDLT-R & Orthogonal & 121 & 76 & 34 & 11 & 0.6736 & 0.0123 & 1722 & $7.3e-05^{***}$ & $2.2e-04^{***}$ & $1.5e-03^{**}$ & 0.3780 \\
460
+ LDLT-R & Sandwich & 121 & 44 & 68 & 9 & 0.4008 & -0.0070 & 2043 & $1.1e-03^{**}$ & $2.3e-03^{**}$ & $1.6e-02^{*}$ & 0.3074 \\
461
+ Orthogonal & SLL & 121 & 53 & 51 & 17 & 0.5083 & 0.0000 & 2606 & $6.9e-01$ & $6.9e-01$ & $1.0e+00$ & 0.0393 \\
462
+ \bottomrule
463
+ \end{tabular}
464
+ \begin{tablenotes}
465
+ \item Stars mark significance ($^*\,p\!\le\!0.05$, $^{**}\,p\!\le\!0.01$, $^{***}\,p\!\le\!0.001$).
466
+ \end{tablenotes}
467
+ \endgroup
468
+ \end{threeparttable}
469
+ \end{table*}
UCI_N6/wilcoxon_pairwise_all.csv ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ metric,alg_a,alg_b,n_common,n_nonzero,wins_a,wins_b,ties,win_rate_a_over_b,mean_diff_a_minus_b,median_diff_a_minus_b,W_stat,p_two_sided,z_equiv,effect_size_r,p_holm_global,p_holm_within_metric
2
+ mean_cert_acc_108,aol,ldlt-resnet,121,121,1,120,0,0.008264462809917356,-0.27756937579256197,-0.23680263569999999,43.0,3.971911186286591e-21,-9.433351346128775,0.857577395102616,2.899495165989211e-19,5.957866779429887e-20
3
+ mean_cert_acc_108,aol,sandwich,121,119,4,115,2,0.04132231404958678,-0.3003505936595042,-0.2775541879,82.0,2.2832440515482022e-20,-9.248190838712615,0.8477802642077927,1.5754383955682595e-18,3.196541672167483e-19
4
+ mean_cert_acc_108,aol,ortho,121,117,3,114,4,0.04132231404958678,-0.24928130693223144,-0.1929709499,53.0,2.4216488584946992e-20,-9.241897120975947,0.8544136910831229,1.6467212237763955e-18,3.196541672167483e-19
5
+ mean_cert_acc_108,aol,sdp,121,114,1,113,7,0.0371900826446281,-0.21922742412561985,-0.1618937068,31.0,4.402939864544531e-20,-9.17772518836056,0.859572719401443,2.949969709244836e-18,5.2835278374534375e-19
6
+ mean_cert_acc_108,aol,ldlt,121,96,5,91,25,0.1446280991735537,-0.14859004186611569,-0.0715934783,108.0,5.031122992210323e-16,-8.110742844187337,0.8277992251328726,2.918051335481987e-14,5.534235291431355e-15
7
+ mean_cert_acc_108,ldlt,sandwich,121,119,16,103,2,0.14049586776859505,-0.15176055179338843,-0.06991830010000001,532.0,7.955949293607779e-16,-8.054875891781956,0.7383892623745293,4.534891097356434e-14,7.955949293607778e-15
8
+ mean_cert_acc_108,ldlt,ldlt-resnet,121,120,25,95,1,0.21074380165289255,-0.12897933392644628,-0.0750768315,711.0,2.119279523234749e-14,-7.643176019800993,0.6977233195045927,1.0596397616173746e-12,1.9073515709112743e-13
9
+ mean_cert_acc_108,sandwich,sdp,121,119,92,27,2,0.768595041322314,0.08112316953388428,0.0456349217,1046.0,2.203741621261607e-11,6.691845041287824,0.6134404291694237,9.47608897142491e-10,1.7629932970092855e-10
10
+ mean_cert_acc_108,ortho,sandwich,121,117,20,97,4,0.18181818181818182,-0.05106928672727272,-0.0322356224,1001.5,2.6982241694705535e-11,-6.662165233713968,0.6159173937376728,1.1332541511776325e-09,1.8887569186293875e-10
11
+ mean_cert_acc_108,ldlt,ortho,121,117,31,86,4,0.2727272727272727,-0.10069126506611571,-0.037954930200000014,1169.0,5.414495427550374e-10,-6.20659482933111,0.5737998949534099,1.9492183539181346e-08,3.248697256530224e-09
12
+ mean_cert_acc_108,ldlt,sdp,121,114,31,83,7,0.28512396694214875,-0.07063738225950414,-0.0307513103,1220.0,6.028970842431367e-09,-5.815952160338162,0.5447138274210623,1.9292706695780375e-07,3.0144854212156835e-08
13
+ mean_cert_acc_108,ldlt-resnet,sdp,121,121,92,29,0,0.7603305785123967,0.05834195166694215,0.02943234149999996,1470.0,9.3419869330056e-09,5.742262470887794,0.5220238609897995,2.896015949231736e-07,3.73679477320224e-08
14
+ mean_cert_acc_108,ldlt-resnet,ortho,121,121,84,37,0,0.6942148760330579,0.028288068860330577,0.020693764000000003,2239.0,0.00017461692075476892,3.7531634438099943,0.3411966767099995,0.0031431045735858406,0.0005238507622643068
15
+ mean_cert_acc_108,ortho,sdp,121,119,69,50,2,0.5785123966942148,0.030053882806611577,0.007734805400000044,2707.5,0.022262328422160898,2.2858620807716203,0.20954463338571241,0.24488561264376987,0.044524656844321796
16
+ mean_cert_acc_108,ldlt-resnet,sandwich,121,121,59,62,0,0.48760330578512395,-0.022781217866942153,-0.00227646530000003,3035.0,0.09022246362523051,-1.6942253809302392,0.15402048917547628,0.7217797090018441,0.09022246362523051
17
+ mean_cert_acc_255,aol,ldlt-resnet,121,107,0,107,14,0.05785123966942149,-0.13012088649173556,-0.07534636179999998,0.0,2.76996750319979e-19,-8.977496787439458,0.8678873724707945,1.7450795270158677e-17,4.154951254799685e-18
18
+ mean_cert_acc_255,aol,sandwich,121,110,3,107,11,0.07024793388429752,-0.16391362448842975,-0.0914320648,67.0,5.47642526250318e-19,-8.902172131588635,0.8487888090494454,3.3953836627519717e-17,7.666995367504452e-18
19
+ mean_cert_acc_255,aol,sdp,121,100,1,99,21,0.09504132231404959,-0.10447574966033059,-0.043450783900000005,4.0,4.463734493179987e-18,-8.666304171669932,0.8666304171669932,2.722878040839792e-16,5.802854841133983e-17
20
+ mean_cert_acc_255,aol,ortho,121,99,2,97,22,0.10743801652892562,-0.11459076743471074,-0.05179674919999999,61.0,3.6442146275228883e-17,-8.423814379367323,0.846625199998847,2.1500866302385042e-15,4.373057553027466e-16
21
+ mean_cert_acc_255,ldlt,sandwich,121,110,12,98,11,0.1446280991735537,-0.09138781576115705,-0.03625880179999996,385.0,1.8087600254343317e-15,-7.953800025107839,0.7583650766280977,1.0129056142432257e-13,1.989636027977765e-14
22
+ mean_cert_acc_255,ortho,sandwich,121,109,12,97,12,0.1487603305785124,-0.04932285705371901,-0.0258620679,367.0,1.8479421669945226e-15,-7.951145858516235,0.7615816500914148,1.0163681918469874e-13,1.989636027977765e-14
23
+ mean_cert_acc_255,aol,ldlt,121,81,3,78,40,0.19008264462809918,-0.07252580872727273,-0.0180000011,36.0,2.0692760364951348e-14,-7.646248493300708,0.8495831659223009,1.0553307786125188e-12,1.8623484328456214e-13
24
+ mean_cert_acc_255,ldlt,ldlt-resnet,121,108,22,86,13,0.23553719008264462,-0.05759507776446282,-0.03051157290000006,669.0,3.2009930486043397e-12,-6.968604880955203,0.6705543173159377,1.4724568023579962e-10,2.5607944388834718e-11
25
+ mean_cert_acc_255,sandwich,sdp,121,111,83,28,10,0.7272727272727273,0.059437874828099174,0.01872655469999998,1014.0,7.290838840470702e-10,6.15964458474609,0.5846475908605333,2.4135012522529935e-08,5.103587188329491e-09
26
+ mean_cert_acc_255,ldlt,sdp,121,101,24,77,20,0.2809917355371901,-0.031949940933057856,-0.0083265586,1120.0,8.264525789853738e-07,-4.9290149335535665,0.4904553169986217,2.148776705361972e-05,4.958715473912243e-06
27
+ mean_cert_acc_255,ldlt-resnet,sdp,121,109,80,29,12,0.7107438016528925,0.025645136831404965,0.015625,1368.5,8.506882131315028e-07,4.923364421074805,0.47157278542280645,2.148776705361972e-05,4.958715473912243e-06
28
+ mean_cert_acc_255,ldlt,ortho,121,100,30,70,21,0.3347107438016529,-0.04206495870743802,-0.007675599399999997,1191.0,4.539730104155671e-06,-4.585006178949154,0.4585006178949154,0.0001089535224997361,1.8158920416622684e-05
29
+ mean_cert_acc_255,ldlt-resnet,ortho,121,110,76,34,11,0.6735537190082644,0.015530119057024795,0.0123031566,1722.5,7.340425290385093e-05,3.9649730077287084,0.37804534302378984,0.0014680850580770185,0.0002202127587115528
30
+ mean_cert_acc_255,ldlt-resnet,sandwich,121,112,44,68,9,0.40082644628099173,-0.033792737996694217,-0.006987711899999999,2043.0,0.001142117810154983,-3.2529545065204624,0.3073753089449993,0.015989649342169763,0.002284235620309966
31
+ mean_cert_acc_255,ortho,sdp,121,104,53,51,17,0.5082644628099173,0.010115017774380166,0.0,2606.0,0.6887980651072516,0.4004867168703731,0.03927095354339887,1.0,0.6887980651072516
32
+ mean_cert_acc_36,aol,ldlt-resnet,121,121,6,115,0,0.049586776859504134,-0.3195985256429752,-0.2928244397,93.0,1.3524220958164444e-20,-9.304013275123774,0.8458193886476159,9.46695467071511e-19,2.0286331437246665e-19
33
+ mean_cert_acc_36,aol,sdp,121,121,7,114,0,0.05785123966942149,-0.29487104347272725,-0.2867985517,156.0,6.184471896701117e-20,-9.141057246118269,0.8310052041925698,4.0817514518227375e-18,8.6582606553815635e-19
34
+ mean_cert_acc_36,aol,sandwich,121,121,9,112,0,0.0743801652892562,-0.3366267439752066,-0.3562658951,174.0,9.50240904957694e-20,-9.094498380688126,0.8267725800625569,6.176565882225011e-18,1.2353131764450022e-18
35
+ mean_cert_acc_36,aol,ortho,121,121,9,112,0,0.0743801652892562,-0.3153361513099173,-0.2984701917,183.5,1.1909411544163069e-19,-9.069929438814437,0.8245390398922215,7.622023388264364e-18,1.4291293852995683e-18
36
+ mean_cert_acc_36,ldlt,sandwich,121,121,31,90,0,0.256198347107438,-0.16186784709090912,-0.07720418269999996,975.0,2.177320182273665e-12,-7.022628869046719,0.6384208062769745,1.0233404856686225e-10,2.3950522005010313e-11
37
+ mean_cert_acc_36,aol,ldlt,121,114,21,93,7,0.2024793388429752,-0.17475889688429755,-0.1185294129,843.0,5.906625670244248e-12,-6.8818836320461765,0.6445474566730744,2.6579815516099117e-10,5.906625670244248e-11
38
+ mean_cert_acc_36,ldlt,ldlt-resnet,121,121,36,85,0,0.2975206611570248,-0.14483962875867767,-0.06054405490000003,1205.0,1.2954054230165275e-10,-6.427710032994878,0.5843372757268072,5.0520811497644576e-09,1.1658648807148747e-09
39
+ mean_cert_acc_36,ldlt,sdp,121,121,36,85,0,0.2975206611570248,-0.12011214658842975,-0.048914968999999975,1305.0,6.870164641102856e-10,-6.169049669494079,0.5608226972267345,2.4045576243859998e-08,5.496131712882285e-09
40
+ mean_cert_acc_36,ldlt,ortho,121,121,42,79,0,0.34710743801652894,-0.14057725442561983,-0.05313736200000008,1489.0,1.2474259752304599e-08,-5.693114600652607,0.5175558727866006,3.74227792569138e-07,8.731981826613219e-08
41
+ mean_cert_acc_36,sandwich,sdp,121,119,84,35,2,0.7024793388429752,0.04175570050247934,0.017416268600000007,1683.0,5.655006341785244e-07,5.002641438632645,0.45859138879655953,1.5834017756998682e-05,3.393003805071146e-06
42
+ mean_cert_acc_36,ortho,sandwich,121,120,38,82,1,0.3181818181818182,-0.02129059266528926,-0.013042002900000016,2067.0,4.277000715808299e-05,-4.091982968151117,0.3735452294305518,0.0008981701503197428,0.00021385003579041495
43
+ mean_cert_acc_36,ldlt-resnet,sdp,121,120,71,49,1,0.5909090909090909,0.024727482170247932,0.008074492300000014,2331.0,0.0006723776229561895,3.4006015258523057,0.31043102746596585,0.010758041967299032,0.002689510491824758
44
+ mean_cert_acc_36,ldlt-resnet,sandwich,121,120,52,68,1,0.43388429752066116,-0.017028218332231407,-0.008829414899999999,2802.0,0.030226148960912597,-2.167114179932833,0.1978295535064203,0.30226148960912597,0.0906784468827378
45
+ mean_cert_acc_36,ortho,sdp,121,121,58,63,0,0.4793388429752066,0.020465107837190088,-0.0016042887999999644,3123.0,0.1424837402278625,1.466604261049536,0.13332766009541236,0.9973861815950376,0.284967480455725
46
+ mean_cert_acc_36,ldlt-resnet,ortho,121,121,76,45,0,0.628099173553719,0.004262374333057851,0.005987092899999991,3225.0,0.2290650698616885,1.2027706902787196,0.10934279002533814,1.0,0.284967480455725
47
+ mean_cert_acc_72,aol,ldlt-resnet,121,121,1,120,0,0.008264462809917356,-0.3092410627958678,-0.2919858993,21.0,2.3047485551154483e-21,-9.490252705264558,0.8627502459331416,1.7285614163365862e-19,3.4571228326731724e-20
48
+ mean_cert_acc_72,aol,sdp,121,119,1,118,2,0.01652892561983471,-0.2649477861495868,-0.23431782420000002,2.0,3.06956082705418e-21,-9.460335718166954,0.8672275534225952,2.2714750120200932e-19,4.297385157875852e-20
49
+ mean_cert_acc_72,aol,ortho,121,121,6,115,0,0.049586776859504134,-0.29073976685619835,-0.2589285746,86.5,1.15433610944114e-20,-9.320830096326201,0.8473481905751092,8.3112199879762075e-19,1.500636942273482e-19
50
+ mean_cert_acc_72,aol,sandwich,121,121,7,114,0,0.05785123966942149,-0.33645687826198345,-0.32054936889999996,90.0,1.2571587049174732e-20,-9.311773086028797,0.8465248260026179,8.92582680491406e-19,1.5085904459009678e-19
51
+ mean_cert_acc_72,ldlt,sandwich,121,120,21,99,1,0.17768595041322313,-0.1661887828859504,-0.09155106540000002,608.0,2.5143510494245837e-15,-7.9129129844919035,0.7223468228636237,1.3577495666892752e-13,2.765786154367042e-14
52
+ mean_cert_acc_72,aol,ldlt,121,103,10,93,18,0.15702479338842976,-0.1702680953760331,-0.1040100288,284.0,3.4232603031044563e-15,-7.874420413270477,0.7758896981769975,1.8143279606453618e-13,3.423260303104456e-14
53
+ mean_cert_acc_72,ldlt,ldlt-resnet,121,121,30,91,0,0.24793388429752067,-0.13897296741983473,-0.0703703724,922.0,8.084268131100275e-13,-7.159718861702142,0.650883532882013,3.8804487029281324e-11,7.2758413179902475e-12
54
+ mean_cert_acc_72,sandwich,sdp,121,121,93,28,0,0.768595041322314,0.07150909211239669,0.03682704640000001,1188.0,9.69177377400736e-11,6.471682294790014,0.5883347540718195,3.973627247343017e-09,7.753419019205888e-10
55
+ mean_cert_acc_72,ldlt,sdp,121,120,34,86,1,0.28512396694214875,-0.09467969077355372,-0.04857719500000002,1161.0,1.0151448930030595e-10,-6.464678372403863,0.5901416952635631,4.060579572012238e-09,7.753419019205888e-10
56
+ mean_cert_acc_72,ortho,sandwich,121,118,19,99,3,0.16942148760330578,-0.04571711140578512,-0.030128806799999963,1121.5,1.4156553253762546e-10,-6.414198632497565,0.5904748455235395,5.3794902364297675e-09,8.493931952257528e-10
57
+ mean_cert_acc_72,ldlt,ortho,121,120,35,85,1,0.29338842975206614,-0.12047167148016531,-0.04772219800000005,1257.0,5.189417983892635e-10,-6.213266938840658,0.5671910763673499,1.920084654040275e-08,2.5947089919463174e-09
58
+ mean_cert_acc_72,ldlt-resnet,sdp,121,121,82,39,0,0.6776859504132231,0.044293276646280993,0.01521807910000006,1961.0,7.7404645028487e-06,4.472239555029277,0.4065672322753888,0.0001780306835655201,3.09618580113948e-05
59
+ mean_cert_acc_72,ldlt-resnet,sandwich,121,121,49,72,0,0.4049586776859504,-0.0272158154661157,-0.010539218799999972,2635.0,0.006355236164498874,-2.728866834933439,0.24807880317576717,0.08261807013848536,0.019065708493496623
60
+ mean_cert_acc_72,ldlt-resnet,ortho,121,121,74,47,0,0.6115702479338843,0.018501295939669423,0.011391893000000097,2675.0,0.008654654351165116,2.6254026895331193,0.23867297177573812,0.10385585221398139,0.019065708493496623
61
+ mean_cert_acc_72,ortho,sdp,121,121,62,59,0,0.512396694214876,0.02579198070661157,0.0024819821999999547,2935.5,0.05098651424705218,1.9515932586868652,0.17741756897153318,0.45887862822346964,0.05098651424705218
62
+ mean_test_acc,aol,ldlt,121,121,16,105,0,0.1322314049586777,-0.11958352569586778,-0.06315010610000005,409.0,2.1268544183487774e-17,-8.486646526461245,0.7715133205873859,1.2761126510092665e-15,3.1902816275231663e-16
63
+ mean_test_acc,aol,sandwich,121,121,23,98,0,0.19008264462809918,-0.11132838667768594,-0.06561486950000006,698.0,1.0010877948097709e-14,-7.739118075943935,0.703556188722176,5.205656533010808e-13,1.4015229127336793e-13
64
+ mean_test_acc,aol,ortho,121,121,25,96,0,0.2066115702479339,-0.09866207272396695,-0.05250947429999997,908.0,6.203585473534351e-13,-7.195931312592255,0.6541755738720232,3.039756882031832e-11,8.064661115594657e-12
65
+ mean_test_acc,aol,sdp,121,121,24,97,0,0.19834710743801653,-0.09612382466942149,-0.044510062900000036,1047.0,8.121173320702691e-12,-6.836393407326143,0.6214903097569221,3.573316261109184e-10,9.74540798484323e-11
66
+ mean_test_acc,aol,ldlt-resnet,121,121,27,94,0,0.2231404958677686,-0.09206069528677686,-0.03569083780000004,1307.0,7.098533094861746e-10,-6.163876462224062,0.5603524056567329,2.4135012522529935e-08,7.80838640434792e-09
67
+ mean_test_acc,ldlt,sdp,121,121,86,35,0,0.7107438016528925,0.023459701026446286,0.010278406500000004,1511.0,1.7383406684454798e-08,5.636209320682431,0.5123826655165846,5.041187938491891e-07,1.7383406684454799e-07
68
+ mean_test_acc,ldlt,ldlt-resnet,121,121,87,34,0,0.71900826446281,0.02752283040909091,0.01248115980000003,1779.0,7.69296628945801e-07,4.942999546500287,0.44936359513638974,2.077100898153663e-05,6.923669660512209e-06
69
+ mean_test_acc,ldlt,ortho,121,121,78,43,0,0.6446280991735537,0.020921452971900834,0.010356299000000013,2002.0,1.264342847332638e-05,4.366186935893503,0.39692608508122756,0.00027815542641318036,0.00010114742778661104
70
+ mean_test_acc,ortho,sandwich,121,120,39,81,1,0.32644628099173556,-0.01266631395371901,-0.007894689300000035,2171.0,0.00013365710865816523,-3.8196205817909794,0.3486820589596543,0.0025394850645051393,0.0009355997606071565
71
+ mean_test_acc,sandwich,sdp,121,121,80,41,0,0.6611570247933884,0.015204562008264456,0.006305895000000006,2279.0,0.00026254907665535047,3.6496977289962866,0.33179070263602606,0.004463334303140958,0.001575294459932103
72
+ mean_test_acc,ldlt-resnet,sandwich,121,121,47,74,0,0.3884297520661157,-0.019267691390909086,-0.01009704999999994,2411.0,0.0009387558222226796,-3.308266049175231,0.3007514590159301,0.014081337333340193,0.004693779111113398
73
+ mean_test_acc,ldlt,sandwich,121,120,64,56,1,0.5330578512396694,0.008255139018181824,0.0008221223000000055,3145.0,0.2044973939148288,1.2688420787642989,0.11582890474182553,1.0,0.8179895756593152
74
+ mean_test_acc,ldlt-resnet,ortho,121,121,54,67,0,0.4462809917355372,-0.006601377437190076,-0.0023532391000000152,3206.0,0.2106004158723539,-1.2519161593438723,0.11381055994035204,1.0,0.8179895756593152
75
+ mean_test_acc,ortho,sdp,121,121,60,61,0,0.49586776859504134,0.002538248054545448,-6.572600000032125e-06,3382.0,0.42564043452591804,0.7966739195824637,0.07242490178022397,1.0,0.8512808690518361
76
+ mean_test_acc,ldlt-resnet,sdp,121,121,58,63,0,0.4793388429752066,-0.0040631293826446264,-0.000977559300000097,3627.0,0.8705530555843003,-0.16295602900550393,0.014814184455045813,1.0,0.8705530555843003
UCI_N6/wilcoxon_pairwise_all.json ADDED
@@ -0,0 +1,1427 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metric":"mean_cert_acc_108",
4
+ "alg_a":"aol",
5
+ "alg_b":"ldlt-resnet",
6
+ "n_common":121,
7
+ "n_nonzero":121,
8
+ "wins_a":1,
9
+ "wins_b":120,
10
+ "ties":0,
11
+ "win_rate_a_over_b":0.0082644628,
12
+ "mean_diff_a_minus_b":-0.2775693758,
13
+ "median_diff_a_minus_b":-0.2368026357,
14
+ "W_stat":43.0,
15
+ "p_two_sided":3.971911186e-21,
16
+ "z_equiv":-9.4333513461,
17
+ "effect_size_r":0.8575773951,
18
+ "p_holm_global":2.899495166e-19,
19
+ "p_holm_within_metric":5.957866779e-20
20
+ },
21
+ {
22
+ "metric":"mean_cert_acc_108",
23
+ "alg_a":"aol",
24
+ "alg_b":"sandwich",
25
+ "n_common":121,
26
+ "n_nonzero":119,
27
+ "wins_a":4,
28
+ "wins_b":115,
29
+ "ties":2,
30
+ "win_rate_a_over_b":0.041322314,
31
+ "mean_diff_a_minus_b":-0.3003505937,
32
+ "median_diff_a_minus_b":-0.2775541879,
33
+ "W_stat":82.0,
34
+ "p_two_sided":2.283244052e-20,
35
+ "z_equiv":-9.2481908387,
36
+ "effect_size_r":0.8477802642,
37
+ "p_holm_global":1.575438396e-18,
38
+ "p_holm_within_metric":3.196541672e-19
39
+ },
40
+ {
41
+ "metric":"mean_cert_acc_108",
42
+ "alg_a":"aol",
43
+ "alg_b":"ortho",
44
+ "n_common":121,
45
+ "n_nonzero":117,
46
+ "wins_a":3,
47
+ "wins_b":114,
48
+ "ties":4,
49
+ "win_rate_a_over_b":0.041322314,
50
+ "mean_diff_a_minus_b":-0.2492813069,
51
+ "median_diff_a_minus_b":-0.1929709499,
52
+ "W_stat":53.0,
53
+ "p_two_sided":2.421648858e-20,
54
+ "z_equiv":-9.241897121,
55
+ "effect_size_r":0.8544136911,
56
+ "p_holm_global":1.646721224e-18,
57
+ "p_holm_within_metric":3.196541672e-19
58
+ },
59
+ {
60
+ "metric":"mean_cert_acc_108",
61
+ "alg_a":"aol",
62
+ "alg_b":"sdp",
63
+ "n_common":121,
64
+ "n_nonzero":114,
65
+ "wins_a":1,
66
+ "wins_b":113,
67
+ "ties":7,
68
+ "win_rate_a_over_b":0.0371900826,
69
+ "mean_diff_a_minus_b":-0.2192274241,
70
+ "median_diff_a_minus_b":-0.1618937068,
71
+ "W_stat":31.0,
72
+ "p_two_sided":4.402939865e-20,
73
+ "z_equiv":-9.1777251884,
74
+ "effect_size_r":0.8595727194,
75
+ "p_holm_global":2.949969709e-18,
76
+ "p_holm_within_metric":5.283527837e-19
77
+ },
78
+ {
79
+ "metric":"mean_cert_acc_108",
80
+ "alg_a":"aol",
81
+ "alg_b":"ldlt",
82
+ "n_common":121,
83
+ "n_nonzero":96,
84
+ "wins_a":5,
85
+ "wins_b":91,
86
+ "ties":25,
87
+ "win_rate_a_over_b":0.1446280992,
88
+ "mean_diff_a_minus_b":-0.1485900419,
89
+ "median_diff_a_minus_b":-0.0715934783,
90
+ "W_stat":108.0,
91
+ "p_two_sided":5.031122992e-16,
92
+ "z_equiv":-8.1107428442,
93
+ "effect_size_r":0.8277992251,
94
+ "p_holm_global":0.0,
95
+ "p_holm_within_metric":0.0
96
+ },
97
+ {
98
+ "metric":"mean_cert_acc_108",
99
+ "alg_a":"ldlt",
100
+ "alg_b":"sandwich",
101
+ "n_common":121,
102
+ "n_nonzero":119,
103
+ "wins_a":16,
104
+ "wins_b":103,
105
+ "ties":2,
106
+ "win_rate_a_over_b":0.1404958678,
107
+ "mean_diff_a_minus_b":-0.1517605518,
108
+ "median_diff_a_minus_b":-0.0699183001,
109
+ "W_stat":532.0,
110
+ "p_two_sided":7.955949294e-16,
111
+ "z_equiv":-8.0548758918,
112
+ "effect_size_r":0.7383892624,
113
+ "p_holm_global":0.0,
114
+ "p_holm_within_metric":0.0
115
+ },
116
+ {
117
+ "metric":"mean_cert_acc_108",
118
+ "alg_a":"ldlt",
119
+ "alg_b":"ldlt-resnet",
120
+ "n_common":121,
121
+ "n_nonzero":120,
122
+ "wins_a":25,
123
+ "wins_b":95,
124
+ "ties":1,
125
+ "win_rate_a_over_b":0.2107438017,
126
+ "mean_diff_a_minus_b":-0.1289793339,
127
+ "median_diff_a_minus_b":-0.0750768315,
128
+ "W_stat":711.0,
129
+ "p_two_sided":0.0,
130
+ "z_equiv":-7.6431760198,
131
+ "effect_size_r":0.6977233195,
132
+ "p_holm_global":0.0,
133
+ "p_holm_within_metric":0.0
134
+ },
135
+ {
136
+ "metric":"mean_cert_acc_108",
137
+ "alg_a":"sandwich",
138
+ "alg_b":"sdp",
139
+ "n_common":121,
140
+ "n_nonzero":119,
141
+ "wins_a":92,
142
+ "wins_b":27,
143
+ "ties":2,
144
+ "win_rate_a_over_b":0.7685950413,
145
+ "mean_diff_a_minus_b":0.0811231695,
146
+ "median_diff_a_minus_b":0.0456349217,
147
+ "W_stat":1046.0,
148
+ "p_two_sided":0.0,
149
+ "z_equiv":6.6918450413,
150
+ "effect_size_r":0.6134404292,
151
+ "p_holm_global":0.0000000009,
152
+ "p_holm_within_metric":0.0000000002
153
+ },
154
+ {
155
+ "metric":"mean_cert_acc_108",
156
+ "alg_a":"ortho",
157
+ "alg_b":"sandwich",
158
+ "n_common":121,
159
+ "n_nonzero":117,
160
+ "wins_a":20,
161
+ "wins_b":97,
162
+ "ties":4,
163
+ "win_rate_a_over_b":0.1818181818,
164
+ "mean_diff_a_minus_b":-0.0510692867,
165
+ "median_diff_a_minus_b":-0.0322356224,
166
+ "W_stat":1001.5,
167
+ "p_two_sided":0.0,
168
+ "z_equiv":-6.6621652337,
169
+ "effect_size_r":0.6159173937,
170
+ "p_holm_global":0.0000000011,
171
+ "p_holm_within_metric":0.0000000002
172
+ },
173
+ {
174
+ "metric":"mean_cert_acc_108",
175
+ "alg_a":"ldlt",
176
+ "alg_b":"ortho",
177
+ "n_common":121,
178
+ "n_nonzero":117,
179
+ "wins_a":31,
180
+ "wins_b":86,
181
+ "ties":4,
182
+ "win_rate_a_over_b":0.2727272727,
183
+ "mean_diff_a_minus_b":-0.1006912651,
184
+ "median_diff_a_minus_b":-0.0379549302,
185
+ "W_stat":1169.0,
186
+ "p_two_sided":0.0000000005,
187
+ "z_equiv":-6.2065948293,
188
+ "effect_size_r":0.573799895,
189
+ "p_holm_global":0.0000000195,
190
+ "p_holm_within_metric":0.0000000032
191
+ },
192
+ {
193
+ "metric":"mean_cert_acc_108",
194
+ "alg_a":"ldlt",
195
+ "alg_b":"sdp",
196
+ "n_common":121,
197
+ "n_nonzero":114,
198
+ "wins_a":31,
199
+ "wins_b":83,
200
+ "ties":7,
201
+ "win_rate_a_over_b":0.2851239669,
202
+ "mean_diff_a_minus_b":-0.0706373823,
203
+ "median_diff_a_minus_b":-0.0307513103,
204
+ "W_stat":1220.0,
205
+ "p_two_sided":0.000000006,
206
+ "z_equiv":-5.8159521603,
207
+ "effect_size_r":0.5447138274,
208
+ "p_holm_global":0.0000001929,
209
+ "p_holm_within_metric":0.0000000301
210
+ },
211
+ {
212
+ "metric":"mean_cert_acc_108",
213
+ "alg_a":"ldlt-resnet",
214
+ "alg_b":"sdp",
215
+ "n_common":121,
216
+ "n_nonzero":121,
217
+ "wins_a":92,
218
+ "wins_b":29,
219
+ "ties":0,
220
+ "win_rate_a_over_b":0.7603305785,
221
+ "mean_diff_a_minus_b":0.0583419517,
222
+ "median_diff_a_minus_b":0.0294323415,
223
+ "W_stat":1470.0,
224
+ "p_two_sided":0.0000000093,
225
+ "z_equiv":5.7422624709,
226
+ "effect_size_r":0.522023861,
227
+ "p_holm_global":0.0000002896,
228
+ "p_holm_within_metric":0.0000000374
229
+ },
230
+ {
231
+ "metric":"mean_cert_acc_108",
232
+ "alg_a":"ldlt-resnet",
233
+ "alg_b":"ortho",
234
+ "n_common":121,
235
+ "n_nonzero":121,
236
+ "wins_a":84,
237
+ "wins_b":37,
238
+ "ties":0,
239
+ "win_rate_a_over_b":0.694214876,
240
+ "mean_diff_a_minus_b":0.0282880689,
241
+ "median_diff_a_minus_b":0.020693764,
242
+ "W_stat":2239.0,
243
+ "p_two_sided":0.0001746169,
244
+ "z_equiv":3.7531634438,
245
+ "effect_size_r":0.3411966767,
246
+ "p_holm_global":0.0031431046,
247
+ "p_holm_within_metric":0.0005238508
248
+ },
249
+ {
250
+ "metric":"mean_cert_acc_108",
251
+ "alg_a":"ortho",
252
+ "alg_b":"sdp",
253
+ "n_common":121,
254
+ "n_nonzero":119,
255
+ "wins_a":69,
256
+ "wins_b":50,
257
+ "ties":2,
258
+ "win_rate_a_over_b":0.5785123967,
259
+ "mean_diff_a_minus_b":0.0300538828,
260
+ "median_diff_a_minus_b":0.0077348054,
261
+ "W_stat":2707.5,
262
+ "p_two_sided":0.0222623284,
263
+ "z_equiv":2.2858620808,
264
+ "effect_size_r":0.2095446334,
265
+ "p_holm_global":0.2448856126,
266
+ "p_holm_within_metric":0.0445246568
267
+ },
268
+ {
269
+ "metric":"mean_cert_acc_108",
270
+ "alg_a":"ldlt-resnet",
271
+ "alg_b":"sandwich",
272
+ "n_common":121,
273
+ "n_nonzero":121,
274
+ "wins_a":59,
275
+ "wins_b":62,
276
+ "ties":0,
277
+ "win_rate_a_over_b":0.4876033058,
278
+ "mean_diff_a_minus_b":-0.0227812179,
279
+ "median_diff_a_minus_b":-0.0022764653,
280
+ "W_stat":3035.0,
281
+ "p_two_sided":0.0902224636,
282
+ "z_equiv":-1.6942253809,
283
+ "effect_size_r":0.1540204892,
284
+ "p_holm_global":0.721779709,
285
+ "p_holm_within_metric":0.0902224636
286
+ },
287
+ {
288
+ "metric":"mean_cert_acc_255",
289
+ "alg_a":"aol",
290
+ "alg_b":"ldlt-resnet",
291
+ "n_common":121,
292
+ "n_nonzero":107,
293
+ "wins_a":0,
294
+ "wins_b":107,
295
+ "ties":14,
296
+ "win_rate_a_over_b":0.0578512397,
297
+ "mean_diff_a_minus_b":-0.1301208865,
298
+ "median_diff_a_minus_b":-0.0753463618,
299
+ "W_stat":0.0,
300
+ "p_two_sided":2.769967503e-19,
301
+ "z_equiv":-8.9774967874,
302
+ "effect_size_r":0.8678873725,
303
+ "p_holm_global":1.745079527e-17,
304
+ "p_holm_within_metric":4.154951255e-18
305
+ },
306
+ {
307
+ "metric":"mean_cert_acc_255",
308
+ "alg_a":"aol",
309
+ "alg_b":"sandwich",
310
+ "n_common":121,
311
+ "n_nonzero":110,
312
+ "wins_a":3,
313
+ "wins_b":107,
314
+ "ties":11,
315
+ "win_rate_a_over_b":0.0702479339,
316
+ "mean_diff_a_minus_b":-0.1639136245,
317
+ "median_diff_a_minus_b":-0.0914320648,
318
+ "W_stat":67.0,
319
+ "p_two_sided":5.476425263e-19,
320
+ "z_equiv":-8.9021721316,
321
+ "effect_size_r":0.848788809,
322
+ "p_holm_global":3.395383663e-17,
323
+ "p_holm_within_metric":7.666995368e-18
324
+ },
325
+ {
326
+ "metric":"mean_cert_acc_255",
327
+ "alg_a":"aol",
328
+ "alg_b":"sdp",
329
+ "n_common":121,
330
+ "n_nonzero":100,
331
+ "wins_a":1,
332
+ "wins_b":99,
333
+ "ties":21,
334
+ "win_rate_a_over_b":0.0950413223,
335
+ "mean_diff_a_minus_b":-0.1044757497,
336
+ "median_diff_a_minus_b":-0.0434507839,
337
+ "W_stat":4.0,
338
+ "p_two_sided":4.463734493e-18,
339
+ "z_equiv":-8.6663041717,
340
+ "effect_size_r":0.8666304172,
341
+ "p_holm_global":2.722878041e-16,
342
+ "p_holm_within_metric":5.802854841e-17
343
+ },
344
+ {
345
+ "metric":"mean_cert_acc_255",
346
+ "alg_a":"aol",
347
+ "alg_b":"ortho",
348
+ "n_common":121,
349
+ "n_nonzero":99,
350
+ "wins_a":2,
351
+ "wins_b":97,
352
+ "ties":22,
353
+ "win_rate_a_over_b":0.1074380165,
354
+ "mean_diff_a_minus_b":-0.1145907674,
355
+ "median_diff_a_minus_b":-0.0517967492,
356
+ "W_stat":61.0,
357
+ "p_two_sided":3.644214628e-17,
358
+ "z_equiv":-8.4238143794,
359
+ "effect_size_r":0.8466252,
360
+ "p_holm_global":0.0,
361
+ "p_holm_within_metric":4.373057553e-16
362
+ },
363
+ {
364
+ "metric":"mean_cert_acc_255",
365
+ "alg_a":"ldlt",
366
+ "alg_b":"sandwich",
367
+ "n_common":121,
368
+ "n_nonzero":110,
369
+ "wins_a":12,
370
+ "wins_b":98,
371
+ "ties":11,
372
+ "win_rate_a_over_b":0.1446280992,
373
+ "mean_diff_a_minus_b":-0.0913878158,
374
+ "median_diff_a_minus_b":-0.0362588018,
375
+ "W_stat":385.0,
376
+ "p_two_sided":0.0,
377
+ "z_equiv":-7.9538000251,
378
+ "effect_size_r":0.7583650766,
379
+ "p_holm_global":0.0,
380
+ "p_holm_within_metric":0.0
381
+ },
382
+ {
383
+ "metric":"mean_cert_acc_255",
384
+ "alg_a":"ortho",
385
+ "alg_b":"sandwich",
386
+ "n_common":121,
387
+ "n_nonzero":109,
388
+ "wins_a":12,
389
+ "wins_b":97,
390
+ "ties":12,
391
+ "win_rate_a_over_b":0.1487603306,
392
+ "mean_diff_a_minus_b":-0.0493228571,
393
+ "median_diff_a_minus_b":-0.0258620679,
394
+ "W_stat":367.0,
395
+ "p_two_sided":0.0,
396
+ "z_equiv":-7.9511458585,
397
+ "effect_size_r":0.7615816501,
398
+ "p_holm_global":0.0,
399
+ "p_holm_within_metric":0.0
400
+ },
401
+ {
402
+ "metric":"mean_cert_acc_255",
403
+ "alg_a":"aol",
404
+ "alg_b":"ldlt",
405
+ "n_common":121,
406
+ "n_nonzero":81,
407
+ "wins_a":3,
408
+ "wins_b":78,
409
+ "ties":40,
410
+ "win_rate_a_over_b":0.1900826446,
411
+ "mean_diff_a_minus_b":-0.0725258087,
412
+ "median_diff_a_minus_b":-0.0180000011,
413
+ "W_stat":36.0,
414
+ "p_two_sided":0.0,
415
+ "z_equiv":-7.6462484933,
416
+ "effect_size_r":0.8495831659,
417
+ "p_holm_global":0.0,
418
+ "p_holm_within_metric":0.0
419
+ },
420
+ {
421
+ "metric":"mean_cert_acc_255",
422
+ "alg_a":"ldlt",
423
+ "alg_b":"ldlt-resnet",
424
+ "n_common":121,
425
+ "n_nonzero":108,
426
+ "wins_a":22,
427
+ "wins_b":86,
428
+ "ties":13,
429
+ "win_rate_a_over_b":0.2355371901,
430
+ "mean_diff_a_minus_b":-0.0575950778,
431
+ "median_diff_a_minus_b":-0.0305115729,
432
+ "W_stat":669.0,
433
+ "p_two_sided":0.0,
434
+ "z_equiv":-6.968604881,
435
+ "effect_size_r":0.6705543173,
436
+ "p_holm_global":0.0000000001,
437
+ "p_holm_within_metric":0.0
438
+ },
439
+ {
440
+ "metric":"mean_cert_acc_255",
441
+ "alg_a":"sandwich",
442
+ "alg_b":"sdp",
443
+ "n_common":121,
444
+ "n_nonzero":111,
445
+ "wins_a":83,
446
+ "wins_b":28,
447
+ "ties":10,
448
+ "win_rate_a_over_b":0.7272727273,
449
+ "mean_diff_a_minus_b":0.0594378748,
450
+ "median_diff_a_minus_b":0.0187265547,
451
+ "W_stat":1014.0,
452
+ "p_two_sided":0.0000000007,
453
+ "z_equiv":6.1596445847,
454
+ "effect_size_r":0.5846475909,
455
+ "p_holm_global":0.0000000241,
456
+ "p_holm_within_metric":0.0000000051
457
+ },
458
+ {
459
+ "metric":"mean_cert_acc_255",
460
+ "alg_a":"ldlt",
461
+ "alg_b":"sdp",
462
+ "n_common":121,
463
+ "n_nonzero":101,
464
+ "wins_a":24,
465
+ "wins_b":77,
466
+ "ties":20,
467
+ "win_rate_a_over_b":0.2809917355,
468
+ "mean_diff_a_minus_b":-0.0319499409,
469
+ "median_diff_a_minus_b":-0.0083265586,
470
+ "W_stat":1120.0,
471
+ "p_two_sided":0.0000008265,
472
+ "z_equiv":-4.9290149336,
473
+ "effect_size_r":0.490455317,
474
+ "p_holm_global":0.0000214878,
475
+ "p_holm_within_metric":0.0000049587
476
+ },
477
+ {
478
+ "metric":"mean_cert_acc_255",
479
+ "alg_a":"ldlt-resnet",
480
+ "alg_b":"sdp",
481
+ "n_common":121,
482
+ "n_nonzero":109,
483
+ "wins_a":80,
484
+ "wins_b":29,
485
+ "ties":12,
486
+ "win_rate_a_over_b":0.7107438017,
487
+ "mean_diff_a_minus_b":0.0256451368,
488
+ "median_diff_a_minus_b":0.015625,
489
+ "W_stat":1368.5,
490
+ "p_two_sided":0.0000008507,
491
+ "z_equiv":4.9233644211,
492
+ "effect_size_r":0.4715727854,
493
+ "p_holm_global":0.0000214878,
494
+ "p_holm_within_metric":0.0000049587
495
+ },
496
+ {
497
+ "metric":"mean_cert_acc_255",
498
+ "alg_a":"ldlt",
499
+ "alg_b":"ortho",
500
+ "n_common":121,
501
+ "n_nonzero":100,
502
+ "wins_a":30,
503
+ "wins_b":70,
504
+ "ties":21,
505
+ "win_rate_a_over_b":0.3347107438,
506
+ "mean_diff_a_minus_b":-0.0420649587,
507
+ "median_diff_a_minus_b":-0.0076755994,
508
+ "W_stat":1191.0,
509
+ "p_two_sided":0.0000045397,
510
+ "z_equiv":-4.5850061789,
511
+ "effect_size_r":0.4585006179,
512
+ "p_holm_global":0.0001089535,
513
+ "p_holm_within_metric":0.0000181589
514
+ },
515
+ {
516
+ "metric":"mean_cert_acc_255",
517
+ "alg_a":"ldlt-resnet",
518
+ "alg_b":"ortho",
519
+ "n_common":121,
520
+ "n_nonzero":110,
521
+ "wins_a":76,
522
+ "wins_b":34,
523
+ "ties":11,
524
+ "win_rate_a_over_b":0.673553719,
525
+ "mean_diff_a_minus_b":0.0155301191,
526
+ "median_diff_a_minus_b":0.0123031566,
527
+ "W_stat":1722.5,
528
+ "p_two_sided":0.0000734043,
529
+ "z_equiv":3.9649730077,
530
+ "effect_size_r":0.378045343,
531
+ "p_holm_global":0.0014680851,
532
+ "p_holm_within_metric":0.0002202128
533
+ },
534
+ {
535
+ "metric":"mean_cert_acc_255",
536
+ "alg_a":"ldlt-resnet",
537
+ "alg_b":"sandwich",
538
+ "n_common":121,
539
+ "n_nonzero":112,
540
+ "wins_a":44,
541
+ "wins_b":68,
542
+ "ties":9,
543
+ "win_rate_a_over_b":0.4008264463,
544
+ "mean_diff_a_minus_b":-0.033792738,
545
+ "median_diff_a_minus_b":-0.0069877119,
546
+ "W_stat":2043.0,
547
+ "p_two_sided":0.0011421178,
548
+ "z_equiv":-3.2529545065,
549
+ "effect_size_r":0.3073753089,
550
+ "p_holm_global":0.0159896493,
551
+ "p_holm_within_metric":0.0022842356
552
+ },
553
+ {
554
+ "metric":"mean_cert_acc_255",
555
+ "alg_a":"ortho",
556
+ "alg_b":"sdp",
557
+ "n_common":121,
558
+ "n_nonzero":104,
559
+ "wins_a":53,
560
+ "wins_b":51,
561
+ "ties":17,
562
+ "win_rate_a_over_b":0.5082644628,
563
+ "mean_diff_a_minus_b":0.0101150178,
564
+ "median_diff_a_minus_b":0.0,
565
+ "W_stat":2606.0,
566
+ "p_two_sided":0.6887980651,
567
+ "z_equiv":0.4004867169,
568
+ "effect_size_r":0.0392709535,
569
+ "p_holm_global":1.0,
570
+ "p_holm_within_metric":0.6887980651
571
+ },
572
+ {
573
+ "metric":"mean_cert_acc_36",
574
+ "alg_a":"aol",
575
+ "alg_b":"ldlt-resnet",
576
+ "n_common":121,
577
+ "n_nonzero":121,
578
+ "wins_a":6,
579
+ "wins_b":115,
580
+ "ties":0,
581
+ "win_rate_a_over_b":0.0495867769,
582
+ "mean_diff_a_minus_b":-0.3195985256,
583
+ "median_diff_a_minus_b":-0.2928244397,
584
+ "W_stat":93.0,
585
+ "p_two_sided":1.352422096e-20,
586
+ "z_equiv":-9.3040132751,
587
+ "effect_size_r":0.8458193886,
588
+ "p_holm_global":9.466954671e-19,
589
+ "p_holm_within_metric":2.028633144e-19
590
+ },
591
+ {
592
+ "metric":"mean_cert_acc_36",
593
+ "alg_a":"aol",
594
+ "alg_b":"sdp",
595
+ "n_common":121,
596
+ "n_nonzero":121,
597
+ "wins_a":7,
598
+ "wins_b":114,
599
+ "ties":0,
600
+ "win_rate_a_over_b":0.0578512397,
601
+ "mean_diff_a_minus_b":-0.2948710435,
602
+ "median_diff_a_minus_b":-0.2867985517,
603
+ "W_stat":156.0,
604
+ "p_two_sided":6.184471897e-20,
605
+ "z_equiv":-9.1410572461,
606
+ "effect_size_r":0.8310052042,
607
+ "p_holm_global":4.081751452e-18,
608
+ "p_holm_within_metric":8.658260655e-19
609
+ },
610
+ {
611
+ "metric":"mean_cert_acc_36",
612
+ "alg_a":"aol",
613
+ "alg_b":"sandwich",
614
+ "n_common":121,
615
+ "n_nonzero":121,
616
+ "wins_a":9,
617
+ "wins_b":112,
618
+ "ties":0,
619
+ "win_rate_a_over_b":0.0743801653,
620
+ "mean_diff_a_minus_b":-0.336626744,
621
+ "median_diff_a_minus_b":-0.3562658951,
622
+ "W_stat":174.0,
623
+ "p_two_sided":9.50240905e-20,
624
+ "z_equiv":-9.0944983807,
625
+ "effect_size_r":0.8267725801,
626
+ "p_holm_global":6.176565882e-18,
627
+ "p_holm_within_metric":1.235313176e-18
628
+ },
629
+ {
630
+ "metric":"mean_cert_acc_36",
631
+ "alg_a":"aol",
632
+ "alg_b":"ortho",
633
+ "n_common":121,
634
+ "n_nonzero":121,
635
+ "wins_a":9,
636
+ "wins_b":112,
637
+ "ties":0,
638
+ "win_rate_a_over_b":0.0743801653,
639
+ "mean_diff_a_minus_b":-0.3153361513,
640
+ "median_diff_a_minus_b":-0.2984701917,
641
+ "W_stat":183.5,
642
+ "p_two_sided":1.190941154e-19,
643
+ "z_equiv":-9.0699294388,
644
+ "effect_size_r":0.8245390399,
645
+ "p_holm_global":7.622023388e-18,
646
+ "p_holm_within_metric":1.429129385e-18
647
+ },
648
+ {
649
+ "metric":"mean_cert_acc_36",
650
+ "alg_a":"ldlt",
651
+ "alg_b":"sandwich",
652
+ "n_common":121,
653
+ "n_nonzero":121,
654
+ "wins_a":31,
655
+ "wins_b":90,
656
+ "ties":0,
657
+ "win_rate_a_over_b":0.2561983471,
658
+ "mean_diff_a_minus_b":-0.1618678471,
659
+ "median_diff_a_minus_b":-0.0772041827,
660
+ "W_stat":975.0,
661
+ "p_two_sided":0.0,
662
+ "z_equiv":-7.022628869,
663
+ "effect_size_r":0.6384208063,
664
+ "p_holm_global":0.0000000001,
665
+ "p_holm_within_metric":0.0
666
+ },
667
+ {
668
+ "metric":"mean_cert_acc_36",
669
+ "alg_a":"aol",
670
+ "alg_b":"ldlt",
671
+ "n_common":121,
672
+ "n_nonzero":114,
673
+ "wins_a":21,
674
+ "wins_b":93,
675
+ "ties":7,
676
+ "win_rate_a_over_b":0.2024793388,
677
+ "mean_diff_a_minus_b":-0.1747588969,
678
+ "median_diff_a_minus_b":-0.1185294129,
679
+ "W_stat":843.0,
680
+ "p_two_sided":0.0,
681
+ "z_equiv":-6.881883632,
682
+ "effect_size_r":0.6445474567,
683
+ "p_holm_global":0.0000000003,
684
+ "p_holm_within_metric":0.0000000001
685
+ },
686
+ {
687
+ "metric":"mean_cert_acc_36",
688
+ "alg_a":"ldlt",
689
+ "alg_b":"ldlt-resnet",
690
+ "n_common":121,
691
+ "n_nonzero":121,
692
+ "wins_a":36,
693
+ "wins_b":85,
694
+ "ties":0,
695
+ "win_rate_a_over_b":0.2975206612,
696
+ "mean_diff_a_minus_b":-0.1448396288,
697
+ "median_diff_a_minus_b":-0.0605440549,
698
+ "W_stat":1205.0,
699
+ "p_two_sided":0.0000000001,
700
+ "z_equiv":-6.427710033,
701
+ "effect_size_r":0.5843372757,
702
+ "p_holm_global":0.0000000051,
703
+ "p_holm_within_metric":0.0000000012
704
+ },
705
+ {
706
+ "metric":"mean_cert_acc_36",
707
+ "alg_a":"ldlt",
708
+ "alg_b":"sdp",
709
+ "n_common":121,
710
+ "n_nonzero":121,
711
+ "wins_a":36,
712
+ "wins_b":85,
713
+ "ties":0,
714
+ "win_rate_a_over_b":0.2975206612,
715
+ "mean_diff_a_minus_b":-0.1201121466,
716
+ "median_diff_a_minus_b":-0.048914969,
717
+ "W_stat":1305.0,
718
+ "p_two_sided":0.0000000007,
719
+ "z_equiv":-6.1690496695,
720
+ "effect_size_r":0.5608226972,
721
+ "p_holm_global":0.000000024,
722
+ "p_holm_within_metric":0.0000000055
723
+ },
724
+ {
725
+ "metric":"mean_cert_acc_36",
726
+ "alg_a":"ldlt",
727
+ "alg_b":"ortho",
728
+ "n_common":121,
729
+ "n_nonzero":121,
730
+ "wins_a":42,
731
+ "wins_b":79,
732
+ "ties":0,
733
+ "win_rate_a_over_b":0.347107438,
734
+ "mean_diff_a_minus_b":-0.1405772544,
735
+ "median_diff_a_minus_b":-0.053137362,
736
+ "W_stat":1489.0,
737
+ "p_two_sided":0.0000000125,
738
+ "z_equiv":-5.6931146007,
739
+ "effect_size_r":0.5175558728,
740
+ "p_holm_global":0.0000003742,
741
+ "p_holm_within_metric":0.0000000873
742
+ },
743
+ {
744
+ "metric":"mean_cert_acc_36",
745
+ "alg_a":"sandwich",
746
+ "alg_b":"sdp",
747
+ "n_common":121,
748
+ "n_nonzero":119,
749
+ "wins_a":84,
750
+ "wins_b":35,
751
+ "ties":2,
752
+ "win_rate_a_over_b":0.7024793388,
753
+ "mean_diff_a_minus_b":0.0417557005,
754
+ "median_diff_a_minus_b":0.0174162686,
755
+ "W_stat":1683.0,
756
+ "p_two_sided":0.0000005655,
757
+ "z_equiv":5.0026414386,
758
+ "effect_size_r":0.4585913888,
759
+ "p_holm_global":0.000015834,
760
+ "p_holm_within_metric":0.000003393
761
+ },
762
+ {
763
+ "metric":"mean_cert_acc_36",
764
+ "alg_a":"ortho",
765
+ "alg_b":"sandwich",
766
+ "n_common":121,
767
+ "n_nonzero":120,
768
+ "wins_a":38,
769
+ "wins_b":82,
770
+ "ties":1,
771
+ "win_rate_a_over_b":0.3181818182,
772
+ "mean_diff_a_minus_b":-0.0212905927,
773
+ "median_diff_a_minus_b":-0.0130420029,
774
+ "W_stat":2067.0,
775
+ "p_two_sided":0.00004277,
776
+ "z_equiv":-4.0919829682,
777
+ "effect_size_r":0.3735452294,
778
+ "p_holm_global":0.0008981702,
779
+ "p_holm_within_metric":0.00021385
780
+ },
781
+ {
782
+ "metric":"mean_cert_acc_36",
783
+ "alg_a":"ldlt-resnet",
784
+ "alg_b":"sdp",
785
+ "n_common":121,
786
+ "n_nonzero":120,
787
+ "wins_a":71,
788
+ "wins_b":49,
789
+ "ties":1,
790
+ "win_rate_a_over_b":0.5909090909,
791
+ "mean_diff_a_minus_b":0.0247274822,
792
+ "median_diff_a_minus_b":0.0080744923,
793
+ "W_stat":2331.0,
794
+ "p_two_sided":0.0006723776,
795
+ "z_equiv":3.4006015259,
796
+ "effect_size_r":0.3104310275,
797
+ "p_holm_global":0.010758042,
798
+ "p_holm_within_metric":0.0026895105
799
+ },
800
+ {
801
+ "metric":"mean_cert_acc_36",
802
+ "alg_a":"ldlt-resnet",
803
+ "alg_b":"sandwich",
804
+ "n_common":121,
805
+ "n_nonzero":120,
806
+ "wins_a":52,
807
+ "wins_b":68,
808
+ "ties":1,
809
+ "win_rate_a_over_b":0.4338842975,
810
+ "mean_diff_a_minus_b":-0.0170282183,
811
+ "median_diff_a_minus_b":-0.0088294149,
812
+ "W_stat":2802.0,
813
+ "p_two_sided":0.030226149,
814
+ "z_equiv":-2.1671141799,
815
+ "effect_size_r":0.1978295535,
816
+ "p_holm_global":0.3022614896,
817
+ "p_holm_within_metric":0.0906784469
818
+ },
819
+ {
820
+ "metric":"mean_cert_acc_36",
821
+ "alg_a":"ortho",
822
+ "alg_b":"sdp",
823
+ "n_common":121,
824
+ "n_nonzero":121,
825
+ "wins_a":58,
826
+ "wins_b":63,
827
+ "ties":0,
828
+ "win_rate_a_over_b":0.479338843,
829
+ "mean_diff_a_minus_b":0.0204651078,
830
+ "median_diff_a_minus_b":-0.0016042888,
831
+ "W_stat":3123.0,
832
+ "p_two_sided":0.1424837402,
833
+ "z_equiv":1.466604261,
834
+ "effect_size_r":0.1333276601,
835
+ "p_holm_global":0.9973861816,
836
+ "p_holm_within_metric":0.2849674805
837
+ },
838
+ {
839
+ "metric":"mean_cert_acc_36",
840
+ "alg_a":"ldlt-resnet",
841
+ "alg_b":"ortho",
842
+ "n_common":121,
843
+ "n_nonzero":121,
844
+ "wins_a":76,
845
+ "wins_b":45,
846
+ "ties":0,
847
+ "win_rate_a_over_b":0.6280991736,
848
+ "mean_diff_a_minus_b":0.0042623743,
849
+ "median_diff_a_minus_b":0.0059870929,
850
+ "W_stat":3225.0,
851
+ "p_two_sided":0.2290650699,
852
+ "z_equiv":1.2027706903,
853
+ "effect_size_r":0.10934279,
854
+ "p_holm_global":1.0,
855
+ "p_holm_within_metric":0.2849674805
856
+ },
857
+ {
858
+ "metric":"mean_cert_acc_72",
859
+ "alg_a":"aol",
860
+ "alg_b":"ldlt-resnet",
861
+ "n_common":121,
862
+ "n_nonzero":121,
863
+ "wins_a":1,
864
+ "wins_b":120,
865
+ "ties":0,
866
+ "win_rate_a_over_b":0.0082644628,
867
+ "mean_diff_a_minus_b":-0.3092410628,
868
+ "median_diff_a_minus_b":-0.2919858993,
869
+ "W_stat":21.0,
870
+ "p_two_sided":2.304748555e-21,
871
+ "z_equiv":-9.4902527053,
872
+ "effect_size_r":0.8627502459,
873
+ "p_holm_global":1.728561416e-19,
874
+ "p_holm_within_metric":3.457122833e-20
875
+ },
876
+ {
877
+ "metric":"mean_cert_acc_72",
878
+ "alg_a":"aol",
879
+ "alg_b":"sdp",
880
+ "n_common":121,
881
+ "n_nonzero":119,
882
+ "wins_a":1,
883
+ "wins_b":118,
884
+ "ties":2,
885
+ "win_rate_a_over_b":0.0165289256,
886
+ "mean_diff_a_minus_b":-0.2649477861,
887
+ "median_diff_a_minus_b":-0.2343178242,
888
+ "W_stat":2.0,
889
+ "p_two_sided":3.069560827e-21,
890
+ "z_equiv":-9.4603357182,
891
+ "effect_size_r":0.8672275534,
892
+ "p_holm_global":2.271475012e-19,
893
+ "p_holm_within_metric":4.297385158e-20
894
+ },
895
+ {
896
+ "metric":"mean_cert_acc_72",
897
+ "alg_a":"aol",
898
+ "alg_b":"ortho",
899
+ "n_common":121,
900
+ "n_nonzero":121,
901
+ "wins_a":6,
902
+ "wins_b":115,
903
+ "ties":0,
904
+ "win_rate_a_over_b":0.0495867769,
905
+ "mean_diff_a_minus_b":-0.2907397669,
906
+ "median_diff_a_minus_b":-0.2589285746,
907
+ "W_stat":86.5,
908
+ "p_two_sided":1.154336109e-20,
909
+ "z_equiv":-9.3208300963,
910
+ "effect_size_r":0.8473481906,
911
+ "p_holm_global":8.311219988e-19,
912
+ "p_holm_within_metric":1.500636942e-19
913
+ },
914
+ {
915
+ "metric":"mean_cert_acc_72",
916
+ "alg_a":"aol",
917
+ "alg_b":"sandwich",
918
+ "n_common":121,
919
+ "n_nonzero":121,
920
+ "wins_a":7,
921
+ "wins_b":114,
922
+ "ties":0,
923
+ "win_rate_a_over_b":0.0578512397,
924
+ "mean_diff_a_minus_b":-0.3364568783,
925
+ "median_diff_a_minus_b":-0.3205493689,
926
+ "W_stat":90.0,
927
+ "p_two_sided":1.257158705e-20,
928
+ "z_equiv":-9.311773086,
929
+ "effect_size_r":0.846524826,
930
+ "p_holm_global":8.925826805e-19,
931
+ "p_holm_within_metric":1.508590446e-19
932
+ },
933
+ {
934
+ "metric":"mean_cert_acc_72",
935
+ "alg_a":"ldlt",
936
+ "alg_b":"sandwich",
937
+ "n_common":121,
938
+ "n_nonzero":120,
939
+ "wins_a":21,
940
+ "wins_b":99,
941
+ "ties":1,
942
+ "win_rate_a_over_b":0.1776859504,
943
+ "mean_diff_a_minus_b":-0.1661887829,
944
+ "median_diff_a_minus_b":-0.0915510654,
945
+ "W_stat":608.0,
946
+ "p_two_sided":0.0,
947
+ "z_equiv":-7.9129129845,
948
+ "effect_size_r":0.7223468229,
949
+ "p_holm_global":0.0,
950
+ "p_holm_within_metric":0.0
951
+ },
952
+ {
953
+ "metric":"mean_cert_acc_72",
954
+ "alg_a":"aol",
955
+ "alg_b":"ldlt",
956
+ "n_common":121,
957
+ "n_nonzero":103,
958
+ "wins_a":10,
959
+ "wins_b":93,
960
+ "ties":18,
961
+ "win_rate_a_over_b":0.1570247934,
962
+ "mean_diff_a_minus_b":-0.1702680954,
963
+ "median_diff_a_minus_b":-0.1040100288,
964
+ "W_stat":284.0,
965
+ "p_two_sided":0.0,
966
+ "z_equiv":-7.8744204133,
967
+ "effect_size_r":0.7758896982,
968
+ "p_holm_global":0.0,
969
+ "p_holm_within_metric":0.0
970
+ },
971
+ {
972
+ "metric":"mean_cert_acc_72",
973
+ "alg_a":"ldlt",
974
+ "alg_b":"ldlt-resnet",
975
+ "n_common":121,
976
+ "n_nonzero":121,
977
+ "wins_a":30,
978
+ "wins_b":91,
979
+ "ties":0,
980
+ "win_rate_a_over_b":0.2479338843,
981
+ "mean_diff_a_minus_b":-0.1389729674,
982
+ "median_diff_a_minus_b":-0.0703703724,
983
+ "W_stat":922.0,
984
+ "p_two_sided":0.0,
985
+ "z_equiv":-7.1597188617,
986
+ "effect_size_r":0.6508835329,
987
+ "p_holm_global":0.0,
988
+ "p_holm_within_metric":0.0
989
+ },
990
+ {
991
+ "metric":"mean_cert_acc_72",
992
+ "alg_a":"sandwich",
993
+ "alg_b":"sdp",
994
+ "n_common":121,
995
+ "n_nonzero":121,
996
+ "wins_a":93,
997
+ "wins_b":28,
998
+ "ties":0,
999
+ "win_rate_a_over_b":0.7685950413,
1000
+ "mean_diff_a_minus_b":0.0715090921,
1001
+ "median_diff_a_minus_b":0.0368270464,
1002
+ "W_stat":1188.0,
1003
+ "p_two_sided":0.0000000001,
1004
+ "z_equiv":6.4716822948,
1005
+ "effect_size_r":0.5883347541,
1006
+ "p_holm_global":0.000000004,
1007
+ "p_holm_within_metric":0.0000000008
1008
+ },
1009
+ {
1010
+ "metric":"mean_cert_acc_72",
1011
+ "alg_a":"ldlt",
1012
+ "alg_b":"sdp",
1013
+ "n_common":121,
1014
+ "n_nonzero":120,
1015
+ "wins_a":34,
1016
+ "wins_b":86,
1017
+ "ties":1,
1018
+ "win_rate_a_over_b":0.2851239669,
1019
+ "mean_diff_a_minus_b":-0.0946796908,
1020
+ "median_diff_a_minus_b":-0.048577195,
1021
+ "W_stat":1161.0,
1022
+ "p_two_sided":0.0000000001,
1023
+ "z_equiv":-6.4646783724,
1024
+ "effect_size_r":0.5901416953,
1025
+ "p_holm_global":0.0000000041,
1026
+ "p_holm_within_metric":0.0000000008
1027
+ },
1028
+ {
1029
+ "metric":"mean_cert_acc_72",
1030
+ "alg_a":"ortho",
1031
+ "alg_b":"sandwich",
1032
+ "n_common":121,
1033
+ "n_nonzero":118,
1034
+ "wins_a":19,
1035
+ "wins_b":99,
1036
+ "ties":3,
1037
+ "win_rate_a_over_b":0.1694214876,
1038
+ "mean_diff_a_minus_b":-0.0457171114,
1039
+ "median_diff_a_minus_b":-0.0301288068,
1040
+ "W_stat":1121.5,
1041
+ "p_two_sided":0.0000000001,
1042
+ "z_equiv":-6.4141986325,
1043
+ "effect_size_r":0.5904748455,
1044
+ "p_holm_global":0.0000000054,
1045
+ "p_holm_within_metric":0.0000000008
1046
+ },
1047
+ {
1048
+ "metric":"mean_cert_acc_72",
1049
+ "alg_a":"ldlt",
1050
+ "alg_b":"ortho",
1051
+ "n_common":121,
1052
+ "n_nonzero":120,
1053
+ "wins_a":35,
1054
+ "wins_b":85,
1055
+ "ties":1,
1056
+ "win_rate_a_over_b":0.2933884298,
1057
+ "mean_diff_a_minus_b":-0.1204716715,
1058
+ "median_diff_a_minus_b":-0.047722198,
1059
+ "W_stat":1257.0,
1060
+ "p_two_sided":0.0000000005,
1061
+ "z_equiv":-6.2132669388,
1062
+ "effect_size_r":0.5671910764,
1063
+ "p_holm_global":0.0000000192,
1064
+ "p_holm_within_metric":0.0000000026
1065
+ },
1066
+ {
1067
+ "metric":"mean_cert_acc_72",
1068
+ "alg_a":"ldlt-resnet",
1069
+ "alg_b":"sdp",
1070
+ "n_common":121,
1071
+ "n_nonzero":121,
1072
+ "wins_a":82,
1073
+ "wins_b":39,
1074
+ "ties":0,
1075
+ "win_rate_a_over_b":0.6776859504,
1076
+ "mean_diff_a_minus_b":0.0442932766,
1077
+ "median_diff_a_minus_b":0.0152180791,
1078
+ "W_stat":1961.0,
1079
+ "p_two_sided":0.0000077405,
1080
+ "z_equiv":4.472239555,
1081
+ "effect_size_r":0.4065672323,
1082
+ "p_holm_global":0.0001780307,
1083
+ "p_holm_within_metric":0.0000309619
1084
+ },
1085
+ {
1086
+ "metric":"mean_cert_acc_72",
1087
+ "alg_a":"ldlt-resnet",
1088
+ "alg_b":"sandwich",
1089
+ "n_common":121,
1090
+ "n_nonzero":121,
1091
+ "wins_a":49,
1092
+ "wins_b":72,
1093
+ "ties":0,
1094
+ "win_rate_a_over_b":0.4049586777,
1095
+ "mean_diff_a_minus_b":-0.0272158155,
1096
+ "median_diff_a_minus_b":-0.0105392188,
1097
+ "W_stat":2635.0,
1098
+ "p_two_sided":0.0063552362,
1099
+ "z_equiv":-2.7288668349,
1100
+ "effect_size_r":0.2480788032,
1101
+ "p_holm_global":0.0826180701,
1102
+ "p_holm_within_metric":0.0190657085
1103
+ },
1104
+ {
1105
+ "metric":"mean_cert_acc_72",
1106
+ "alg_a":"ldlt-resnet",
1107
+ "alg_b":"ortho",
1108
+ "n_common":121,
1109
+ "n_nonzero":121,
1110
+ "wins_a":74,
1111
+ "wins_b":47,
1112
+ "ties":0,
1113
+ "win_rate_a_over_b":0.6115702479,
1114
+ "mean_diff_a_minus_b":0.0185012959,
1115
+ "median_diff_a_minus_b":0.011391893,
1116
+ "W_stat":2675.0,
1117
+ "p_two_sided":0.0086546544,
1118
+ "z_equiv":2.6254026895,
1119
+ "effect_size_r":0.2386729718,
1120
+ "p_holm_global":0.1038558522,
1121
+ "p_holm_within_metric":0.0190657085
1122
+ },
1123
+ {
1124
+ "metric":"mean_cert_acc_72",
1125
+ "alg_a":"ortho",
1126
+ "alg_b":"sdp",
1127
+ "n_common":121,
1128
+ "n_nonzero":121,
1129
+ "wins_a":62,
1130
+ "wins_b":59,
1131
+ "ties":0,
1132
+ "win_rate_a_over_b":0.5123966942,
1133
+ "mean_diff_a_minus_b":0.0257919807,
1134
+ "median_diff_a_minus_b":0.0024819822,
1135
+ "W_stat":2935.5,
1136
+ "p_two_sided":0.0509865142,
1137
+ "z_equiv":1.9515932587,
1138
+ "effect_size_r":0.177417569,
1139
+ "p_holm_global":0.4588786282,
1140
+ "p_holm_within_metric":0.0509865142
1141
+ },
1142
+ {
1143
+ "metric":"mean_test_acc",
1144
+ "alg_a":"aol",
1145
+ "alg_b":"ldlt",
1146
+ "n_common":121,
1147
+ "n_nonzero":121,
1148
+ "wins_a":16,
1149
+ "wins_b":105,
1150
+ "ties":0,
1151
+ "win_rate_a_over_b":0.132231405,
1152
+ "mean_diff_a_minus_b":-0.1195835257,
1153
+ "median_diff_a_minus_b":-0.0631501061,
1154
+ "W_stat":409.0,
1155
+ "p_two_sided":2.126854418e-17,
1156
+ "z_equiv":-8.4866465265,
1157
+ "effect_size_r":0.7715133206,
1158
+ "p_holm_global":0.0,
1159
+ "p_holm_within_metric":3.190281628e-16
1160
+ },
1161
+ {
1162
+ "metric":"mean_test_acc",
1163
+ "alg_a":"aol",
1164
+ "alg_b":"sandwich",
1165
+ "n_common":121,
1166
+ "n_nonzero":121,
1167
+ "wins_a":23,
1168
+ "wins_b":98,
1169
+ "ties":0,
1170
+ "win_rate_a_over_b":0.1900826446,
1171
+ "mean_diff_a_minus_b":-0.1113283867,
1172
+ "median_diff_a_minus_b":-0.0656148695,
1173
+ "W_stat":698.0,
1174
+ "p_two_sided":0.0,
1175
+ "z_equiv":-7.7391180759,
1176
+ "effect_size_r":0.7035561887,
1177
+ "p_holm_global":0.0,
1178
+ "p_holm_within_metric":0.0
1179
+ },
1180
+ {
1181
+ "metric":"mean_test_acc",
1182
+ "alg_a":"aol",
1183
+ "alg_b":"ortho",
1184
+ "n_common":121,
1185
+ "n_nonzero":121,
1186
+ "wins_a":25,
1187
+ "wins_b":96,
1188
+ "ties":0,
1189
+ "win_rate_a_over_b":0.2066115702,
1190
+ "mean_diff_a_minus_b":-0.0986620727,
1191
+ "median_diff_a_minus_b":-0.0525094743,
1192
+ "W_stat":908.0,
1193
+ "p_two_sided":0.0,
1194
+ "z_equiv":-7.1959313126,
1195
+ "effect_size_r":0.6541755739,
1196
+ "p_holm_global":0.0,
1197
+ "p_holm_within_metric":0.0
1198
+ },
1199
+ {
1200
+ "metric":"mean_test_acc",
1201
+ "alg_a":"aol",
1202
+ "alg_b":"sdp",
1203
+ "n_common":121,
1204
+ "n_nonzero":121,
1205
+ "wins_a":24,
1206
+ "wins_b":97,
1207
+ "ties":0,
1208
+ "win_rate_a_over_b":0.1983471074,
1209
+ "mean_diff_a_minus_b":-0.0961238247,
1210
+ "median_diff_a_minus_b":-0.0445100629,
1211
+ "W_stat":1047.0,
1212
+ "p_two_sided":0.0,
1213
+ "z_equiv":-6.8363934073,
1214
+ "effect_size_r":0.6214903098,
1215
+ "p_holm_global":0.0000000004,
1216
+ "p_holm_within_metric":0.0000000001
1217
+ },
1218
+ {
1219
+ "metric":"mean_test_acc",
1220
+ "alg_a":"aol",
1221
+ "alg_b":"ldlt-resnet",
1222
+ "n_common":121,
1223
+ "n_nonzero":121,
1224
+ "wins_a":27,
1225
+ "wins_b":94,
1226
+ "ties":0,
1227
+ "win_rate_a_over_b":0.2231404959,
1228
+ "mean_diff_a_minus_b":-0.0920606953,
1229
+ "median_diff_a_minus_b":-0.0356908378,
1230
+ "W_stat":1307.0,
1231
+ "p_two_sided":0.0000000007,
1232
+ "z_equiv":-6.1638764622,
1233
+ "effect_size_r":0.5603524057,
1234
+ "p_holm_global":0.0000000241,
1235
+ "p_holm_within_metric":0.0000000078
1236
+ },
1237
+ {
1238
+ "metric":"mean_test_acc",
1239
+ "alg_a":"ldlt",
1240
+ "alg_b":"sdp",
1241
+ "n_common":121,
1242
+ "n_nonzero":121,
1243
+ "wins_a":86,
1244
+ "wins_b":35,
1245
+ "ties":0,
1246
+ "win_rate_a_over_b":0.7107438017,
1247
+ "mean_diff_a_minus_b":0.023459701,
1248
+ "median_diff_a_minus_b":0.0102784065,
1249
+ "W_stat":1511.0,
1250
+ "p_two_sided":0.0000000174,
1251
+ "z_equiv":5.6362093207,
1252
+ "effect_size_r":0.5123826655,
1253
+ "p_holm_global":0.0000005041,
1254
+ "p_holm_within_metric":0.0000001738
1255
+ },
1256
+ {
1257
+ "metric":"mean_test_acc",
1258
+ "alg_a":"ldlt",
1259
+ "alg_b":"ldlt-resnet",
1260
+ "n_common":121,
1261
+ "n_nonzero":121,
1262
+ "wins_a":87,
1263
+ "wins_b":34,
1264
+ "ties":0,
1265
+ "win_rate_a_over_b":0.7190082645,
1266
+ "mean_diff_a_minus_b":0.0275228304,
1267
+ "median_diff_a_minus_b":0.0124811598,
1268
+ "W_stat":1779.0,
1269
+ "p_two_sided":0.0000007693,
1270
+ "z_equiv":4.9429995465,
1271
+ "effect_size_r":0.4493635951,
1272
+ "p_holm_global":0.000020771,
1273
+ "p_holm_within_metric":0.0000069237
1274
+ },
1275
+ {
1276
+ "metric":"mean_test_acc",
1277
+ "alg_a":"ldlt",
1278
+ "alg_b":"ortho",
1279
+ "n_common":121,
1280
+ "n_nonzero":121,
1281
+ "wins_a":78,
1282
+ "wins_b":43,
1283
+ "ties":0,
1284
+ "win_rate_a_over_b":0.6446280992,
1285
+ "mean_diff_a_minus_b":0.020921453,
1286
+ "median_diff_a_minus_b":0.010356299,
1287
+ "W_stat":2002.0,
1288
+ "p_two_sided":0.0000126434,
1289
+ "z_equiv":4.3661869359,
1290
+ "effect_size_r":0.3969260851,
1291
+ "p_holm_global":0.0002781554,
1292
+ "p_holm_within_metric":0.0001011474
1293
+ },
1294
+ {
1295
+ "metric":"mean_test_acc",
1296
+ "alg_a":"ortho",
1297
+ "alg_b":"sandwich",
1298
+ "n_common":121,
1299
+ "n_nonzero":120,
1300
+ "wins_a":39,
1301
+ "wins_b":81,
1302
+ "ties":1,
1303
+ "win_rate_a_over_b":0.326446281,
1304
+ "mean_diff_a_minus_b":-0.012666314,
1305
+ "median_diff_a_minus_b":-0.0078946893,
1306
+ "W_stat":2171.0,
1307
+ "p_two_sided":0.0001336571,
1308
+ "z_equiv":-3.8196205818,
1309
+ "effect_size_r":0.348682059,
1310
+ "p_holm_global":0.0025394851,
1311
+ "p_holm_within_metric":0.0009355998
1312
+ },
1313
+ {
1314
+ "metric":"mean_test_acc",
1315
+ "alg_a":"sandwich",
1316
+ "alg_b":"sdp",
1317
+ "n_common":121,
1318
+ "n_nonzero":121,
1319
+ "wins_a":80,
1320
+ "wins_b":41,
1321
+ "ties":0,
1322
+ "win_rate_a_over_b":0.6611570248,
1323
+ "mean_diff_a_minus_b":0.015204562,
1324
+ "median_diff_a_minus_b":0.006305895,
1325
+ "W_stat":2279.0,
1326
+ "p_two_sided":0.0002625491,
1327
+ "z_equiv":3.649697729,
1328
+ "effect_size_r":0.3317907026,
1329
+ "p_holm_global":0.0044633343,
1330
+ "p_holm_within_metric":0.0015752945
1331
+ },
1332
+ {
1333
+ "metric":"mean_test_acc",
1334
+ "alg_a":"ldlt-resnet",
1335
+ "alg_b":"sandwich",
1336
+ "n_common":121,
1337
+ "n_nonzero":121,
1338
+ "wins_a":47,
1339
+ "wins_b":74,
1340
+ "ties":0,
1341
+ "win_rate_a_over_b":0.3884297521,
1342
+ "mean_diff_a_minus_b":-0.0192676914,
1343
+ "median_diff_a_minus_b":-0.01009705,
1344
+ "W_stat":2411.0,
1345
+ "p_two_sided":0.0009387558,
1346
+ "z_equiv":-3.3082660492,
1347
+ "effect_size_r":0.300751459,
1348
+ "p_holm_global":0.0140813373,
1349
+ "p_holm_within_metric":0.0046937791
1350
+ },
1351
+ {
1352
+ "metric":"mean_test_acc",
1353
+ "alg_a":"ldlt",
1354
+ "alg_b":"sandwich",
1355
+ "n_common":121,
1356
+ "n_nonzero":120,
1357
+ "wins_a":64,
1358
+ "wins_b":56,
1359
+ "ties":1,
1360
+ "win_rate_a_over_b":0.5330578512,
1361
+ "mean_diff_a_minus_b":0.008255139,
1362
+ "median_diff_a_minus_b":0.0008221223,
1363
+ "W_stat":3145.0,
1364
+ "p_two_sided":0.2044973939,
1365
+ "z_equiv":1.2688420788,
1366
+ "effect_size_r":0.1158289047,
1367
+ "p_holm_global":1.0,
1368
+ "p_holm_within_metric":0.8179895757
1369
+ },
1370
+ {
1371
+ "metric":"mean_test_acc",
1372
+ "alg_a":"ldlt-resnet",
1373
+ "alg_b":"ortho",
1374
+ "n_common":121,
1375
+ "n_nonzero":121,
1376
+ "wins_a":54,
1377
+ "wins_b":67,
1378
+ "ties":0,
1379
+ "win_rate_a_over_b":0.4462809917,
1380
+ "mean_diff_a_minus_b":-0.0066013774,
1381
+ "median_diff_a_minus_b":-0.0023532391,
1382
+ "W_stat":3206.0,
1383
+ "p_two_sided":0.2106004159,
1384
+ "z_equiv":-1.2519161593,
1385
+ "effect_size_r":0.1138105599,
1386
+ "p_holm_global":1.0,
1387
+ "p_holm_within_metric":0.8179895757
1388
+ },
1389
+ {
1390
+ "metric":"mean_test_acc",
1391
+ "alg_a":"ortho",
1392
+ "alg_b":"sdp",
1393
+ "n_common":121,
1394
+ "n_nonzero":121,
1395
+ "wins_a":60,
1396
+ "wins_b":61,
1397
+ "ties":0,
1398
+ "win_rate_a_over_b":0.4958677686,
1399
+ "mean_diff_a_minus_b":0.0025382481,
1400
+ "median_diff_a_minus_b":-0.0000065726,
1401
+ "W_stat":3382.0,
1402
+ "p_two_sided":0.4256404345,
1403
+ "z_equiv":0.7966739196,
1404
+ "effect_size_r":0.0724249018,
1405
+ "p_holm_global":1.0,
1406
+ "p_holm_within_metric":0.8512808691
1407
+ },
1408
+ {
1409
+ "metric":"mean_test_acc",
1410
+ "alg_a":"ldlt-resnet",
1411
+ "alg_b":"sdp",
1412
+ "n_common":121,
1413
+ "n_nonzero":121,
1414
+ "wins_a":58,
1415
+ "wins_b":63,
1416
+ "ties":0,
1417
+ "win_rate_a_over_b":0.479338843,
1418
+ "mean_diff_a_minus_b":-0.0040631294,
1419
+ "median_diff_a_minus_b":-0.0009775593,
1420
+ "W_stat":3627.0,
1421
+ "p_two_sided":0.8705530556,
1422
+ "z_equiv":-0.162956029,
1423
+ "effect_size_r":0.0148141845,
1424
+ "p_holm_global":1.0,
1425
+ "p_holm_within_metric":0.8705530556
1426
+ }
1427
+ ]
UCI_N6/wilcoxon_prep_all.json ADDED
The diff for this file is too large to render. See raw diff