AbstractPhil commited on
Commit
82128cf
·
verified ·
1 Parent(s): 916d974

Ablation A-MID-baseline-s4

Browse files
A/MID/baseline/seed4/final_report.json ADDED
@@ -0,0 +1,201 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config": {
3
+ "group": "A",
4
+ "variant": "baseline",
5
+ "band": "MID",
6
+ "seed": 4,
7
+ "phase": 1,
8
+ "overrides": {},
9
+ "description": "A-MID-baseline-s4"
10
+ },
11
+ "run_config": {
12
+ "matrix_v": 64,
13
+ "D": 8,
14
+ "patch_size": 16,
15
+ "hidden": 64,
16
+ "depth": 1,
17
+ "n_cross_layers": 1,
18
+ "n_heads": 4,
19
+ "max_alpha": 0.2,
20
+ "alpha_init": -2.0,
21
+ "img_size": 64,
22
+ "batch_size": 128,
23
+ "lr": 0.0001,
24
+ "epochs": 1,
25
+ "weight_decay": 0.0,
26
+ "use_cv_ema": true,
27
+ "cv_ema_alpha": 0.01,
28
+ "cv_alignment_epochs": 0,
29
+ "cv_measure_every": 50,
30
+ "cv_sigma_scale": 0.3,
31
+ "boost": 0.5,
32
+ "cross_attn_clip": 0.5,
33
+ "allowed_types": [
34
+ 0,
35
+ 1,
36
+ 2,
37
+ 3,
38
+ 4,
39
+ 5,
40
+ 6,
41
+ 7,
42
+ 8,
43
+ 9,
44
+ 10,
45
+ 11,
46
+ 12,
47
+ 13,
48
+ 14,
49
+ 15
50
+ ],
51
+ "train_size": 1000000,
52
+ "val_size": 10000,
53
+ "num_workers": 2,
54
+ "report_every": 100,
55
+ "major_report_every": 10,
56
+ "save_every": 5,
57
+ "seed": 4,
58
+ "hf_repo": "AbstractPhil/geolip-svae-batteries",
59
+ "upload": false
60
+ },
61
+ "cv_ema_final": 0.3599670725388661,
62
+ "cv_last": 0.3347021000974292,
63
+ "predicted_band": "MID",
64
+ "expected_band": "MID",
65
+ "band_match": true,
66
+ "test_mse": 1.0100557804107666,
67
+ "recon_ema": 1.0220289967959604,
68
+ "S0": 3.543379783630371,
69
+ "SD": 2.09558367729187,
70
+ "ratio": 1.6908796365987622,
71
+ "erank": 7.888388633728027,
72
+ "observed_sphere_cv": 0.3608787914258507,
73
+ "uniform_sphere_cv_prediction": 0.35679185069620456,
74
+ "band_deviation": 0.00408694072964616,
75
+ "params_count": 183339,
76
+ "wallclock_seconds": 34.16153311729431,
77
+ "batches_completed": 1000,
78
+ "batch_limit": 1000,
79
+ "cv_trajectory": [
80
+ {
81
+ "batch": 0,
82
+ "cv": 0.3600818508493979,
83
+ "cv_ema": 0.3600818508493979,
84
+ "recon": 1.75569486618042
85
+ },
86
+ {
87
+ "batch": 50,
88
+ "cv": 0.33711562665475986,
89
+ "cv_ema": 0.35985218860745155,
90
+ "recon": 1.6380332708358765
91
+ },
92
+ {
93
+ "batch": 100,
94
+ "cv": 0.32665113742627583,
95
+ "cv_ema": 0.3595201780956398,
96
+ "recon": 1.495504379272461
97
+ },
98
+ {
99
+ "batch": 150,
100
+ "cv": 0.3508182205102274,
101
+ "cv_ema": 0.3594331585197857,
102
+ "recon": 1.2335050106048584
103
+ },
104
+ {
105
+ "batch": 200,
106
+ "cv": 0.371947341845095,
107
+ "cv_ema": 0.3595583003530388,
108
+ "recon": 1.2653498649597168
109
+ },
110
+ {
111
+ "batch": 250,
112
+ "cv": 0.33240998432863583,
113
+ "cv_ema": 0.35928681719279476,
114
+ "recon": 1.26668119430542
115
+ },
116
+ {
117
+ "batch": 300,
118
+ "cv": 0.35383638576800464,
119
+ "cv_ema": 0.35923231287854684,
120
+ "recon": 1.0561249256134033
121
+ },
122
+ {
123
+ "batch": 350,
124
+ "cv": 0.3749664130063572,
125
+ "cv_ema": 0.3593896538798249,
126
+ "recon": 1.2007616758346558
127
+ },
128
+ {
129
+ "batch": 400,
130
+ "cv": 0.39026814313458674,
131
+ "cv_ema": 0.3596984387723725,
132
+ "recon": 1.0227516889572144
133
+ },
134
+ {
135
+ "batch": 450,
136
+ "cv": 0.3798199528660714,
137
+ "cv_ema": 0.3598996539133095,
138
+ "recon": 0.9014067649841309
139
+ },
140
+ {
141
+ "batch": 500,
142
+ "cv": 0.33833482266750614,
143
+ "cv_ema": 0.3596840056008515,
144
+ "recon": 1.028473138809204
145
+ },
146
+ {
147
+ "batch": 550,
148
+ "cv": 0.35871193071775426,
149
+ "cv_ema": 0.3596742848520205,
150
+ "recon": 0.8945984840393066
151
+ },
152
+ {
153
+ "batch": 600,
154
+ "cv": 0.35962579899699704,
155
+ "cv_ema": 0.3596737999934703,
156
+ "recon": 1.046332597732544
157
+ },
158
+ {
159
+ "batch": 650,
160
+ "cv": 0.3549171823749464,
161
+ "cv_ema": 0.3596262338172851,
162
+ "recon": 1.3086342811584473
163
+ },
164
+ {
165
+ "batch": 700,
166
+ "cv": 0.3924401260737366,
167
+ "cv_ema": 0.3599543727398496,
168
+ "recon": 0.9383307695388794
169
+ },
170
+ {
171
+ "batch": 750,
172
+ "cv": 0.33259159575045844,
173
+ "cv_ema": 0.35968074496995567,
174
+ "recon": 1.2596534490585327
175
+ },
176
+ {
177
+ "batch": 800,
178
+ "cv": 0.36414357964406785,
179
+ "cv_ema": 0.3597253733166968,
180
+ "recon": 0.9013160467147827
181
+ },
182
+ {
183
+ "batch": 850,
184
+ "cv": 0.39595216010448,
185
+ "cv_ema": 0.3600876411845746,
186
+ "recon": 1.0062742233276367
187
+ },
188
+ {
189
+ "batch": 900,
190
+ "cv": 0.373550950796997,
191
+ "cv_ema": 0.3602222742806988,
192
+ "recon": 0.8960329294204712
193
+ },
194
+ {
195
+ "batch": 950,
196
+ "cv": 0.3347021000974292,
197
+ "cv_ema": 0.3599670725388661,
198
+ "recon": 1.1431188583374023
199
+ }
200
+ ]
201
+ }