thomas-schweich commited on
Commit
c62ea6a
·
verified ·
1 Parent(s): 6af51da

Update eval_results.json: probes + diagnostics from run_evals_backbone.py

Browse files
Files changed (1) hide show
  1. eval_results.json +642 -104
eval_results.json CHANGED
@@ -1,170 +1,708 @@
1
  {
2
  "probes": {
3
  "piece_type": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  "layer_7": {
5
- "accuracy": 0.8972528332996329,
6
- "loss": 0.462514906460532,
7
- "best_accuracy": 0.8972528332996329,
8
- "n_train": 485944,
9
- "n_val": 120043
10
  }
11
  },
12
  "side_to_move": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  "layer_7": {
14
- "accuracy": 0.999999999883316,
15
- "loss": 4.451842106768326e-08,
16
- "best_accuracy": 0.999999999883316,
17
- "n_train": 485944,
18
- "n_val": 120043
19
  }
20
  },
21
  "is_check": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
  "layer_7": {
23
- "accuracy": 0.9391384753419195,
24
- "loss": 0.23080479027553283,
25
- "best_accuracy": 0.942370650479162,
26
- "n_train": 485944,
27
- "n_val": 120043
28
  }
29
  },
30
  "castling_rights": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
31
  "layer_7": {
32
- "accuracy": 0.9661996117109328,
33
- "loss": 0.09139342949068821,
34
- "best_accuracy": 0.9664266137326708,
35
- "n_train": 485944,
36
- "n_val": 120043
37
  }
38
  },
39
  "ep_square": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  "layer_7": {
41
- "accuracy": 0.9960014327032223,
42
- "loss": 0.07782827074727709,
43
- "best_accuracy": 0.9971426904192073,
44
- "n_train": 485944,
45
- "n_val": 120043
46
  }
47
  },
48
  "material_count": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
49
  "layer_7": {
50
- "accuracy": 0.7550588543344782,
51
- "loss": 0.7828635349641946,
52
- "best_accuracy": 0.8613100342512295,
53
- "n_train": 485944,
54
- "n_val": 120043,
55
- "mae": 6.08153298697524
56
  }
57
  },
58
  "legal_move_count": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
59
  "layer_7": {
60
- "accuracy": 0.379081750813699,
61
- "loss": 83.04724725417708,
62
- "best_accuracy": 0.379081750813699,
63
- "n_train": 485944,
64
- "n_val": 120043,
65
- "mae": 6.84791993114902
66
  }
67
  },
68
  "halfmove_clock": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
69
  "layer_7": {
70
- "accuracy": 0.09443258406520243,
71
- "loss": 36.30150203530533,
72
- "best_accuracy": 0.11757128595164827,
73
- "n_train": 485944,
74
- "n_val": 120043,
75
- "mae": 4.078397593157374
76
  }
77
  },
78
  "game_phase": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
79
  "layer_7": {
80
- "accuracy": 0.9041093607915214,
81
- "loss": 0.25151603218794977,
82
- "best_accuracy": 0.907024982682253,
83
- "n_train": 485944,
84
- "n_val": 120043
85
  }
86
  }
87
  },
88
  "diagnostics": {
89
  "in_check": {
90
- "n_positions": 1000,
91
- "mean_legal_rate": 0.9768800000000001,
92
- "std_legal_rate": 0.06257527946401838,
93
- "mean_pad_prob": 0.00044610700723531917,
94
- "mean_entropy": 1.378539781215135,
95
- "std_entropy": 0.4953501412320156
 
96
  },
97
  "double_check": {
98
- "n_positions": 71,
99
- "mean_legal_rate": 0.9123943661971831,
100
- "std_legal_rate": 0.16090820398321937,
101
- "mean_pad_prob": 0.0003617955171410851,
102
- "mean_entropy": 1.1824169549828685,
103
- "std_entropy": 0.4335250151114159
 
104
  },
105
  "pin_restricts": {
106
- "n_positions": 1000,
107
- "mean_legal_rate": 0.97175,
108
- "std_legal_rate": 0.05368647408798607,
109
- "mean_pad_prob": 1.9187790060342758e-05,
110
- "mean_entropy": 3.195623012639582,
111
- "std_entropy": 0.5958539652673973
 
112
  },
113
  "ep_available": {
114
- "n_positions": 940,
115
- "mean_legal_rate": 0.9922553191489362,
116
- "std_legal_rate": 0.02910031665039855,
117
- "mean_pad_prob": 1.1382038407927192e-06,
118
- "mean_entropy": 3.4613142376250408,
119
- "std_entropy": 0.325010232064062
 
120
  },
121
  "castle_legal_k": {
122
- "n_positions": 1000,
123
- "mean_legal_rate": 0.9974100000000001,
124
- "std_legal_rate": 0.005813080078581411,
125
- "mean_pad_prob": 3.8981330552659286e-07,
126
- "mean_entropy": 3.5879413638114928,
127
- "std_entropy": 0.17921419256677748
 
128
  },
129
  "castle_legal_q": {
130
- "n_positions": 1000,
131
- "mean_legal_rate": 0.9958800000000001,
132
- "std_legal_rate": 0.007591152745136939,
133
- "mean_pad_prob": 4.083307937790548e-07,
134
- "mean_entropy": 3.6458762888908387,
135
- "std_entropy": 0.18727308169032228
 
136
  },
137
  "castle_blocked_check": {
138
- "n_positions": 892,
139
- "mean_legal_rate": 0.9937107623318385,
140
- "std_legal_rate": 0.01466430707907582,
141
- "mean_pad_prob": 0.00044056765007829507,
142
- "mean_entropy": 1.2424753979662841,
143
- "std_entropy": 0.5342524588211677
 
144
  },
145
  "promotion_available": {
146
- "n_positions": 1000,
147
- "mean_legal_rate": 0.9940599999999999,
148
- "std_legal_rate": 0.011735263098882794,
149
- "mean_pad_prob": 1.245503282853887e-06,
150
- "mean_entropy": 3.2927837179899218,
151
- "std_entropy": 0.46145118335448565
 
152
  },
153
  "checkmate": {
154
- "n_positions": 276,
 
155
  "mean_legal_rate": 0.0,
156
  "std_legal_rate": 0.0,
157
- "mean_pad_prob": 0.9116162136483911,
158
- "mean_entropy": 0.296485440773498,
159
- "std_entropy": 0.3978962669047925
160
  },
161
  "stalemate": {
162
- "n_positions": 41,
 
163
  "mean_legal_rate": 0.0,
164
  "std_legal_rate": 0.0,
165
- "mean_pad_prob": 0.8422023932529022,
166
- "mean_entropy": 0.30673794891889683,
167
- "std_entropy": 0.46605586628775386
168
  }
169
  }
170
  }
 
1
  {
2
  "probes": {
3
  "piece_type": {
4
+ "embed": {
5
+ "accuracy": 0.7939537763595581,
6
+ "loss": 0.8468984961509705,
7
+ "best_accuracy": 0.7941248416900635,
8
+ "n_train": 721682,
9
+ "n_val": 175570
10
+ },
11
+ "layer_0": {
12
+ "accuracy": 0.8614519834518433,
13
+ "loss": 0.48088300228118896,
14
+ "best_accuracy": 0.8614519834518433,
15
+ "n_train": 721682,
16
+ "n_val": 175570
17
+ },
18
+ "layer_1": {
19
+ "accuracy": 0.899398922920227,
20
+ "loss": 0.3235924243927002,
21
+ "best_accuracy": 0.899398922920227,
22
+ "n_train": 721682,
23
+ "n_val": 175570
24
+ },
25
+ "layer_2": {
26
+ "accuracy": 0.8952611088752747,
27
+ "loss": 0.37268662452697754,
28
+ "best_accuracy": 0.8952611088752747,
29
+ "n_train": 721682,
30
+ "n_val": 175570
31
+ },
32
+ "layer_3": {
33
+ "accuracy": 0.91811603307724,
34
+ "loss": 0.28765103220939636,
35
+ "best_accuracy": 0.91811603307724,
36
+ "n_train": 721682,
37
+ "n_val": 175570
38
+ },
39
+ "layer_4": {
40
+ "accuracy": 0.9070653319358826,
41
+ "loss": 0.3429071307182312,
42
+ "best_accuracy": 0.9071179628372192,
43
+ "n_train": 721682,
44
+ "n_val": 175570
45
+ },
46
+ "layer_5": {
47
+ "accuracy": 0.8869622945785522,
48
+ "loss": 0.46307042241096497,
49
+ "best_accuracy": 0.8869622945785522,
50
+ "n_train": 721682,
51
+ "n_val": 175570
52
+ },
53
+ "layer_6": {
54
+ "accuracy": 0.8946530818939209,
55
+ "loss": 0.6553605198860168,
56
+ "best_accuracy": 0.8946530818939209,
57
+ "n_train": 721682,
58
+ "n_val": 175570
59
+ },
60
  "layer_7": {
61
+ "accuracy": 0.8841903805732727,
62
+ "loss": 0.8387924432754517,
63
+ "best_accuracy": 0.8852172493934631,
64
+ "n_train": 721682,
65
+ "n_val": 175570
66
  }
67
  },
68
  "side_to_move": {
69
+ "embed": {
70
+ "accuracy": 0.6726946234703064,
71
+ "loss": 0.617131233215332,
72
+ "best_accuracy": 0.6737483739852905,
73
+ "n_train": 721682,
74
+ "n_val": 175570
75
+ },
76
+ "layer_0": {
77
+ "accuracy": 0.7186421155929565,
78
+ "loss": 0.5007065534591675,
79
+ "best_accuracy": 0.7200603485107422,
80
+ "n_train": 721682,
81
+ "n_val": 175570
82
+ },
83
+ "layer_1": {
84
+ "accuracy": 0.9996126890182495,
85
+ "loss": 0.0013729166239500046,
86
+ "best_accuracy": 0.9997152090072632,
87
+ "n_train": 721682,
88
+ "n_val": 175570
89
+ },
90
+ "layer_2": {
91
+ "accuracy": 1.0,
92
+ "loss": 1.0403724104435241e-07,
93
+ "best_accuracy": 1.0,
94
+ "n_train": 721682,
95
+ "n_val": 175570
96
+ },
97
+ "layer_3": {
98
+ "accuracy": 1.0,
99
+ "loss": 2.8485755976248583e-09,
100
+ "best_accuracy": 1.0,
101
+ "n_train": 721682,
102
+ "n_val": 175570
103
+ },
104
+ "layer_4": {
105
+ "accuracy": 1.0,
106
+ "loss": 2.5146256188435245e-09,
107
+ "best_accuracy": 1.0,
108
+ "n_train": 721682,
109
+ "n_val": 175570
110
+ },
111
+ "layer_5": {
112
+ "accuracy": 1.0,
113
+ "loss": 1.8359436193549072e-09,
114
+ "best_accuracy": 1.0,
115
+ "n_train": 721682,
116
+ "n_val": 175570
117
+ },
118
+ "layer_6": {
119
+ "accuracy": 1.0,
120
+ "loss": 5.28788575593353e-07,
121
+ "best_accuracy": 1.0,
122
+ "n_train": 721682,
123
+ "n_val": 175570
124
+ },
125
  "layer_7": {
126
+ "accuracy": 0.9997778534889221,
127
+ "loss": 0.002000772627070546,
128
+ "best_accuracy": 0.9998462200164795,
129
+ "n_train": 721682,
130
+ "n_val": 175570
131
  }
132
  },
133
  "is_check": {
134
+ "embed": {
135
+ "accuracy": 0.9438571333885193,
136
+ "loss": 0.2128543257713318,
137
+ "best_accuracy": 0.9438571333885193,
138
+ "n_train": 721682,
139
+ "n_val": 175570
140
+ },
141
+ "layer_0": {
142
+ "accuracy": 0.9444608688354492,
143
+ "loss": 0.1777006834745407,
144
+ "best_accuracy": 0.9445463418960571,
145
+ "n_train": 721682,
146
+ "n_val": 175570
147
+ },
148
+ "layer_1": {
149
+ "accuracy": 0.9497294425964355,
150
+ "loss": 0.13770730793476105,
151
+ "best_accuracy": 0.9497294425964355,
152
+ "n_train": 721682,
153
+ "n_val": 175570
154
+ },
155
+ "layer_2": {
156
+ "accuracy": 0.9498946070671082,
157
+ "loss": 0.1334017962217331,
158
+ "best_accuracy": 0.9500312805175781,
159
+ "n_train": 721682,
160
+ "n_val": 175570
161
+ },
162
+ "layer_3": {
163
+ "accuracy": 0.948766827583313,
164
+ "loss": 0.13876499235630035,
165
+ "best_accuracy": 0.9489434361457825,
166
+ "n_train": 721682,
167
+ "n_val": 175570
168
+ },
169
+ "layer_4": {
170
+ "accuracy": 0.948692798614502,
171
+ "loss": 0.13251903653144836,
172
+ "best_accuracy": 0.9488409161567688,
173
+ "n_train": 721682,
174
+ "n_val": 175570
175
+ },
176
+ "layer_5": {
177
+ "accuracy": 0.9457025527954102,
178
+ "loss": 0.15899775922298431,
179
+ "best_accuracy": 0.9465056657791138,
180
+ "n_train": 721682,
181
+ "n_val": 175570
182
+ },
183
+ "layer_6": {
184
+ "accuracy": 0.9412370920181274,
185
+ "loss": 0.22216182947158813,
186
+ "best_accuracy": 0.9436520934104919,
187
+ "n_train": 721682,
188
+ "n_val": 175570
189
+ },
190
  "layer_7": {
191
+ "accuracy": 0.9402061700820923,
192
+ "loss": 0.24624347686767578,
193
+ "best_accuracy": 0.9422793984413147,
194
+ "n_train": 721682,
195
+ "n_val": 175570
196
  }
197
  },
198
  "castling_rights": {
199
+ "embed": {
200
+ "accuracy": 0.9315600395202637,
201
+ "loss": 0.22545865178108215,
202
+ "best_accuracy": 0.9315600395202637,
203
+ "n_train": 721682,
204
+ "n_val": 175570
205
+ },
206
+ "layer_0": {
207
+ "accuracy": 0.9853334426879883,
208
+ "loss": 0.03903070092201233,
209
+ "best_accuracy": 0.9853420257568359,
210
+ "n_train": 721682,
211
+ "n_val": 175570
212
+ },
213
+ "layer_1": {
214
+ "accuracy": 0.9914606213569641,
215
+ "loss": 0.021991031244397163,
216
+ "best_accuracy": 0.991588830947876,
217
+ "n_train": 721682,
218
+ "n_val": 175570
219
+ },
220
+ "layer_2": {
221
+ "accuracy": 0.9929686188697815,
222
+ "loss": 0.017853515222668648,
223
+ "best_accuracy": 0.9930654168128967,
224
+ "n_train": 721682,
225
+ "n_val": 175570
226
+ },
227
+ "layer_3": {
228
+ "accuracy": 0.9865978956222534,
229
+ "loss": 0.03318539634346962,
230
+ "best_accuracy": 0.9868285655975342,
231
+ "n_train": 721682,
232
+ "n_val": 175570
233
+ },
234
+ "layer_4": {
235
+ "accuracy": 0.9831904172897339,
236
+ "loss": 0.04187026247382164,
237
+ "best_accuracy": 0.9836090803146362,
238
+ "n_train": 721682,
239
+ "n_val": 175570
240
+ },
241
+ "layer_5": {
242
+ "accuracy": 0.9788687825202942,
243
+ "loss": 0.058379411697387695,
244
+ "best_accuracy": 0.9798797965049744,
245
+ "n_train": 721682,
246
+ "n_val": 175570
247
+ },
248
+ "layer_6": {
249
+ "accuracy": 0.9751836657524109,
250
+ "loss": 0.0907355323433876,
251
+ "best_accuracy": 0.9754883646965027,
252
+ "n_train": 721682,
253
+ "n_val": 175570
254
+ },
255
  "layer_7": {
256
+ "accuracy": 0.9707794189453125,
257
+ "loss": 0.11967474222183228,
258
+ "best_accuracy": 0.9712464809417725,
259
+ "n_train": 721682,
260
+ "n_val": 175570
261
  }
262
  },
263
  "ep_square": {
264
+ "embed": {
265
+ "accuracy": 0.9986899495124817,
266
+ "loss": 0.01372161041945219,
267
+ "best_accuracy": 0.9986899495124817,
268
+ "n_train": 721682,
269
+ "n_val": 175570
270
+ },
271
+ "layer_0": {
272
+ "accuracy": 0.998684287071228,
273
+ "loss": 0.011701500043272972,
274
+ "best_accuracy": 0.9986899495124817,
275
+ "n_train": 721682,
276
+ "n_val": 175570
277
+ },
278
+ "layer_1": {
279
+ "accuracy": 0.9981716275215149,
280
+ "loss": 0.006189861800521612,
281
+ "best_accuracy": 0.9985817670822144,
282
+ "n_train": 721682,
283
+ "n_val": 175570
284
+ },
285
+ "layer_2": {
286
+ "accuracy": 0.9982627630233765,
287
+ "loss": 0.006863097194582224,
288
+ "best_accuracy": 0.9985817670822144,
289
+ "n_train": 721682,
290
+ "n_val": 175570
291
+ },
292
+ "layer_3": {
293
+ "accuracy": 0.9990431070327759,
294
+ "loss": 0.003790292190387845,
295
+ "best_accuracy": 0.9991456270217896,
296
+ "n_train": 721682,
297
+ "n_val": 175570
298
+ },
299
+ "layer_4": {
300
+ "accuracy": 0.9987013339996338,
301
+ "loss": 0.007270838599652052,
302
+ "best_accuracy": 0.9988323450088501,
303
+ "n_train": 721682,
304
+ "n_val": 175570
305
+ },
306
+ "layer_5": {
307
+ "accuracy": 0.9974995255470276,
308
+ "loss": 0.026773931458592415,
309
+ "best_accuracy": 0.9982684850692749,
310
+ "n_train": 721682,
311
+ "n_val": 175570
312
+ },
313
+ "layer_6": {
314
+ "accuracy": 0.9960300326347351,
315
+ "loss": 0.0977015346288681,
316
+ "best_accuracy": 0.9980349540710449,
317
+ "n_train": 721682,
318
+ "n_val": 175570
319
+ },
320
  "layer_7": {
321
+ "accuracy": 0.9952667951583862,
322
+ "loss": 0.13185012340545654,
323
+ "best_accuracy": 0.9978071451187134,
324
+ "n_train": 721682,
325
+ "n_val": 175570
326
  }
327
  },
328
  "material_count": {
329
+ "embed": {
330
+ "accuracy": 0.034823477268218994,
331
+ "loss": 1.8249613046646118,
332
+ "best_accuracy": 0.03692054748535156,
333
+ "n_train": 721682,
334
+ "n_val": 175570,
335
+ "mae": 9.569934844970703
336
+ },
337
+ "layer_0": {
338
+ "accuracy": 0.7515236735343933,
339
+ "loss": 0.46982043981552124,
340
+ "best_accuracy": 0.7537726759910583,
341
+ "n_train": 721682,
342
+ "n_val": 175570,
343
+ "mae": 5.040376663208008
344
+ },
345
+ "layer_1": {
346
+ "accuracy": 0.7843592762947083,
347
+ "loss": 0.4077347218990326,
348
+ "best_accuracy": 0.8040273189544678,
349
+ "n_train": 721682,
350
+ "n_val": 175570,
351
+ "mae": 4.520277500152588
352
+ },
353
+ "layer_2": {
354
+ "accuracy": 0.7963148355484009,
355
+ "loss": 0.3851289749145508,
356
+ "best_accuracy": 0.8129063844680786,
357
+ "n_train": 721682,
358
+ "n_val": 175570,
359
+ "mae": 4.381388187408447
360
+ },
361
+ "layer_3": {
362
+ "accuracy": 0.8059321641921997,
363
+ "loss": 0.3669446110725403,
364
+ "best_accuracy": 0.8202922940254211,
365
+ "n_train": 721682,
366
+ "n_val": 175570,
367
+ "mae": 4.309057712554932
368
+ },
369
+ "layer_4": {
370
+ "accuracy": 0.8212227821350098,
371
+ "loss": 0.33803296089172363,
372
+ "best_accuracy": 0.8356728553771973,
373
+ "n_train": 721682,
374
+ "n_val": 175570,
375
+ "mae": 4.076085090637207
376
+ },
377
+ "layer_5": {
378
+ "accuracy": 0.833043098449707,
379
+ "loss": 0.3156830370426178,
380
+ "best_accuracy": 0.8350316882133484,
381
+ "n_train": 721682,
382
+ "n_val": 175570,
383
+ "mae": 3.93052077293396
384
+ },
385
+ "layer_6": {
386
+ "accuracy": 0.8065394163131714,
387
+ "loss": 0.36579638719558716,
388
+ "best_accuracy": 0.81328946352005,
389
+ "n_train": 721682,
390
+ "n_val": 175570,
391
+ "mae": 4.352488994598389
392
+ },
393
  "layer_7": {
394
+ "accuracy": 0.7795088887214661,
395
+ "loss": 0.41690582036972046,
396
+ "best_accuracy": 0.7882944345474243,
397
+ "n_train": 721682,
398
+ "n_val": 175570,
399
+ "mae": 4.678890228271484
400
  }
401
  },
402
  "legal_move_count": {
403
+ "embed": {
404
+ "accuracy": 0.008694469928741455,
405
+ "loss": 149.88076782226562,
406
+ "best_accuracy": 0.00975710153579712,
407
+ "n_train": 721682,
408
+ "n_val": 175570,
409
+ "mae": 10.171092987060547
410
+ },
411
+ "layer_0": {
412
+ "accuracy": 0.43983858823776245,
413
+ "loss": 84.69378662109375,
414
+ "best_accuracy": 0.43983858823776245,
415
+ "n_train": 721682,
416
+ "n_val": 175570,
417
+ "mae": 7.150360584259033
418
+ },
419
+ "layer_1": {
420
+ "accuracy": 0.5228815078735352,
421
+ "loss": 72.13809204101562,
422
+ "best_accuracy": 0.5228815078735352,
423
+ "n_train": 721682,
424
+ "n_val": 175570,
425
+ "mae": 6.5377326011657715
426
+ },
427
+ "layer_2": {
428
+ "accuracy": 0.5866934061050415,
429
+ "loss": 62.49002456665039,
430
+ "best_accuracy": 0.5866934061050415,
431
+ "n_train": 721682,
432
+ "n_val": 175570,
433
+ "mae": 6.011066436767578
434
+ },
435
+ "layer_3": {
436
+ "accuracy": 0.5604725480079651,
437
+ "loss": 66.45449829101562,
438
+ "best_accuracy": 0.5607300996780396,
439
+ "n_train": 721682,
440
+ "n_val": 175570,
441
+ "mae": 6.218656063079834
442
+ },
443
+ "layer_4": {
444
+ "accuracy": 0.6754791140556335,
445
+ "loss": 49.0660400390625,
446
+ "best_accuracy": 0.6755585670471191,
447
+ "n_train": 721682,
448
+ "n_val": 175570,
449
+ "mae": 5.165564060211182
450
+ },
451
+ "layer_5": {
452
+ "accuracy": 0.6420835256576538,
453
+ "loss": 54.11530303955078,
454
+ "best_accuracy": 0.6492248773574829,
455
+ "n_train": 721682,
456
+ "n_val": 175570,
457
+ "mae": 5.334083557128906
458
+ },
459
+ "layer_6": {
460
+ "accuracy": 0.5348567962646484,
461
+ "loss": 70.32747650146484,
462
+ "best_accuracy": 0.567049503326416,
463
+ "n_train": 721682,
464
+ "n_val": 175570,
465
+ "mae": 6.1242218017578125
466
+ },
467
  "layer_7": {
468
+ "accuracy": 0.39110326766967773,
469
+ "loss": 92.06233978271484,
470
+ "best_accuracy": 0.42400068044662476,
471
+ "n_train": 721682,
472
+ "n_val": 175570,
473
+ "mae": 7.249655723571777
474
  }
475
  },
476
  "halfmove_clock": {
477
+ "embed": {
478
+ "accuracy": 0.005232453346252441,
479
+ "loss": 492.56304931640625,
480
+ "best_accuracy": 0.006348371505737305,
481
+ "n_train": 721682,
482
+ "n_val": 175570,
483
+ "mae": 14.510623931884766
484
+ },
485
+ "layer_0": {
486
+ "accuracy": 0.37127983570098877,
487
+ "loss": 311.3132629394531,
488
+ "best_accuracy": 0.37127983570098877,
489
+ "n_train": 721682,
490
+ "n_val": 175570,
491
+ "mae": 11.005152702331543
492
+ },
493
+ "layer_1": {
494
+ "accuracy": 0.43745899200439453,
495
+ "loss": 278.5444030761719,
496
+ "best_accuracy": 0.43745899200439453,
497
+ "n_train": 721682,
498
+ "n_val": 175570,
499
+ "mae": 10.431397438049316
500
+ },
501
+ "layer_2": {
502
+ "accuracy": 0.4526997208595276,
503
+ "loss": 270.9978942871094,
504
+ "best_accuracy": 0.4536823034286499,
505
+ "n_train": 721682,
506
+ "n_val": 175570,
507
+ "mae": 10.503276824951172
508
+ },
509
+ "layer_3": {
510
+ "accuracy": 0.4739035964012146,
511
+ "loss": 260.4986877441406,
512
+ "best_accuracy": 0.4743286967277527,
513
+ "n_train": 721682,
514
+ "n_val": 175570,
515
+ "mae": 10.437573432922363
516
+ },
517
+ "layer_4": {
518
+ "accuracy": 0.45564568042755127,
519
+ "loss": 269.5391540527344,
520
+ "best_accuracy": 0.45679765939712524,
521
+ "n_train": 721682,
522
+ "n_val": 175570,
523
+ "mae": 10.679705619812012
524
+ },
525
+ "layer_5": {
526
+ "accuracy": 0.4151163101196289,
527
+ "loss": 289.6074523925781,
528
+ "best_accuracy": 0.4151163101196289,
529
+ "n_train": 721682,
530
+ "n_val": 175570,
531
+ "mae": 11.022024154663086
532
+ },
533
+ "layer_6": {
534
+ "accuracy": 0.3814623951911926,
535
+ "loss": 306.27130126953125,
536
+ "best_accuracy": 0.3814623951911926,
537
+ "n_train": 721682,
538
+ "n_val": 175570,
539
+ "mae": 11.431619644165039
540
+ },
541
  "layer_7": {
542
+ "accuracy": 0.3014959692955017,
543
+ "loss": 345.86700439453125,
544
+ "best_accuracy": 0.3069889545440674,
545
+ "n_train": 721682,
546
+ "n_val": 175570,
547
+ "mae": 12.022778511047363
548
  }
549
  },
550
  "game_phase": {
551
+ "embed": {
552
+ "accuracy": 0.622520923614502,
553
+ "loss": 0.7939810752868652,
554
+ "best_accuracy": 0.6229594945907593,
555
+ "n_train": 721682,
556
+ "n_val": 175570
557
+ },
558
+ "layer_0": {
559
+ "accuracy": 0.9163581132888794,
560
+ "loss": 0.1934569925069809,
561
+ "best_accuracy": 0.9167283773422241,
562
+ "n_train": 721682,
563
+ "n_val": 175570
564
+ },
565
+ "layer_1": {
566
+ "accuracy": 0.9480605721473694,
567
+ "loss": 0.120170958340168,
568
+ "best_accuracy": 0.9480605721473694,
569
+ "n_train": 721682,
570
+ "n_val": 175570
571
+ },
572
+ "layer_2": {
573
+ "accuracy": 0.9529076218605042,
574
+ "loss": 0.10889476537704468,
575
+ "best_accuracy": 0.9529076218605042,
576
+ "n_train": 721682,
577
+ "n_val": 175570
578
+ },
579
+ "layer_3": {
580
+ "accuracy": 0.9525943994522095,
581
+ "loss": 0.11166463047266006,
582
+ "best_accuracy": 0.9525943994522095,
583
+ "n_train": 721682,
584
+ "n_val": 175570
585
+ },
586
+ "layer_4": {
587
+ "accuracy": 0.9572990536689758,
588
+ "loss": 0.10107019543647766,
589
+ "best_accuracy": 0.9584438800811768,
590
+ "n_train": 721682,
591
+ "n_val": 175570
592
+ },
593
+ "layer_5": {
594
+ "accuracy": 0.9517115354537964,
595
+ "loss": 0.13210734724998474,
596
+ "best_accuracy": 0.9521843194961548,
597
+ "n_train": 721682,
598
+ "n_val": 175570
599
+ },
600
+ "layer_6": {
601
+ "accuracy": 0.9353192448616028,
602
+ "loss": 0.27813100814819336,
603
+ "best_accuracy": 0.9375462532043457,
604
+ "n_train": 721682,
605
+ "n_val": 175570
606
+ },
607
  "layer_7": {
608
+ "accuracy": 0.9186364412307739,
609
+ "loss": 0.38030770421028137,
610
+ "best_accuracy": 0.9187902212142944,
611
+ "n_train": 721682,
612
+ "n_val": 175570
613
  }
614
  }
615
  },
616
  "diagnostics": {
617
  "in_check": {
618
+ "n_positions": 10000,
619
+ "terminal": false,
620
+ "mean_legal_rate": 0.9907619999999999,
621
+ "std_legal_rate": 0.030408211982949608,
622
+ "mean_pad_prob": 0.0007640491741631124,
623
+ "mean_entropy": 1.360506830084973,
624
+ "std_entropy": 0.4851868447382186
625
  },
626
  "double_check": {
627
+ "n_positions": 10000,
628
+ "terminal": false,
629
+ "mean_legal_rate": 0.968241,
630
+ "std_legal_rate": 0.06678679449561867,
631
+ "mean_pad_prob": 0.001569394861201583,
632
+ "mean_entropy": 1.098989733998195,
633
+ "std_entropy": 0.41889251754830115
634
  },
635
  "pin_restricts": {
636
+ "n_positions": 10000,
637
+ "terminal": false,
638
+ "mean_legal_rate": 0.9892730000000002,
639
+ "std_legal_rate": 0.021233027834013693,
640
+ "mean_pad_prob": 8.378310395977987e-05,
641
+ "mean_entropy": 3.179187242682418,
642
+ "std_entropy": 0.614420535115668
643
  },
644
  "ep_available": {
645
+ "n_positions": 10000,
646
+ "terminal": false,
647
+ "mean_legal_rate": 0.995693,
648
+ "std_legal_rate": 0.01136044677818615,
649
+ "mean_pad_prob": 4.877161065352252e-05,
650
+ "mean_entropy": 3.465905277723074,
651
+ "std_entropy": 0.3122574852442407
652
  },
653
  "castle_legal_k": {
654
+ "n_positions": 10000,
655
+ "terminal": false,
656
+ "mean_legal_rate": 0.9979520000000001,
657
+ "std_legal_rate": 0.0048400099173452156,
658
+ "mean_pad_prob": 7.714506284892467e-08,
659
+ "mean_entropy": 3.5851313720464706,
660
+ "std_entropy": 0.1854135106810934
661
  },
662
  "castle_legal_q": {
663
+ "n_positions": 10000,
664
+ "terminal": false,
665
+ "mean_legal_rate": 0.9969480000000002,
666
+ "std_legal_rate": 0.006473430002711087,
667
+ "mean_pad_prob": 8.240626183083216e-08,
668
+ "mean_entropy": 3.6590794766902923,
669
+ "std_entropy": 0.18080142984059425
670
  },
671
  "castle_blocked_check": {
672
+ "n_positions": 10000,
673
+ "terminal": false,
674
+ "mean_legal_rate": 0.9961120000000001,
675
+ "std_legal_rate": 0.010133284561286142,
676
+ "mean_pad_prob": 0.0004383320852224248,
677
+ "mean_entropy": 1.2391307091199792,
678
+ "std_entropy": 0.5261870073605922
679
  },
680
  "promotion_available": {
681
+ "n_positions": 10000,
682
+ "terminal": false,
683
+ "mean_legal_rate": 0.997017,
684
+ "std_legal_rate": 0.007707899259850253,
685
+ "mean_pad_prob": 9.902012749442277e-06,
686
+ "mean_entropy": 3.209924154102802,
687
+ "std_entropy": 0.479078440343986
688
  },
689
  "checkmate": {
690
+ "n_positions": 10000,
691
+ "terminal": true,
692
  "mean_legal_rate": 0.0,
693
  "std_legal_rate": 0.0,
694
+ "mean_pad_prob": 0.9151065862635662,
695
+ "mean_entropy": 0.314861747341415,
696
+ "std_entropy": 0.4386393359006536
697
  },
698
  "stalemate": {
699
+ "n_positions": 10000,
700
+ "terminal": true,
701
  "mean_legal_rate": 0.0,
702
  "std_legal_rate": 0.0,
703
+ "mean_pad_prob": 0.9670851592363986,
704
+ "mean_entropy": 0.09786651973089533,
705
+ "std_entropy": 0.2625593175802058
706
  }
707
  }
708
  }