TheodoreEhrenborg commited on
Commit
4babc3a
·
verified ·
1 Parent(s): d632da1

Upload results.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. results.json +94 -0
results.json ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "d_sae": 4096,
3
+ "actual_l0": 79.9205251,
4
+ "effective_l0": 42,
5
+ "cross_entropy": 228.38722282714843,
6
+ "sae_type": "saebench",
7
+ "sae_release": "adamkarvonen/saebench_gemma-2-2b_width-2pow12_date-0108",
8
+ "num_tokens": 10000000,
9
+ "num_epochs": 1,
10
+ "lr": 0.0005,
11
+ "loaded_dag": null,
12
+ "allow_negative_influence": false,
13
+ "history": {
14
+ "train_loss": [
15
+ 373.0598709106445,
16
+ 296.3568134852818,
17
+ 271.22952662876673,
18
+ 257.95599496023993,
19
+ 249.27438975742885,
20
+ 242.92079282488143,
21
+ 238.3831261771066,
22
+ 235.0788822719029,
23
+ 232.04134761265345,
24
+ 229.43816942487445,
25
+ 229.34045748029436
26
+ ],
27
+ "train_steps": [
28
+ 140,
29
+ 280,
30
+ 420,
31
+ 560,
32
+ 700,
33
+ 840,
34
+ 980,
35
+ 1120,
36
+ 1260,
37
+ 1400,
38
+ 1407
39
+ ],
40
+ "val_loss": [
41
+ 317.3101373046875,
42
+ 280.5291108398437,
43
+ 263.3136259277344,
44
+ 252.9333521484375,
45
+ 245.83410717773438,
46
+ 240.5973893798828,
47
+ 236.54287941894532,
48
+ 233.30607668457031,
49
+ 230.65738371582032,
50
+ 228.45383054199218,
51
+ 228.38722282714843
52
+ ],
53
+ "val_cross_entropy": [
54
+ 317.3101373046875,
55
+ 280.5291108398437,
56
+ 263.3136259277344,
57
+ 252.9333521484375,
58
+ 245.83410717773438,
59
+ 240.5973893798828,
60
+ 236.54287941894532,
61
+ 233.30607668457031,
62
+ 230.65738371582032,
63
+ 228.45383054199218,
64
+ 228.38722282714843
65
+ ],
66
+ "effective_l0": [
67
+ 62,
68
+ 54,
69
+ 50,
70
+ 47,
71
+ 46,
72
+ 44,
73
+ 44,
74
+ 43,
75
+ 42,
76
+ 42,
77
+ 42
78
+ ],
79
+ "val_steps": [
80
+ 140,
81
+ 280,
82
+ 420,
83
+ 560,
84
+ 700,
85
+ 840,
86
+ 980,
87
+ 1120,
88
+ 1260,
89
+ 1400,
90
+ 1407
91
+ ]
92
+ },
93
+ "sae_id": "MatryoshkaBatchTopK_gemma-2-2b__0108/resid_post_layer_12/trainer_2"
94
+ }