TheodoreEhrenborg commited on
Commit
a89b8ae
·
verified ·
1 Parent(s): 1fbef1e

Upload results.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. results.json +94 -0
results.json ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "d_sae": 16384,
3
+ "actual_l0": 47.6956591,
4
+ "effective_l0": 25,
5
+ "cross_entropy": 181.97386730957032,
6
+ "sae_type": "gemmascope",
7
+ "sae_release": "gemma-scope-2b-pt-res",
8
+ "num_tokens": 10000000,
9
+ "num_epochs": 1,
10
+ "lr": 0.0005,
11
+ "loaded_dag": null,
12
+ "allow_negative_influence": false,
13
+ "history": {
14
+ "train_loss": [
15
+ 293.03616899762835,
16
+ 258.30179617745534,
17
+ 235.7053546360561,
18
+ 220.71944950648717,
19
+ 210.05808933803013,
20
+ 202.00115487234933,
21
+ 196.05209132603235,
22
+ 191.12095217023577,
23
+ 187.18564692905971,
24
+ 183.54394280569895,
25
+ 183.36030752999443
26
+ ],
27
+ "train_steps": [
28
+ 140,
29
+ 280,
30
+ 420,
31
+ 560,
32
+ 700,
33
+ 840,
34
+ 980,
35
+ 1120,
36
+ 1260,
37
+ 1400,
38
+ 1407
39
+ ],
40
+ "val_loss": [
41
+ 273.068134765625,
42
+ 245.38075861816407,
43
+ 227.24295302734376,
44
+ 214.81135705566408,
45
+ 205.78304479980468,
46
+ 198.97213388671875,
47
+ 193.5232102783203,
48
+ 189.05871796875,
49
+ 185.3210973144531,
50
+ 182.09052497558594,
51
+ 181.97386730957032
52
+ ],
53
+ "val_cross_entropy": [
54
+ 273.068134765625,
55
+ 245.38075861816407,
56
+ 227.24295302734376,
57
+ 214.81135705566408,
58
+ 205.78304479980468,
59
+ 198.97213388671875,
60
+ 193.5232102783203,
61
+ 189.05871796875,
62
+ 185.3210973144531,
63
+ 182.09052497558594,
64
+ 181.97386730957032
65
+ ],
66
+ "effective_l0": [
67
+ 40,
68
+ 35,
69
+ 32,
70
+ 30,
71
+ 29,
72
+ 28,
73
+ 27,
74
+ 26,
75
+ 26,
76
+ 25,
77
+ 25
78
+ ],
79
+ "val_steps": [
80
+ 140,
81
+ 280,
82
+ 420,
83
+ 560,
84
+ 700,
85
+ 840,
86
+ 980,
87
+ 1120,
88
+ 1260,
89
+ 1400,
90
+ 1407
91
+ ]
92
+ },
93
+ "sae_id": "layer_12/width_16k/average_l0_41"
94
+ }