Sardean commited on
Commit
32b1d79
·
verified ·
1 Parent(s): d0623bc

Upload folder using huggingface_hub

Browse files
qwen3_06B.blocks.12.hook_resid_post.sae.sparsity40.mse0.001.kl0.01.physics10.exp8/history.json CHANGED
@@ -1,427 +1,427 @@
1
  {
2
  "loss": [
3
- 161.37722034741165,
4
- 14.045179295360594,
5
- 8.077628720075564,
6
- 4.122583417964161,
7
- 2.5219415246992183,
8
- 2.06097466156895,
9
- 1.8829072238807392,
10
- 1.7795192836818838,
11
- 1.714775740652156,
12
- 1.6608511110893767,
13
- 1.6202158954806793,
14
- 1.5819957202538513,
15
- 1.564438405789827,
16
- 1.5533855481255323,
17
- 1.5221090262993835
18
  ],
19
  "recon_loss": [
20
- 140.0506628500788,
21
- 0.7326222425116632,
22
- 0.5893944154556533,
23
- 0.5036597919643373,
24
- 0.43890226357861567,
25
- 0.40398927693976494,
26
- 0.37996214292103186,
27
- 0.36091685339920504,
28
- 0.34693841591365354,
29
- 0.3360904577307235,
30
- 0.3267555362299869,
31
- 0.31791340408468605,
32
- 0.31509057169121907,
33
- 0.31370528064724196,
34
- 0.30467172941767184
35
  ],
36
  "l1_loss": [
37
- 0.42969512043142677,
38
- 0.32295431129466323,
39
- 0.17879747386489594,
40
- 0.08334885067061375,
41
- 0.045875783645568935,
42
- 0.03566838005431613,
43
- 0.03240059402988369,
44
- 0.030739469285634227,
45
- 0.02970616555863753,
46
- 0.028877815693840944,
47
- 0.02822135618530718,
48
- 0.027641708129330686,
49
- 0.027252375155239178,
50
- 0.02695890189729687,
51
- 0.0266966949308053
52
  ],
53
  "sparsity": [
54
- 1024.7620009802338,
55
- 444.39608420465225,
56
- 253.88346656283042,
57
- 154.66245958141815,
58
- 108.07653016972363,
59
- 85.74527901097348,
60
- 72.25553965747804,
61
- 63.05037388048674,
62
- 56.60644691868832,
63
- 51.73212272242496,
64
- 48.164667516722716,
65
- 44.760779330604954,
66
- 42.48158496483824,
67
- 40.17802219821098,
68
- 38.265156251147275
69
  ],
70
  "recon_contribution": [
71
- 140.0506628500788,
72
- 0.7326222425116632,
73
- 0.5893944154556533,
74
- 0.5036597919643373,
75
- 0.43890226357861567,
76
- 0.40398927693976494,
77
- 0.37996214292103186,
78
- 0.36091685339920504,
79
- 0.34693841591365354,
80
- 0.3360904577307235,
81
- 0.3267555362299869,
82
- 0.31791340408468605,
83
- 0.31509057169121907,
84
- 0.31370528064724196,
85
- 0.30467172941767184
86
  ],
87
  "l1_contribution": [
88
- 17.187804788575136,
89
- 12.918172441927114,
90
- 7.151898925465749,
91
- 3.3339540205503764,
92
- 1.835031339100429,
93
- 1.4267352003800242,
94
- 1.2960237632120462,
95
- 1.2295787684003214,
96
- 1.1882466221214236,
97
- 1.1551126277536379,
98
- 1.1288542496530634,
99
- 1.1056683256213826,
100
- 1.0900950077781104,
101
- 1.0783560760039137,
102
- 1.0678677984646388
103
  ],
104
  "total_post_layer_mse": [
105
- 3466.1193810029135,
106
- 135.72650228855306,
107
- 109.76233570378525,
108
- 93.65179983341605,
109
- 82.23118221849427,
110
- 75.90325397902862,
111
- 70.13544425233863,
112
- 65.51640337996913,
113
- 62.85051740336239,
114
- 59.94068668323352,
115
- 58.36495986648072,
116
- 56.418407248823264,
117
- 56.196124968896235,
118
- 56.38954164972879,
119
- 54.015165600225444
120
  ],
121
  "block_mse_contribution": [
122
- 3.466119538798326,
123
- 0.13572650898074648,
124
- 0.10976234104666382,
125
- 0.09365180433492344,
126
- 0.08223118611389975,
127
- 0.07590325756976206,
128
- 0.07013544758092052,
129
- 0.06551640639908758,
130
- 0.0628505203381874,
131
- 0.05994068948430345,
132
- 0.058364962591331004,
133
- 0.056418409908480974,
134
- 0.056196127630878744,
135
- 0.05638954432854513,
136
- 0.0540151681478137
137
  ],
138
  "13_mse": [
139
- 141.05547107431227,
140
- 0.9044712454752815,
141
- 0.6802906644971747,
142
- 0.5671232255329763,
143
- 0.4921112134492487,
144
- 0.452086947914353,
145
- 0.42457839353640275,
146
- 0.40357935249357296,
147
- 0.38808650204113554,
148
- 0.37606826088482276,
149
- 0.36574127015314606,
150
- 0.35614806458466036,
151
- 0.35327644029954325,
152
- 0.3523842564650944,
153
- 0.34244708313529654
154
  ],
155
  "14_mse": [
156
- 141.4759453705379,
157
- 1.067271147455488,
158
- 0.7361706374283123,
159
- 0.6078729869279647,
160
- 0.5251424780913762,
161
- 0.48095350561285377,
162
- 0.450883397258314,
163
- 0.42757396276732135,
164
- 0.4106266482880241,
165
- 0.3975107873740949,
166
- 0.3862618566455698,
167
- 0.37582341800058694,
168
- 0.3727722705755019,
169
- 0.3719414600304195,
170
- 0.36111583969646827
171
  ],
172
  "15_mse": [
173
- 141.54926251827325,
174
- 1.1383816994222484,
175
- 0.8626467079148257,
176
- 0.7225316426807776,
177
- 0.6264448152448898,
178
- 0.5735527566052917,
179
- 0.5372263065406254,
180
- 0.5087978452219999,
181
- 0.48860213362184685,
182
- 0.4722401732788946,
183
- 0.4592554961380206,
184
- 0.4467338579041617,
185
- 0.4434954676412998,
186
- 0.44283442972297954,
187
- 0.4293699260044815
188
  ],
189
  "16_mse": [
190
- 143.03045174233,
191
- 1.6987399185510506,
192
- 1.3216133843687243,
193
- 1.124703217717938,
194
- 0.9853345155715942,
195
- 0.9061568598998221,
196
- 0.8473894515431913,
197
- 0.801016428416833,
198
- 0.7677389136830667,
199
- 0.7393958519275924,
200
- 0.7179285812198668,
201
- 0.6957756074747645,
202
- 0.6894614839912357,
203
- 0.6877471782211074,
204
- 0.6663001858650294
205
  ],
206
  "17_mse": [
207
- 144.51245766116264,
208
- 2.2298882590200666,
209
- 1.7312677587781633,
210
- 1.471432576502176,
211
- 1.2941743422271614,
212
- 1.1915115261436404,
213
- 1.1127150448641383,
214
- 1.0507948026621252,
215
- 1.0064882299953835,
216
- 0.9686674623561085,
217
- 0.9405611273937655,
218
- 0.9118711222383312,
219
- 0.9043035032157611,
220
- 0.9033431106043938,
221
- 0.8743758443602943
222
  ],
223
  "18_mse": [
224
- 147.05885417120797,
225
- 3.033295912850172,
226
- 2.3449739163979553,
227
- 1.997587423575552,
228
- 1.7571663990952915,
229
- 1.6170019251959664,
230
- 1.5060613325663976,
231
- 1.4197885703323478,
232
- 1.3571205878616275,
233
- 1.3024344829688395,
234
- 1.264607798784299,
235
- 1.2239774151852256,
236
- 1.21361012521543,
237
- 1.2122161558696203,
238
- 1.1708397318546038
239
  ],
240
  "19_mse": [
241
- 149.22605560417463,
242
- 4.0121383738697025,
243
- 3.2144290181927215,
244
- 2.758385919986811,
245
- 2.441610321962744,
246
- 2.253361161490132,
247
- 2.098138313544424,
248
- 1.9760035437748844,
249
- 1.889889953728009,
250
- 1.812320611530677,
251
- 1.759585898621638,
252
- 1.702195225801683,
253
- 1.6886369868328697,
254
- 1.6874478876142573,
255
- 1.6287031451562293
256
  ],
257
  "20_mse": [
258
- 153.7509368165095,
259
- 5.441977938315026,
260
- 4.45599501294301,
261
- 3.855638541673359,
262
- 3.425549186261973,
263
- 3.171866490428609,
264
- 2.9533604338653108,
265
- 2.7798046743063103,
266
- 2.6594780100915667,
267
- 2.5478323644265197,
268
- 2.4749457405922106,
269
- 2.393614544008011,
270
- 2.3758493975589148,
271
- 2.3745743018343934,
272
- 2.2899725939098157
273
  ],
274
  "21_mse": [
275
- 160.95929784703077,
276
- 7.135156624299243,
277
- 5.914923933215607,
278
- 5.128597829574929,
279
- 4.5511189026940135,
280
- 4.21936127296964,
281
- 3.923178972158217,
282
- 3.6860433341865253,
283
- 3.5265313610994724,
284
- 3.3750149181910922,
285
- 3.2811398739205266,
286
- 3.1704284553241013,
287
- 3.1523296922669375,
288
- 3.153335191253433,
289
- 3.038006474200944
290
  ],
291
  "22_mse": [
292
- 168.19452534582382,
293
- 8.998995719995714,
294
- 7.49461117005886,
295
- 6.505148278143173,
296
- 5.7850914288284185,
297
- 5.377504140810859,
298
- 4.994920544158247,
299
- 4.691322848312836,
300
- 4.492168329712143,
301
- 4.298624393635226,
302
- 4.181720306998805,
303
- 4.041896244637052,
304
- 4.022451925994758,
305
- 4.027708962447662,
306
- 3.877970751066853
307
  ],
308
  "23_mse": [
309
- 179.14986152218697,
310
- 11.38232209628686,
311
- 9.477492454356717,
312
- 8.241463334936844,
313
- 7.336874675033684,
314
- 6.833520828333116,
315
- 6.338973109883473,
316
- 5.948143514475428,
317
- 5.69784887213456,
318
- 5.448554730953131,
319
- 5.305850695846672,
320
- 5.128336178629022,
321
- 5.109391018860322,
322
- 5.121594647715862,
323
- 4.929774293325897
324
  ],
325
  "24_mse": [
326
- 196.0926439959304,
327
- 14.460908975816311,
328
- 11.960016910294842,
329
- 10.347328537388853,
330
- 9.194787832131063,
331
- 8.55697606739245,
332
- 7.927740344427582,
333
- 7.437671284926565,
334
- 7.125370538324342,
335
- 6.811064024616901,
336
- 6.636014590586038,
337
- 6.416975243647296,
338
- 6.396038030323229,
339
- 6.418769850766749,
340
- 6.16974963998436
341
  ],
342
  "25_mse": [
343
- 226.34073509847312,
344
- 17.973981964857057,
345
- 14.85763964975687,
346
- 12.867098894334378,
347
- 11.449179885978985,
348
- 10.659138199081994,
349
- 9.875030237929264,
350
- 9.260411262512207,
351
- 8.872144111117025,
352
- 8.481059440096518,
353
- 8.26239162100885,
354
- 7.988611952702802,
355
- 7.9641538455074,
356
- 7.9938539598221166,
357
- 7.682567366980072
358
  ],
359
  "26_mse": [
360
- 246.06104442051478,
361
- 19.748153715205373,
362
- 16.151449827323283,
363
- 13.924694405462509,
364
- 12.360495115581312,
365
- 11.494442358949131,
366
- 10.625836436909841,
367
- 9.951343536376953,
368
- 9.5391424903296,
369
- 9.113765042527278,
370
- 8.880022905822983,
371
- 8.591897032314673,
372
- 8.575884145005306,
373
- 8.61652408327375,
374
- 8.273485656967736
375
  ],
376
  "27_mse": [
377
- 1127.6618378144458,
378
- 36.50081869713346,
379
- 28.558814658258193,
380
- 23.532193018977804,
381
- 20.006101106342516,
382
- 18.115819938200758,
383
- 16.519411933153197,
384
- 15.17410841920322,
385
- 14.629280721334586,
386
- 13.796134138465824,
387
- 13.448932102748326,
388
- 12.974122886370896,
389
- 12.934470635607727,
390
- 13.025266174086951,
391
- 12.280487067717358
392
  ],
393
  "logit_kl": [
394
- 67.2636034399047,
395
- 25.865796340139287,
396
- 22.657304505656537,
397
- 19.131782417010545,
398
- 16.57767048455719,
399
- 15.434691192512226,
400
- 13.678588221843977,
401
- 12.350722470677885,
402
- 11.67401699553755,
403
- 10.970734416990352,
404
- 10.62411352028524,
405
- 10.199558932082097,
406
- 10.305670784828358,
407
- 10.493465681721393,
408
- 9.555433201610594
409
  ],
410
  "kl_contribution": [
411
- 0.6726360188839131,
412
- 0.2586579576022643,
413
- 0.22657303937843867,
414
- 0.19131781989918614,
415
- 0.16577670191015517,
416
- 0.1543469084496785,
417
- 0.13678587866680963,
418
- 0.12350722200664363,
419
- 0.1167401673090189,
420
- 0.10970734188655265,
421
- 0.10624113258786667,
422
- 0.10199558734893799,
423
- 0.10305670559182203,
424
- 0.10493465417757966,
425
- 0.09555432973499585
426
  ]
427
  }
 
1
  {
2
  "loss": [
3
+ 132.40072370830336,
4
+ 15.898285371916634,
5
+ 4.808860845135567,
6
+ 4.2647794995989114,
7
+ 3.7614752946043373,
8
+ 3.5804317333644495,
9
+ 3.621848736938677,
10
+ 3.311293805452218,
11
+ 3.3564420907120955,
12
+ 3.2430825179680847,
13
+ 3.1446165334909484,
14
+ 3.166066134334507,
15
+ 3.145363519962569,
16
+ 3.1751417849296915,
17
+ 3.1040466840105845
18
  ],
19
  "recon_loss": [
20
+ 91.53491892021401,
21
+ 1.127020146837808,
22
+ 0.5399636414490248,
23
+ 0.4608159236665955,
24
+ 0.3498118930965438,
25
+ 0.3483069581644876,
26
+ 0.38624757724372966,
27
+ 0.3225517376585114,
28
+ 0.3369383092661549,
29
+ 0.30339636519215163,
30
+ 0.29119090242941575,
31
+ 0.31196532981064085,
32
+ 0.307742903387188,
33
+ 0.32156725171813394,
34
+ 0.30149288374678535
35
  ],
36
  "l1_loss": [
37
+ 0.8785219717966882,
38
+ 0.3300659595603557,
39
+ 0.08405589065829613,
40
+ 0.07463387472737104,
41
+ 0.0716574577810733,
42
+ 0.06664694049500657,
43
+ 0.06470343093142698,
44
+ 0.06195041967934012,
45
+ 0.061602180788671614,
46
+ 0.0611304106064757,
47
+ 0.0603844676152768,
48
+ 0.05863903490896512,
49
+ 0.05944218401818123,
50
+ 0.05809492428079808,
51
+ 0.05800197750357981
52
  ],
53
  "sparsity": [
54
+ 1057.4835558439556,
55
+ 407.9275162202075,
56
+ 162.19449604005743,
57
+ 119.2390982262174,
58
+ 95.5933568854081,
59
+ 82.25088138150093,
60
+ 70.82447925366853,
61
+ 62.93163240762581,
62
+ 56.17579608573053,
63
+ 50.73961696051117,
64
+ 46.83539435020963,
65
+ 43.90063462938581,
66
+ 40.67231744034846,
67
+ 39.208685760211225,
68
+ 37.08526147397837
69
  ],
70
  "recon_contribution": [
71
+ 91.53491892021401,
72
+ 1.127020146837808,
73
+ 0.5399636414490248,
74
+ 0.4608159236665955,
75
+ 0.3498118930965438,
76
+ 0.3483069581644876,
77
+ 0.38624757724372966,
78
+ 0.3225517376585114,
79
+ 0.3369383092661549,
80
+ 0.30339636519215163,
81
+ 0.29119090242941575,
82
+ 0.31196532981064085,
83
+ 0.307742903387188,
84
+ 0.32156725171813394,
85
+ 0.30149288374678535
86
  ],
87
  "l1_contribution": [
88
+ 35.14087875982872,
89
+ 13.202638413673057,
90
+ 3.3622356299170875,
91
+ 2.9853549962653254,
92
+ 2.8662983100665245,
93
+ 2.6658776234415242,
94
+ 2.5881372282379553,
95
+ 2.478016788350012,
96
+ 2.4640872312667677,
97
+ 2.445216426723882,
98
+ 2.4153787063476733,
99
+ 2.345561395238217,
100
+ 2.3776873603351136,
101
+ 2.3237969747611453,
102
+ 2.3200791032242596
103
  ],
104
  "total_post_layer_mse": [
105
+ 3768.518025380776,
106
+ 634.3760369014472,
107
+ 281.5267423777876,
108
+ 257.9137649592152,
109
+ 121.86403825979932,
110
+ 132.82595429743142,
111
+ 182.3500442832036,
112
+ 120.80600859516098,
113
+ 148.72142278666334,
114
+ 119.53372874082928,
115
+ 96.44286261605365,
116
+ 132.2072357783528,
117
+ 119.37015544875224,
118
+ 140.67416488754571,
119
+ 125.15249402512957
120
  ],
121
  "block_mse_contribution": [
122
+ 3.768518193868248,
123
+ 0.6343760687253469,
124
+ 0.28152675526179427,
125
+ 0.257913777174597,
126
+ 0.12186404388013675,
127
+ 0.13282596073111194,
128
+ 0.18235005254360945,
129
+ 0.12080601431375555,
130
+ 0.14872143043109295,
131
+ 0.1195337344229062,
132
+ 0.09644286709981384,
133
+ 0.1322072420359626,
134
+ 0.11937016143081264,
135
+ 0.1406741713079483,
136
+ 0.12515250030259253
137
  ],
138
  "13_mse": [
139
+ 92.58617470228583,
140
+ 1.424407343443175,
141
+ 0.6843610000341458,
142
+ 0.5639535150581733,
143
+ 0.42544728976891455,
144
+ 0.4171061430658613,
145
+ 0.45088799185770795,
146
+ 0.3778063368080254,
147
+ 0.3880942987096041,
148
+ 0.3534062831921685,
149
+ 0.3343137366543139,
150
+ 0.35508942990598824,
151
+ 0.347726347863226,
152
+ 0.36387658421706437,
153
+ 0.34385311766002413
154
  ],
155
  "14_mse": [
156
+ 92.43770923874432,
157
+ 1.4219669226865124,
158
+ 0.7184918425361017,
159
+ 0.603204586003956,
160
+ 0.4554870707872219,
161
+ 0.4487679816950533,
162
+ 0.48403634332624595,
163
+ 0.40736286913541925,
164
+ 0.41743570364507515,
165
+ 0.38230037711616743,
166
+ 0.3595608007863052,
167
+ 0.3827579479692574,
168
+ 0.3731682823788851,
169
+ 0.3925049804655233,
170
+ 0.3724479387353237
171
  ],
172
  "15_mse": [
173
+ 92.73112112597416,
174
+ 1.5456405208074957,
175
+ 0.8291421245811577,
176
+ 0.696399899577736,
177
+ 0.530499174966848,
178
+ 0.5212662321956534,
179
+ 0.5569074418311729,
180
+ 0.47336215733137343,
181
+ 0.48270386916802344,
182
+ 0.44751030139457015,
183
+ 0.41891130648161234,
184
+ 0.44354036226308435,
185
+ 0.43207019791567236,
186
+ 0.4540229000543293,
187
+ 0.4348179030239134
188
  ],
189
  "16_mse": [
190
+ 93.72751782800918,
191
+ 2.088347224812759,
192
+ 1.2250121937210399,
193
+ 1.0437956295515363,
194
+ 0.8037037549162269,
195
+ 0.7893119821871134,
196
+ 0.831803834527955,
197
+ 0.714540472828356,
198
+ 0.716447467754658,
199
+ 0.6794583469181132,
200
+ 0.628354791299741,
201
+ 0.6565977841391599,
202
+ 0.6375507835606883,
203
+ 0.6720199679073534,
204
+ 0.6464301565087828
205
  ],
206
  "17_mse": [
207
+ 94.47222283818668,
208
+ 2.4767478825454425,
209
+ 1.5378725349454951,
210
+ 1.3074736180610227,
211
+ 1.0276811555364078,
212
+ 1.009038458193155,
213
+ 1.052105562579363,
214
+ 0.9169551736878273,
215
+ 0.9124030157139427,
216
+ 0.8749958547882568,
217
+ 0.8088635177092445,
218
+ 0.8403520140432774,
219
+ 0.8132623561791011,
220
+ 0.8571708014136866,
221
+ 0.8309605762474519
222
  ],
223
  "18_mse": [
224
+ 96.62282840739516,
225
+ 3.313168379597198,
226
+ 2.1050605021025004,
227
+ 1.7885640088776897,
228
+ 1.4142655618208693,
229
+ 1.3870145925005575,
230
+ 1.4408194030586041,
231
+ 1.2563351908124478,
232
+ 1.2509042515342397,
233
+ 1.2091203721842372,
234
+ 1.1067663614911245,
235
+ 1.1532457063072605,
236
+ 1.1120133261035259,
237
+ 1.1673076464269394,
238
+ 1.144940797995804
239
  ],
240
  "19_mse": [
241
+ 98.12952686610974,
242
+ 4.21422166842267,
243
+ 2.7761693278649697,
244
+ 2.3772155705251192,
245
+ 1.9103159030577295,
246
+ 1.8712453797347564,
247
+ 1.930497253747811,
248
+ 1.7012208476102442,
249
+ 1.6912268557046588,
250
+ 1.6499157534506088,
251
+ 1.5067807480804902,
252
+ 1.5715877149338113,
253
+ 1.50961379762879,
254
+ 1.5925079682715853,
255
+ 1.569648396924026
256
  ],
257
  "20_mse": [
258
+ 100.86349562774028,
259
+ 5.2358217391752655,
260
+ 3.5889427751526797,
261
+ 3.084748203144934,
262
+ 2.5231203943266904,
263
+ 2.466466988836016,
264
+ 2.515812956300893,
265
+ 2.2489302400359534,
266
+ 2.2176499926954283,
267
+ 2.1649505195761085,
268
+ 1.996861229713698,
269
+ 2.0641328773104157,
270
+ 1.9832459145918824,
271
+ 2.0868534244092785,
272
+ 2.056514573276491
273
  ],
274
  "21_mse": [
275
+ 106.23677720521626,
276
+ 7.429197506797045,
277
+ 4.934605420083928,
278
+ 4.241325343461861,
279
+ 3.4353638143467724,
280
+ 3.3451044389179776,
281
+ 3.3986762430434836,
282
+ 3.03673449674047,
283
+ 3.0061623476501693,
284
+ 2.8840246505307077,
285
+ 2.644449479597852,
286
+ 2.7081336916837477,
287
+ 2.554877420117084,
288
+ 2.698225707936108,
289
+ 2.655916364121258
290
  ],
291
  "22_mse": [
292
+ 111.03444346807953,
293
+ 8.813722875781526,
294
+ 5.975814478737967,
295
+ 5.13371875859741,
296
+ 4.210649632869806,
297
+ 4.100004742916365,
298
+ 4.144820572738361,
299
+ 3.7331808097380446,
300
+ 3.6716954000014113,
301
+ 3.5411856093801055,
302
+ 3.2662032493075035,
303
+ 3.32891203138165,
304
+ 3.150659145269179,
305
+ 3.3271091728282154,
306
+ 3.274116275005771
307
  ],
308
  "23_mse": [
309
+ 118.86912513317021,
310
+ 11.185627614645133,
311
+ 7.6775109463168265,
312
+ 6.536852415342977,
313
+ 5.326670237053606,
314
+ 5.195521380668296,
315
+ 5.26501534845596,
316
+ 4.727612521415367,
317
+ 4.681196536336627,
318
+ 4.525898637628197,
319
+ 4.15481556268563,
320
+ 4.256077368456618,
321
+ 4.0400548922388175,
322
+ 4.312153929158261,
323
+ 4.251093875196643
324
  ],
325
  "24_mse": [
326
+ 130.50960404173773,
327
+ 14.531528067768068,
328
+ 9.785240420721527,
329
+ 8.324993122789197,
330
+ 6.708341277631602,
331
+ 6.538236614456751,
332
+ 6.6201859363039635,
333
+ 5.944424200775032,
334
+ 5.905932158455813,
335
+ 5.711922184865277,
336
+ 5.222949343516414,
337
+ 5.336188742092678,
338
+ 5.064628631548774,
339
+ 5.40855013876033,
340
+ 5.332810629579358
341
  ],
342
  "25_mse": [
343
+ 149.70575552775446,
344
+ 18.781842669149988,
345
+ 12.454813014295764,
346
+ 10.676898454364977,
347
+ 8.50971511790627,
348
+ 8.30757270719772,
349
+ 8.442735458675184,
350
+ 7.540686890594941,
351
+ 7.51053103647734,
352
+ 7.272217981797412,
353
+ 6.6091292926243375,
354
+ 6.806205828387038,
355
+ 6.429451408242821,
356
+ 6.961337288519494,
357
+ 6.801972677833156
358
  ],
359
  "26_mse": [
360
+ 162.7475875983561,
361
+ 21.965660794336994,
362
+ 14.38764136536677,
363
+ 12.350393969313542,
364
+ 9.63491886361201,
365
+ 9.44224236782332,
366
+ 9.776316755696348,
367
+ 8.552372195666894,
368
+ 8.593469288116111,
369
+ 8.364798094096937,
370
+ 7.4954372115601275,
371
+ 7.8521559579031805,
372
+ 7.360022383524959,
373
+ 8.127834703689231,
374
+ 7.897967291953869
375
  ],
376
  "27_mse": [
377
+ 2227.8441357720167,
378
+ 529.9481356914779,
379
+ 212.84606443132674,
380
+ 199.18422786454508,
381
+ 74.94785901119835,
382
+ 86.98705428704284,
383
+ 135.43942318106056,
384
+ 79.17448419198058,
385
+ 107.27557056470025,
386
+ 79.47202377391041,
387
+ 59.889465984545254,
388
+ 94.45225832157566,
389
+ 83.56181056158883,
390
+ 102.2526896734883,
391
+ 87.5390034510677
392
  ],
393
  "logit_kl": [
394
+ 195.64052740971846,
395
+ 93.42507447694477,
396
+ 62.51348275349552,
397
+ 56.06948348454067,
398
+ 42.35010630026796,
399
+ 43.34211874008179,
400
+ 46.51138848828194,
401
+ 38.99192340750443,
402
+ 40.66951527989897,
403
+ 37.49360173806212,
404
+ 34.16040521277521,
405
+ 37.63321834937074,
406
+ 34.05630800777808,
407
+ 38.910339645873336,
408
+ 35.732220771617456
409
  ],
410
  "kl_contribution": [
411
+ 1.9564052279058255,
412
+ 0.9342507238226726,
413
+ 0.6251348145586207,
414
+ 0.5606948222993011,
415
+ 0.42350105397907417,
416
+ 0.433421177971632,
417
+ 0.4651138730403176,
418
+ 0.3899192253505825,
419
+ 0.40669514345271246,
420
+ 0.37493600797160226,
421
+ 0.34160404475895984,
422
+ 0.3763321751266494,
423
+ 0.34056307274596137,
424
+ 0.3891033879236171,
425
+ 0.3573221996762699
426
  ]
427
  }
qwen3_06B.blocks.12.hook_resid_post.sae.sparsity40.mse0.001.kl0.01.physics10.exp8/weights.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15db608906d09e1c583f067243fb19552c86d998b4dc207f5d42cf3f0d4efccb
3
  size 67148125
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:687d03590ec005360ddc659688f1136b454240d73d02ca5312ee3e101e5d93ec
3
  size 67148125