viveksil's picture
Add files using upload-large-folder tool
ba242ea verified
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00268859,0.01000,2.297
0,self_attn.v_proj,0.00012146,0.01000,1.532
0,self_attn.q_proj,0.00339818,0.01000,1.401
0,self_attn.o_proj,0.00007466,0.01000,3.458
0,mlp.up_proj,0.00165959,0.01000,3.002
0,mlp.gate_proj,0.00176081,0.01000,2.685
0,mlp.down_proj,0.00171541,0.01000,19.171
1,self_attn.k_proj,0.00514033,0.01000,3.422
1,self_attn.v_proj,0.00119326,0.01000,3.608
1,self_attn.q_proj,0.00603395,0.01000,1.613
1,self_attn.o_proj,0.00048323,0.01000,3.834
1,mlp.up_proj,0.00365061,0.01000,1.590
1,mlp.gate_proj,0.00421130,0.01000,6.380
1,mlp.down_proj,0.02673751,0.01000,7.127
2,self_attn.k_proj,0.00933676,0.01000,1.540
2,self_attn.v_proj,0.00363998,0.01000,2.579
2,self_attn.q_proj,0.01070433,0.01000,3.024
2,self_attn.o_proj,0.00095308,0.01000,1.640
2,mlp.up_proj,0.00610160,0.01000,10.450
2,mlp.gate_proj,0.00684849,0.01000,3.323
2,mlp.down_proj,0.00416326,0.01000,11.194
3,self_attn.k_proj,0.01245183,0.01000,3.158
3,self_attn.v_proj,0.00521770,0.01000,3.034
3,self_attn.q_proj,0.01259811,0.01000,3.280
3,self_attn.o_proj,0.00154380,0.01000,8.060
3,mlp.up_proj,0.00826654,0.01000,1.420
3,mlp.gate_proj,0.00868698,0.01000,1.575
3,mlp.down_proj,0.00818474,0.01000,12.702
4,self_attn.k_proj,0.01399883,0.01000,2.538
4,self_attn.v_proj,0.00609351,0.01000,9.978
4,self_attn.q_proj,0.01455349,0.01000,4.893
4,self_attn.o_proj,0.00308353,0.01000,1.867
4,mlp.up_proj,0.01101172,0.01000,1.507
4,mlp.gate_proj,0.01136096,0.01000,3.298
4,mlp.down_proj,0.01204515,0.01000,11.278
5,self_attn.k_proj,0.01381846,0.01000,5.158
5,self_attn.v_proj,0.00638836,0.01000,1.610
5,self_attn.q_proj,0.01450016,0.01000,1.798
5,self_attn.o_proj,0.00360254,0.01000,1.624
5,mlp.up_proj,0.01348488,0.01000,4.580
5,mlp.gate_proj,0.01340446,0.01000,1.761
5,mlp.down_proj,0.01536761,0.01000,22.166
6,self_attn.k_proj,0.01536616,0.01000,1.813
6,self_attn.v_proj,0.00765775,0.01000,1.057
6,self_attn.q_proj,0.01647044,0.01000,1.589
6,self_attn.o_proj,0.00484225,0.01000,1.817
6,mlp.up_proj,0.01586073,0.01000,2.670
6,mlp.gate_proj,0.01545403,0.01000,2.092
6,mlp.down_proj,0.01897714,0.01000,16.333
7,self_attn.k_proj,0.01551268,0.01000,2.392
7,self_attn.v_proj,0.00767670,0.01000,0.989
7,self_attn.q_proj,0.01955890,0.01000,2.897
7,self_attn.o_proj,0.00776187,0.01000,3.109
7,mlp.up_proj,0.02011534,0.01000,5.595
7,mlp.gate_proj,0.01881913,0.01000,8.879
7,mlp.down_proj,0.13795254,0.01000,5.252
8,self_attn.k_proj,0.01517920,0.01000,2.907
8,self_attn.v_proj,0.01077128,0.01000,3.195
8,self_attn.q_proj,0.01539815,0.01000,0.929
8,self_attn.o_proj,0.01244297,0.01000,8.706
8,mlp.up_proj,0.02336273,0.01000,1.006
8,mlp.gate_proj,0.02230725,0.01000,0.914
8,mlp.down_proj,0.03689886,0.01000,7.602
9,self_attn.k_proj,0.01419967,0.01000,3.176
9,self_attn.v_proj,0.00935659,0.01000,0.916
9,self_attn.q_proj,0.01437793,0.01000,7.752
9,self_attn.o_proj,0.01545753,0.01000,1.956
9,mlp.up_proj,0.02452471,0.01000,1.045
9,mlp.gate_proj,0.02163836,0.01000,0.934
9,mlp.down_proj,0.04093376,0.01000,8.590
10,self_attn.k_proj,0.01597095,0.01000,7.668
10,self_attn.v_proj,0.01030280,0.01000,0.955
10,self_attn.q_proj,0.01661386,0.01000,0.953
10,self_attn.o_proj,0.02046761,0.01000,0.961
10,mlp.up_proj,0.02449678,0.01000,1.783
10,mlp.gate_proj,0.02200876,0.01000,3.467
10,mlp.down_proj,0.04767245,0.01000,12.654
11,self_attn.k_proj,0.01583570,0.01000,0.988
11,self_attn.v_proj,0.01004474,0.01000,1.007
11,self_attn.q_proj,0.01681633,0.01000,0.953
11,self_attn.o_proj,0.02400013,0.01000,0.944
11,mlp.up_proj,0.02487121,0.01000,2.184
11,mlp.gate_proj,0.02244228,0.01000,0.996
11,mlp.down_proj,0.05173288,0.01000,18.105
12,self_attn.k_proj,0.01769731,0.01000,0.839
12,self_attn.v_proj,0.01472340,0.01000,0.551
12,self_attn.q_proj,0.01947594,0.01000,0.509
12,self_attn.o_proj,0.03308697,0.01000,0.642
12,mlp.up_proj,0.02705463,0.01000,0.573
12,mlp.gate_proj,0.02433215,0.01000,0.640
12,mlp.down_proj,0.06660484,0.01000,2.787
13,self_attn.k_proj,0.01724737,0.01000,0.509
13,self_attn.v_proj,0.01275570,0.01000,0.494
13,self_attn.q_proj,0.01846544,0.01000,0.557
13,self_attn.o_proj,0.02876754,0.01000,0.545
13,mlp.up_proj,0.02806181,0.01000,0.560
13,mlp.gate_proj,0.02527489,0.01000,0.524
13,mlp.down_proj,0.07755652,0.01000,2.416
14,self_attn.k_proj,0.01810676,0.01000,0.578
14,self_attn.v_proj,0.01431919,0.01000,0.505
14,self_attn.q_proj,0.01790303,0.01000,0.502
14,self_attn.o_proj,0.03729445,0.01000,0.527
14,mlp.up_proj,0.03043460,0.01000,0.550
14,mlp.gate_proj,0.02668553,0.01000,0.534
14,mlp.down_proj,0.10596363,0.01000,2.331
15,self_attn.k_proj,0.01930179,0.01000,0.515
15,self_attn.v_proj,0.02241649,0.01000,0.496
15,self_attn.q_proj,0.02011626,0.01000,0.497
15,self_attn.o_proj,0.05061907,0.01000,0.566
15,mlp.up_proj,0.03395730,0.01000,0.569
15,mlp.gate_proj,0.02911986,0.01000,0.593
15,mlp.down_proj,0.14194915,0.01000,2.274
16,self_attn.k_proj,0.02059570,0.01000,0.511
16,self_attn.v_proj,0.02086210,0.01000,0.496
16,self_attn.q_proj,0.02103812,0.01000,0.489
16,self_attn.o_proj,0.05604012,0.01000,0.514
16,mlp.up_proj,0.04187595,0.01000,0.539
16,mlp.gate_proj,0.03528344,0.01000,0.510
16,mlp.down_proj,0.21391028,0.01000,2.362
17,self_attn.k_proj,0.01972736,0.01000,0.528
17,self_attn.v_proj,0.02926025,0.01000,0.498
17,self_attn.q_proj,0.02005677,0.01000,0.498
17,self_attn.o_proj,0.09542210,0.01000,0.517
17,mlp.up_proj,0.04948561,0.01000,0.617
17,mlp.gate_proj,0.04208370,0.01000,0.527
17,mlp.down_proj,0.30404621,0.01000,2.336
18,self_attn.k_proj,0.01914989,0.01000,0.672
18,self_attn.v_proj,0.03310600,0.01000,0.540
18,self_attn.q_proj,0.02003000,0.01000,0.524
18,self_attn.o_proj,0.10906528,0.01000,0.543
18,mlp.up_proj,0.06152352,0.01000,0.530
18,mlp.gate_proj,0.05048580,0.01000,0.507
18,mlp.down_proj,0.47315487,0.01000,2.273
19,self_attn.k_proj,0.01988266,0.01000,0.521
19,self_attn.v_proj,0.04468218,0.01000,0.504
19,self_attn.q_proj,0.02098379,0.01000,0.499
19,self_attn.o_proj,0.11830558,0.01000,0.524
19,mlp.up_proj,0.07140406,0.01000,0.569
19,mlp.gate_proj,0.05682839,0.01000,0.516
19,mlp.down_proj,0.64388824,0.01000,2.303
20,self_attn.k_proj,0.01980521,0.01000,0.517
20,self_attn.v_proj,0.05296587,0.01000,0.492
20,self_attn.q_proj,0.02124322,0.01000,0.521
20,self_attn.o_proj,0.11964528,0.01000,0.517
20,mlp.up_proj,0.07959354,0.01000,0.533
20,mlp.gate_proj,0.06235816,0.01000,0.511
20,mlp.down_proj,0.80122459,0.01000,2.308
21,self_attn.k_proj,0.02273879,0.01000,0.526
21,self_attn.v_proj,0.06846954,0.01000,0.494
21,self_attn.q_proj,0.02335146,0.01000,0.498
21,self_attn.o_proj,0.21736440,0.01000,0.515
21,mlp.up_proj,0.09114946,0.01000,0.533
21,mlp.gate_proj,0.07021903,0.01000,0.509
21,mlp.down_proj,1.01436162,0.01000,2.285
22,self_attn.k_proj,0.02368175,0.01000,0.515
22,self_attn.v_proj,0.07183458,0.01000,0.500
22,self_attn.q_proj,0.02609063,0.01000,0.585
22,self_attn.o_proj,0.34090981,0.01000,0.516
22,mlp.up_proj,0.10087807,0.01000,0.555
22,mlp.gate_proj,0.07864191,0.01000,0.506
22,mlp.down_proj,1.41661644,0.01000,2.276
23,self_attn.k_proj,0.02159666,0.01000,0.523
23,self_attn.v_proj,0.08762348,0.01000,0.498
23,self_attn.q_proj,0.02072346,0.01000,0.494
23,self_attn.o_proj,0.76461768,0.01000,0.515
23,mlp.up_proj,0.09932031,0.01000,0.525
23,mlp.gate_proj,0.08260745,0.01000,0.506
23,mlp.down_proj,2.73030257,0.01000,2.283