Abdohaaland's picture
Upload folder using huggingface_hub
631e001 verified
layer,module,loss,damp,time
0,self_attn.v_proj,0.0000002875,0.05000,6.079
0,self_attn.q_proj,0.0000129580,0.05000,6.072
0,self_attn.k_proj,0.0000065541,0.05000,6.166
0,self_attn.o_proj,0.0000000108,0.05000,1.322
0,mlp.up_proj,0.0000042795,0.05000,2.767
0,mlp.gate_proj,0.0000049425,0.05000,2.827
0,mlp.down_proj,0.0000000314,0.05000,3.129
1,self_attn.v_proj,0.0000006689,0.05000,5.451
1,self_attn.q_proj,0.0000126307,0.05000,5.730
1,self_attn.k_proj,0.0000075396,0.05000,5.728
1,self_attn.o_proj,0.0000000542,0.05000,1.178
1,mlp.up_proj,0.0000047425,0.05000,3.081
1,mlp.gate_proj,0.0000054370,0.05000,3.112
1,mlp.down_proj,0.0000014180,0.05000,3.606
2,self_attn.q_proj,0.0000451748,0.05000,5.432
2,self_attn.v_proj,0.0000023224,0.05000,5.532
2,self_attn.k_proj,0.0000278147,0.05000,5.595
2,self_attn.o_proj,0.0000000395,0.05000,1.582
2,mlp.gate_proj,0.0000069938,0.05000,3.056
2,mlp.up_proj,0.0000058359,0.05000,3.076
2,mlp.down_proj,0.0000000593,0.05000,3.429
3,self_attn.k_proj,0.0000122990,0.05000,5.539
3,self_attn.q_proj,0.0000217445,0.05000,5.617
3,self_attn.v_proj,0.0000017581,0.05000,5.651
3,self_attn.o_proj,0.0000000203,0.05000,1.148
3,mlp.up_proj,0.0000073834,0.05000,2.965
3,mlp.gate_proj,0.0000100123,0.05000,3.005
3,mlp.down_proj,0.0000000824,0.05000,3.236
4,self_attn.v_proj,0.0000018723,0.05000,5.579
4,self_attn.q_proj,0.0000233329,0.05000,5.656
4,self_attn.k_proj,0.0000122032,0.05000,5.675
4,self_attn.o_proj,0.0000000633,0.05000,1.160
4,mlp.gate_proj,0.0000134069,0.05000,2.868
4,mlp.up_proj,0.0000087210,0.05000,2.888
4,mlp.down_proj,0.0000001386,0.05000,3.249
5,self_attn.q_proj,0.0000320827,0.05000,5.716
5,self_attn.v_proj,0.0000018635,0.05000,5.766
5,self_attn.k_proj,0.0000201049,0.05000,5.805
5,self_attn.o_proj,0.0000000861,0.05000,1.145
5,mlp.up_proj,0.0000098045,0.05000,2.898
5,mlp.gate_proj,0.0000141574,0.05000,2.948
5,mlp.down_proj,0.0000001802,0.05000,3.211
6,self_attn.v_proj,0.0000016420,0.05000,5.570
6,self_attn.k_proj,0.0000132601,0.05000,5.575
6,self_attn.q_proj,0.0000247839,0.05000,5.591
6,self_attn.o_proj,0.0000001096,0.05000,1.109
6,mlp.up_proj,0.0000105212,0.05000,2.988
6,mlp.gate_proj,0.0000152134,0.05000,3.020
6,mlp.down_proj,0.0000002012,0.05000,3.370
7,self_attn.k_proj,0.0000120739,0.05000,5.535
7,self_attn.v_proj,0.0000014840,0.05000,5.605
7,self_attn.q_proj,0.0000204857,0.05000,5.640
7,self_attn.o_proj,0.0000002358,0.05000,1.129
7,mlp.gate_proj,0.0000128394,0.05000,3.091
7,mlp.up_proj,0.0000096388,0.05000,3.129
7,mlp.down_proj,0.0000002028,0.05000,3.140
8,self_attn.v_proj,0.0000015355,0.05000,5.690
8,self_attn.k_proj,0.0000140590,0.05000,5.747
8,self_attn.q_proj,0.0000230355,0.05000,5.764
8,self_attn.o_proj,0.0000001701,0.05000,1.138
8,mlp.up_proj,0.0000097746,0.05000,2.718
8,mlp.gate_proj,0.0000133103,0.05000,2.764
8,mlp.down_proj,0.0000001912,0.05000,3.235
9,self_attn.k_proj,0.0000125890,0.05000,5.656
9,self_attn.v_proj,0.0000019354,0.05000,5.697
9,self_attn.q_proj,0.0000210542,0.05000,5.709
9,self_attn.o_proj,0.0000001880,0.05000,1.125
9,mlp.gate_proj,0.0000120921,0.05000,2.345
9,mlp.up_proj,0.0000091294,0.05000,2.378
9,mlp.down_proj,0.0000001759,0.05000,3.018
10,self_attn.k_proj,0.0000123705,0.05000,5.145
10,self_attn.q_proj,0.0000194175,0.05000,5.205
10,self_attn.v_proj,0.0000013578,0.05000,5.219
10,self_attn.o_proj,0.0000001988,0.05000,1.069
10,mlp.up_proj,0.0000093869,0.05000,2.431
10,mlp.gate_proj,0.0000116347,0.05000,2.435
10,mlp.down_proj,0.0000001812,0.05000,3.010
11,self_attn.k_proj,0.0000083764,0.05000,5.029
11,self_attn.v_proj,0.0000015281,0.05000,5.087
11,self_attn.q_proj,0.0000145726,0.05000,5.109
11,self_attn.o_proj,0.0000002144,0.05000,1.055
11,mlp.gate_proj,0.0000117093,0.05000,2.358
11,mlp.up_proj,0.0000097968,0.05000,2.368
11,mlp.down_proj,0.0000001988,0.05000,3.045
12,self_attn.k_proj,0.0000136289,0.05000,5.094
12,self_attn.v_proj,0.0000016965,0.05000,5.144
12,self_attn.q_proj,0.0000224206,0.05000,5.161
12,self_attn.o_proj,0.0000002437,0.05000,1.047
12,mlp.gate_proj,0.0000121265,0.05000,2.366
12,mlp.up_proj,0.0000100321,0.05000,2.385
12,mlp.down_proj,0.0000002146,0.05000,3.073
13,self_attn.v_proj,0.0000018654,0.05000,5.003
13,self_attn.q_proj,0.0000215060,0.05000,5.062
13,self_attn.k_proj,0.0000140466,0.05000,5.070
13,self_attn.o_proj,0.0000002475,0.05000,1.040
13,mlp.gate_proj,0.0000145311,0.05000,2.448
13,mlp.up_proj,0.0000111055,0.05000,2.464
13,mlp.down_proj,0.0000002871,0.05000,2.965
14,self_attn.q_proj,0.0000244416,0.05000,4.975
14,self_attn.k_proj,0.0000109761,0.05000,5.087
14,self_attn.v_proj,0.0000021334,0.05000,5.103
14,self_attn.o_proj,0.0000004272,0.05000,1.061
14,mlp.gate_proj,0.0000144053,0.05000,2.369
14,mlp.up_proj,0.0000109751,0.05000,2.391
14,mlp.down_proj,0.0000002757,0.05000,3.033
15,self_attn.v_proj,0.0000019140,0.05000,5.057
15,self_attn.k_proj,0.0000115560,0.05000,5.108
15,self_attn.q_proj,0.0000219541,0.05000,5.133
15,self_attn.o_proj,0.0000003740,0.05000,1.044
15,mlp.gate_proj,0.0000141731,0.05000,2.447
15,mlp.up_proj,0.0000101552,0.05000,2.471
15,mlp.down_proj,0.0000002539,0.05000,3.024
16,self_attn.q_proj,0.0000201770,0.05000,4.931
16,self_attn.v_proj,0.0000019840,0.05000,5.031
16,self_attn.k_proj,0.0000116480,0.05000,5.075
16,self_attn.o_proj,0.0000002044,0.05000,1.058
16,mlp.gate_proj,0.0000144537,0.05000,2.390
16,mlp.up_proj,0.0000101879,0.05000,2.410
16,mlp.down_proj,0.0000002548,0.05000,3.036
17,self_attn.v_proj,0.0000019457,0.05000,5.025
17,self_attn.k_proj,0.0000103892,0.05000,5.091
17,self_attn.q_proj,0.0000190087,0.05000,5.127
17,self_attn.o_proj,0.0000001803,0.05000,1.055
17,mlp.up_proj,0.0000105910,0.05000,2.332
17,mlp.gate_proj,0.0000151940,0.05000,2.350
17,mlp.down_proj,0.0000002681,0.05000,3.039
18,self_attn.k_proj,0.0000125478,0.05000,5.233
18,self_attn.q_proj,0.0000225686,0.05000,5.229
18,self_attn.v_proj,0.0000024447,0.05000,5.291
18,self_attn.o_proj,0.0000000928,0.05000,1.089
18,mlp.up_proj,0.0000113110,0.05000,2.333
18,mlp.gate_proj,0.0000158267,0.05000,2.352
18,mlp.down_proj,0.0000002841,0.05000,3.043
19,self_attn.v_proj,0.0000024250,0.05000,5.080
19,self_attn.q_proj,0.0000203657,0.05000,5.166
19,self_attn.k_proj,0.0000117773,0.05000,5.181
19,self_attn.o_proj,0.0000001395,0.05000,1.059
19,mlp.up_proj,0.0000118265,0.05000,2.313
19,mlp.gate_proj,0.0000163829,0.05000,2.330
19,mlp.down_proj,0.0000003390,0.05000,3.025
20,self_attn.k_proj,0.0000131098,0.05000,5.081
20,self_attn.q_proj,0.0000216605,0.05000,5.130
20,self_attn.v_proj,0.0000028895,0.05000,5.157
20,self_attn.o_proj,0.0000000723,0.05000,1.023
20,mlp.up_proj,0.0000114745,0.05000,2.554
20,mlp.gate_proj,0.0000150741,0.05000,2.556
20,mlp.down_proj,0.0000002896,0.05000,3.027
21,self_attn.v_proj,0.0000038318,0.05000,5.045
21,self_attn.k_proj,0.0000127311,0.05000,5.085
21,self_attn.q_proj,0.0000215379,0.05000,5.122
21,self_attn.o_proj,0.0000000909,0.05000,1.051
21,mlp.up_proj,0.0000113903,0.05000,2.481
21,mlp.gate_proj,0.0000150505,0.05000,2.496
21,mlp.down_proj,0.0000002896,0.05000,3.067
22,self_attn.v_proj,0.0000036099,0.05000,5.172
22,self_attn.k_proj,0.0000112382,0.05000,5.192
22,self_attn.q_proj,0.0000197390,0.05000,5.234
22,self_attn.o_proj,0.0000000599,0.05000,1.053
22,mlp.gate_proj,0.0000153890,0.05000,2.339
22,mlp.up_proj,0.0000115268,0.05000,2.361
22,mlp.down_proj,0.0000003044,0.05000,3.107
23,self_attn.k_proj,0.0000127207,0.05000,5.052
23,self_attn.v_proj,0.0000033499,0.05000,5.106
23,self_attn.q_proj,0.0000205526,0.05000,5.127
23,self_attn.o_proj,0.0000000568,0.05000,1.063
23,mlp.up_proj,0.0000131494,0.05000,2.542
23,mlp.gate_proj,0.0000187574,0.05000,2.560
23,mlp.down_proj,0.0000004297,0.05000,3.052
24,self_attn.v_proj,0.0000050478,0.05000,5.095
24,self_attn.k_proj,0.0000132556,0.05000,5.190
24,self_attn.q_proj,0.0000210217,0.05000,5.220
24,self_attn.o_proj,0.0000002743,0.05000,1.064
24,mlp.gate_proj,0.0000177907,0.05000,2.397
24,mlp.up_proj,0.0000121369,0.05000,2.419
24,mlp.down_proj,0.0000003998,0.05000,3.048
25,self_attn.v_proj,0.0000035746,0.05000,5.082
25,self_attn.k_proj,0.0000085866,0.05000,5.154
25,self_attn.q_proj,0.0000167753,0.05000,5.200
25,self_attn.o_proj,0.0000006733,0.05000,1.076
25,mlp.up_proj,0.0000131685,0.05000,2.416
25,mlp.gate_proj,0.0000198001,0.05000,2.429
25,mlp.down_proj,0.0000007029,0.05000,3.048
26,self_attn.v_proj,0.0000052315,0.05000,5.138
26,self_attn.q_proj,0.0000171792,0.05000,5.155
26,self_attn.k_proj,0.0000105835,0.05000,5.196
26,self_attn.o_proj,0.0000003890,0.05000,1.061
26,mlp.up_proj,0.0000142373,0.05000,2.443
26,mlp.gate_proj,0.0000217037,0.05000,2.462
26,mlp.down_proj,0.0000014717,0.05000,3.041
27,self_attn.k_proj,0.0000074436,0.05000,5.060
27,self_attn.q_proj,0.0000136104,0.05000,5.123
27,self_attn.v_proj,0.0000038322,0.05000,5.142
27,self_attn.o_proj,0.0000033302,0.05000,1.107
27,mlp.up_proj,0.0000177582,0.05000,2.535
27,mlp.gate_proj,0.0000236296,0.05000,2.561
27,mlp.down_proj,0.0000210622,0.05000,3.164