Abdohaaland's picture
Upload folder using huggingface_hub
f235135 verified
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.0000074843,0.05000,5.272
0,self_attn.q_proj,0.0000147214,0.05000,5.281
0,self_attn.v_proj,0.0000004168,0.05000,5.330
0,self_attn.o_proj,0.0000000187,0.05000,0.970
0,mlp.gate_proj,0.0000084507,0.05000,2.314
0,mlp.up_proj,0.0000073953,0.05000,2.321
0,mlp.down_proj,0.0000001043,0.05000,2.760
1,self_attn.q_proj,0.0000176587,0.05000,5.488
1,self_attn.v_proj,0.0000011781,0.05000,5.531
1,self_attn.k_proj,0.0000103479,0.05000,5.556
1,self_attn.o_proj,0.0000000659,0.05000,1.008
1,mlp.up_proj,0.0000101163,0.05000,2.793
1,mlp.gate_proj,0.0000115220,0.05000,2.857
1,mlp.down_proj,0.0000023786,0.05000,2.978
2,self_attn.v_proj,0.0000045326,0.05000,5.520
2,self_attn.k_proj,0.0000444663,0.05000,5.568
2,self_attn.q_proj,0.0000746845,0.05000,5.603
2,self_attn.o_proj,0.0000000708,0.05000,0.977
2,mlp.up_proj,0.0000157823,0.05000,2.370
2,mlp.gate_proj,0.0000186525,0.05000,2.381
2,mlp.down_proj,0.0000003235,0.05000,2.880
3,self_attn.q_proj,0.0000490428,0.05000,4.770
3,self_attn.v_proj,0.0000046019,0.05000,4.821
3,self_attn.k_proj,0.0000271964,0.05000,4.853
3,self_attn.o_proj,0.0000001303,0.05000,0.991
3,mlp.gate_proj,0.0000271254,0.05000,2.287
3,mlp.up_proj,0.0000203218,0.05000,2.309
3,mlp.down_proj,0.0000004725,0.05000,2.923
4,self_attn.v_proj,0.0000049324,0.05000,4.775
4,self_attn.q_proj,0.0000503491,0.05000,4.856
4,self_attn.k_proj,0.0000263398,0.05000,4.882
4,self_attn.o_proj,0.0000001964,0.05000,1.008
4,mlp.gate_proj,0.0000360828,0.05000,2.330
4,mlp.up_proj,0.0000242689,0.05000,2.349
4,mlp.down_proj,0.0000006482,0.05000,2.859
5,self_attn.q_proj,0.0000723580,0.05000,4.878
5,self_attn.k_proj,0.0000435308,0.05000,4.908
5,self_attn.v_proj,0.0000050953,0.05000,4.928
5,self_attn.o_proj,0.0000002506,0.05000,0.988
5,mlp.up_proj,0.0000276863,0.05000,2.221
5,mlp.gate_proj,0.0000389511,0.05000,2.249
5,mlp.down_proj,0.0000008920,0.05000,2.865
6,self_attn.v_proj,0.0000047490,0.05000,4.730
6,self_attn.k_proj,0.0000314569,0.05000,4.806
6,self_attn.q_proj,0.0000593003,0.05000,4.831
6,self_attn.o_proj,0.0000003914,0.05000,0.994
6,mlp.gate_proj,0.0000416038,0.05000,2.261
6,mlp.up_proj,0.0000296857,0.05000,2.274
6,mlp.down_proj,0.0000010432,0.05000,2.867
7,self_attn.v_proj,0.0000041414,0.05000,4.777
7,self_attn.k_proj,0.0000294888,0.05000,4.819
7,self_attn.q_proj,0.0000499796,0.05000,4.840
7,self_attn.o_proj,0.0000005414,0.05000,0.996
7,mlp.gate_proj,0.0000407815,0.05000,2.382
7,mlp.up_proj,0.0000316740,0.05000,2.395
7,mlp.down_proj,0.0000011954,0.05000,2.921
8,self_attn.k_proj,0.0000382184,0.05000,4.773
8,self_attn.q_proj,0.0000634405,0.05000,4.840
8,self_attn.v_proj,0.0000051689,0.05000,4.857
8,self_attn.o_proj,0.0000007112,0.05000,0.994
8,mlp.gate_proj,0.0000432118,0.05000,2.214
8,mlp.up_proj,0.0000328935,0.05000,2.231
8,mlp.down_proj,0.0000012622,0.05000,2.910
9,self_attn.v_proj,0.0000062167,0.05000,4.765
9,self_attn.k_proj,0.0000348470,0.05000,4.821
9,self_attn.q_proj,0.0000589752,0.05000,4.857
9,self_attn.o_proj,0.0000007339,0.05000,0.995
9,mlp.gate_proj,0.0000421141,0.05000,2.229
9,mlp.up_proj,0.0000330395,0.05000,2.241
9,mlp.down_proj,0.0000012594,0.05000,2.852
10,self_attn.k_proj,0.0000369369,0.05000,4.772
10,self_attn.v_proj,0.0000048285,0.05000,4.813
10,self_attn.q_proj,0.0000594491,0.05000,4.850
10,self_attn.o_proj,0.0000007190,0.05000,0.987
10,mlp.up_proj,0.0000361118,0.05000,2.281
10,mlp.gate_proj,0.0000430197,0.05000,2.303
10,mlp.down_proj,0.0000014489,0.05000,2.891
11,self_attn.v_proj,0.0000057577,0.05000,4.785
11,self_attn.k_proj,0.0000277935,0.05000,4.850
11,self_attn.q_proj,0.0000493928,0.05000,4.877
11,self_attn.o_proj,0.0000009189,0.05000,1.004
11,mlp.gate_proj,0.0000448819,0.05000,2.218
11,mlp.up_proj,0.0000388907,0.05000,2.235
11,mlp.down_proj,0.0000016271,0.05000,2.859
12,self_attn.q_proj,0.0000703840,0.05000,4.766
12,self_attn.k_proj,0.0000419931,0.05000,4.806
12,self_attn.v_proj,0.0000062611,0.05000,4.833
12,self_attn.o_proj,0.0000010599,0.05000,1.008
12,mlp.up_proj,0.0000416281,0.05000,2.392
12,mlp.gate_proj,0.0000476432,0.05000,2.410
12,mlp.down_proj,0.0000018099,0.05000,2.883
13,self_attn.v_proj,0.0000073646,0.05000,4.787
13,self_attn.k_proj,0.0000480065,0.05000,4.836
13,self_attn.q_proj,0.0000746108,0.05000,4.859
13,self_attn.o_proj,0.0000012881,0.05000,1.002
13,mlp.gate_proj,0.0000567143,0.05000,2.312
13,mlp.up_proj,0.0000464424,0.05000,2.333
13,mlp.down_proj,0.0000024285,0.05000,2.855
14,self_attn.v_proj,0.0000085554,0.05000,4.747
14,self_attn.k_proj,0.0000377909,0.05000,4.815
14,self_attn.q_proj,0.0000818829,0.05000,4.839
14,self_attn.o_proj,0.0000014739,0.05000,0.988
14,mlp.gate_proj,0.0000618665,0.05000,2.244
14,mlp.up_proj,0.0000501615,0.05000,2.275
14,mlp.down_proj,0.0000028961,0.05000,2.943
15,self_attn.k_proj,0.0000434869,0.05000,4.765
15,self_attn.q_proj,0.0000836033,0.05000,4.814
15,self_attn.v_proj,0.0000085927,0.05000,4.843
15,self_attn.o_proj,0.0000009176,0.05000,0.978
15,mlp.up_proj,0.0000501215,0.05000,2.199
15,mlp.gate_proj,0.0000664111,0.05000,2.224
15,mlp.down_proj,0.0000029919,0.05000,2.856
16,self_attn.v_proj,0.0000096999,0.05000,4.660
16,self_attn.k_proj,0.0000491510,0.05000,4.808
16,self_attn.q_proj,0.0000873152,0.05000,4.831
16,self_attn.o_proj,0.0000006891,0.05000,0.990
16,mlp.gate_proj,0.0000677998,0.05000,2.255
16,mlp.up_proj,0.0000498530,0.05000,2.270
16,mlp.down_proj,0.0000028770,0.05000,2.887
17,self_attn.k_proj,0.0000451024,0.05000,4.814
17,self_attn.q_proj,0.0000833279,0.05000,4.854
17,self_attn.v_proj,0.0000093786,0.05000,4.881
17,self_attn.o_proj,0.0000006592,0.05000,0.993
17,mlp.gate_proj,0.0000711968,0.05000,2.303
17,mlp.up_proj,0.0000515198,0.05000,2.313
17,mlp.down_proj,0.0000031699,0.05000,2.877
18,self_attn.v_proj,0.0000117244,0.05000,4.799
18,self_attn.q_proj,0.0000941548,0.05000,4.843
18,self_attn.k_proj,0.0000521436,0.05000,4.855
18,self_attn.o_proj,0.0000007543,0.05000,1.060
18,mlp.gate_proj,0.0000748079,0.05000,2.265
18,mlp.up_proj,0.0000554492,0.05000,2.288
18,mlp.down_proj,0.0000033983,0.05000,2.867
19,self_attn.k_proj,0.0000492243,0.05000,4.762
19,self_attn.v_proj,0.0000116459,0.05000,4.852
19,self_attn.q_proj,0.0000846121,0.05000,4.881
19,self_attn.o_proj,0.0000010064,0.05000,0.996
19,mlp.gate_proj,0.0000798135,0.05000,2.413
19,mlp.up_proj,0.0000598702,0.05000,2.435
19,mlp.down_proj,0.0000041946,0.05000,2.896
20,self_attn.v_proj,0.0000138354,0.05000,4.743
20,self_attn.k_proj,0.0000525729,0.05000,4.779
20,self_attn.q_proj,0.0000871055,0.05000,4.804
20,self_attn.o_proj,0.0000007463,0.05000,1.062
20,mlp.gate_proj,0.0000772857,0.05000,2.329
20,mlp.up_proj,0.0000608534,0.05000,2.344
20,mlp.down_proj,0.0000040513,0.05000,2.916
21,self_attn.k_proj,0.0000516450,0.05000,4.799
21,self_attn.q_proj,0.0000864292,0.05000,4.834
21,self_attn.v_proj,0.0000178772,0.05000,4.858
21,self_attn.o_proj,0.0000009117,0.05000,1.007
21,mlp.up_proj,0.0000644529,0.05000,2.339
21,mlp.gate_proj,0.0000826544,0.05000,2.358
21,mlp.down_proj,0.0000043396,0.05000,2.849
22,self_attn.k_proj,0.0000493620,0.05000,4.685
22,self_attn.q_proj,0.0000846314,0.05000,4.768
22,self_attn.v_proj,0.0000178073,0.05000,4.804
22,self_attn.o_proj,0.0000007427,0.05000,0.985
22,mlp.up_proj,0.0000691359,0.05000,2.223
22,mlp.gate_proj,0.0000892200,0.05000,2.242
22,mlp.down_proj,0.0000049096,0.05000,2.858
23,self_attn.k_proj,0.0000528449,0.05000,4.804
23,self_attn.q_proj,0.0000848596,0.05000,4.884
23,self_attn.v_proj,0.0000174951,0.05000,4.895
23,self_attn.o_proj,0.0000011734,0.05000,0.995
23,mlp.up_proj,0.0000761134,0.05000,2.367
23,mlp.gate_proj,0.0001037115,0.05000,2.376
23,mlp.down_proj,0.0000060200,0.05000,2.890
24,self_attn.v_proj,0.0000255699,0.05000,4.749
24,self_attn.k_proj,0.0000586351,0.05000,4.825
24,self_attn.q_proj,0.0000929255,0.05000,4.852
24,self_attn.o_proj,0.0000017205,0.05000,1.011
24,mlp.gate_proj,0.0001158564,0.05000,2.337
24,mlp.up_proj,0.0000833232,0.05000,2.350
24,mlp.down_proj,0.0000070803,0.05000,2.862
25,self_attn.v_proj,0.0000219677,0.05000,4.786
25,self_attn.k_proj,0.0000455065,0.05000,4.819
25,self_attn.q_proj,0.0000875274,0.05000,4.842
25,self_attn.o_proj,0.0000018091,0.05000,0.995
25,mlp.gate_proj,0.0001257230,0.05000,2.238
25,mlp.up_proj,0.0000896462,0.05000,2.241
25,mlp.down_proj,0.0000089616,0.05000,2.927
26,self_attn.v_proj,0.0000301434,0.05000,4.714
26,self_attn.q_proj,0.0000821644,0.05000,4.799
26,self_attn.k_proj,0.0000533734,0.05000,4.827
26,self_attn.o_proj,0.0000028081,0.05000,1.033
26,mlp.gate_proj,0.0001326795,0.05000,2.426
26,mlp.up_proj,0.0000931492,0.05000,2.448
26,mlp.down_proj,0.0000130549,0.05000,2.898
27,self_attn.q_proj,0.0000648963,0.05000,4.827
27,self_attn.v_proj,0.0000198264,0.05000,4.863
27,self_attn.k_proj,0.0000367513,0.05000,4.890
27,self_attn.o_proj,0.0000078769,0.05000,1.015
27,mlp.gate_proj,0.0001287943,0.05000,2.227
27,mlp.up_proj,0.0001021746,0.05000,2.234
27,mlp.down_proj,0.0000386645,0.05000,2.917