Abdohaaland's picture
Upload folder using huggingface_hub
316b026 verified
layer,module,loss,damp,time
0,self_attn.v_proj,0.0000000281,0.05000,4.670
0,self_attn.k_proj,0.0000000335,0.05000,4.718
0,self_attn.q_proj,0.0000001225,0.05000,4.760
0,self_attn.o_proj,0.0000000638,0.05000,1.479
0,mlp.gate_proj,0.0000083850,0.05000,1.913
0,mlp.up_proj,0.0000072816,0.05000,1.916
0,mlp.down_proj,0.0000004270,0.05000,3.658
1,self_attn.v_proj,0.0000000562,0.05000,4.730
1,self_attn.q_proj,0.0000002102,0.05000,4.830
1,self_attn.k_proj,0.0000000580,0.05000,4.839
1,self_attn.o_proj,0.0000000563,0.05000,1.447
1,mlp.gate_proj,0.0002669175,0.05000,2.458
1,mlp.up_proj,0.0001192833,0.05000,2.516
1,mlp.down_proj,0.0000007279,0.05000,3.921
2,self_attn.v_proj,0.0000001416,0.05000,4.924
2,self_attn.q_proj,0.0000005442,0.05000,4.999
2,self_attn.k_proj,0.0000001599,0.05000,5.030
2,self_attn.o_proj,0.0000000774,0.05000,1.461
2,mlp.gate_proj,0.0004706195,0.05000,2.073
2,mlp.up_proj,0.0003679584,0.05000,2.095
2,mlp.down_proj,0.0000005296,0.05000,3.701
3,self_attn.v_proj,0.0000002583,0.05000,4.187
3,self_attn.k_proj,0.0000002787,0.05000,4.232
3,self_attn.q_proj,0.0000010549,0.05000,4.253
3,self_attn.o_proj,0.0000001789,0.05000,1.442
3,mlp.up_proj,0.0001859692,0.05000,1.984
3,mlp.gate_proj,0.0003880208,0.05000,2.003
3,mlp.down_proj,0.0000008290,0.05000,3.716
4,self_attn.v_proj,0.0000004453,0.05000,4.170
4,self_attn.q_proj,0.0000017503,0.05000,4.240
4,self_attn.k_proj,0.0000004929,0.05000,4.270
4,self_attn.o_proj,0.0000001841,0.05000,1.432
4,mlp.gate_proj,0.0003188560,0.05000,1.952
4,mlp.up_proj,0.0001058938,0.05000,1.977
4,mlp.down_proj,0.0000009877,0.05000,3.709
5,self_attn.v_proj,0.0000004747,0.05000,4.207
5,self_attn.k_proj,0.0000004808,0.05000,4.254
5,self_attn.q_proj,0.0000018170,0.05000,4.288
5,self_attn.o_proj,0.0000003358,0.05000,1.449
5,mlp.gate_proj,0.0001046843,0.05000,2.039
5,mlp.up_proj,0.0000414282,0.05000,2.070
5,mlp.down_proj,0.0000013782,0.05000,3.819
6,self_attn.v_proj,0.0000010176,0.05000,4.233
6,self_attn.q_proj,0.0000040303,0.05000,4.253
6,self_attn.k_proj,0.0000009895,0.05000,4.313
6,self_attn.o_proj,0.0000006622,0.05000,1.448
6,mlp.up_proj,0.0000503757,0.05000,2.014
6,mlp.gate_proj,0.0001110306,0.05000,2.035
6,mlp.down_proj,0.0000206670,0.05000,3.659
7,self_attn.k_proj,0.0000024329,0.05000,4.064
7,self_attn.q_proj,0.0000085931,0.05000,4.123
7,self_attn.v_proj,0.0000019982,0.05000,4.144
7,self_attn.o_proj,0.0000009256,0.05000,1.444
7,mlp.gate_proj,0.0001217811,0.05000,2.071
7,mlp.up_proj,0.0000577930,0.05000,2.092
7,mlp.down_proj,0.0000025102,0.05000,3.710
8,self_attn.v_proj,0.0000027738,0.05000,4.201
8,self_attn.q_proj,0.0000114360,0.05000,4.238
8,self_attn.k_proj,0.0000030762,0.05000,4.259
8,self_attn.o_proj,0.0000009674,0.05000,1.412
8,mlp.gate_proj,0.0000708923,0.05000,2.010
8,mlp.up_proj,0.0000563776,0.05000,2.033
8,mlp.down_proj,0.0000032682,0.05000,3.754
9,self_attn.v_proj,0.0000035083,0.05000,4.188
9,self_attn.k_proj,0.0000047883,0.05000,4.223
9,self_attn.q_proj,0.0000157103,0.05000,4.262
9,self_attn.o_proj,0.0000014919,0.05000,1.426
9,mlp.up_proj,0.0000711674,0.05000,2.011
9,mlp.gate_proj,0.0001187128,0.05000,2.031
9,mlp.down_proj,0.0000035517,0.05000,3.705
10,self_attn.k_proj,0.0000056646,0.05000,4.156
10,self_attn.q_proj,0.0000214887,0.05000,4.234
10,self_attn.v_proj,0.0000053920,0.05000,4.256
10,self_attn.o_proj,0.0000015159,0.05000,1.484
10,mlp.gate_proj,0.0000876355,0.05000,2.018
10,mlp.up_proj,0.0000582840,0.05000,2.034
10,mlp.down_proj,0.0000028648,0.05000,3.671
11,self_attn.k_proj,0.0000029401,0.05000,4.225
11,self_attn.v_proj,0.0000024203,0.05000,4.303
11,self_attn.q_proj,0.0000103068,0.05000,4.329
11,self_attn.o_proj,0.0000008888,0.05000,1.416
11,mlp.gate_proj,0.0000741166,0.05000,1.917
11,mlp.up_proj,0.0000566025,0.05000,1.941
11,mlp.down_proj,0.0000030860,0.05000,3.775
12,self_attn.k_proj,0.0000038472,0.05000,4.211
12,self_attn.q_proj,0.0000137759,0.05000,4.249
12,self_attn.v_proj,0.0000034272,0.05000,4.280
12,self_attn.o_proj,0.0000018546,0.05000,1.426
12,mlp.up_proj,0.0000580738,0.05000,2.071
12,mlp.gate_proj,0.0000685725,0.05000,2.094
12,mlp.down_proj,0.0000032841,0.05000,3.679
13,self_attn.v_proj,0.0000025200,0.05000,4.194
13,self_attn.q_proj,0.0000111981,0.05000,4.230
13,self_attn.k_proj,0.0000030891,0.05000,4.257
13,self_attn.o_proj,0.0000013833,0.05000,1.412
13,mlp.gate_proj,0.0000692568,0.05000,1.954
13,mlp.up_proj,0.0000647811,0.05000,1.973
13,mlp.down_proj,0.0000043834,0.05000,3.687
14,self_attn.q_proj,0.0000175752,0.05000,4.123
14,self_attn.k_proj,0.0000045994,0.05000,4.169
14,self_attn.v_proj,0.0000043383,0.05000,4.177
14,self_attn.o_proj,0.0000019435,0.05000,1.440
14,mlp.up_proj,0.0000720079,0.05000,1.933
14,mlp.gate_proj,0.0000766432,0.05000,1.958
14,mlp.down_proj,0.0000047673,0.05000,3.682
15,self_attn.k_proj,0.0000054351,0.05000,4.116
15,self_attn.v_proj,0.0000046581,0.05000,4.200
15,self_attn.q_proj,0.0000211606,0.05000,4.223
15,self_attn.o_proj,0.0000018997,0.05000,1.429
15,mlp.gate_proj,0.0000754266,0.05000,1.990
15,mlp.up_proj,0.0000740122,0.05000,2.015
15,mlp.down_proj,0.0000053597,0.05000,3.737
16,self_attn.q_proj,0.0000386672,0.05000,4.067
16,self_attn.k_proj,0.0000093139,0.05000,4.130
16,self_attn.v_proj,0.0000103499,0.05000,4.155
16,self_attn.o_proj,0.0000026699,0.05000,1.403
16,mlp.up_proj,0.0000855751,0.05000,2.041
16,mlp.gate_proj,0.0000930978,0.05000,2.061
16,mlp.down_proj,0.0000275581,0.05000,3.699
17,self_attn.q_proj,0.0000392438,0.05000,4.191
17,self_attn.k_proj,0.0000084165,0.05000,4.234
17,self_attn.v_proj,0.0000087300,0.05000,4.253
17,self_attn.o_proj,0.0000026301,0.05000,1.434
17,mlp.gate_proj,0.0000779856,0.05000,2.005
17,mlp.up_proj,0.0000724824,0.05000,2.024
17,mlp.down_proj,0.0000052021,0.05000,3.706
18,self_attn.q_proj,0.0000359746,0.05000,4.202
18,self_attn.v_proj,0.0000089155,0.05000,4.239
18,self_attn.k_proj,0.0000086172,0.05000,4.263
18,self_attn.o_proj,0.0000026857,0.05000,1.403
18,mlp.gate_proj,0.0000826436,0.05000,1.962
18,mlp.up_proj,0.0000786649,0.05000,1.977
18,mlp.down_proj,0.0000061125,0.05000,3.797
19,self_attn.k_proj,0.0000154321,0.05000,4.153
19,self_attn.v_proj,0.0000145288,0.05000,4.226
19,self_attn.q_proj,0.0000669893,0.05000,4.257
19,self_attn.o_proj,0.0000072475,0.05000,1.420
19,mlp.up_proj,0.0000763673,0.05000,1.958
19,mlp.gate_proj,0.0000795653,0.05000,1.983
19,mlp.down_proj,0.0000063999,0.05000,3.722
20,self_attn.k_proj,0.0000139938,0.05000,4.166
20,self_attn.v_proj,0.0000126008,0.05000,4.255
20,self_attn.q_proj,0.0000648620,0.05000,4.270
20,self_attn.o_proj,0.0000058633,0.05000,1.471
20,mlp.gate_proj,0.0000927177,0.05000,1.983
20,mlp.up_proj,0.0000909301,0.05000,2.005
20,mlp.down_proj,0.0000085226,0.05000,3.687
21,self_attn.v_proj,0.0000157023,0.05000,4.200
21,self_attn.q_proj,0.0000732686,0.05000,4.246
21,self_attn.k_proj,0.0000162576,0.05000,4.279
21,self_attn.o_proj,0.0000064938,0.05000,1.451
21,mlp.up_proj,0.0000938207,0.05000,2.061
21,mlp.gate_proj,0.0000953118,0.05000,2.069
21,mlp.down_proj,0.0000094180,0.05000,3.670
22,self_attn.v_proj,0.0000290647,0.05000,4.262
22,self_attn.q_proj,0.0001376551,0.05000,4.291
22,self_attn.k_proj,0.0000316722,0.05000,4.321
22,self_attn.o_proj,0.0000139498,0.05000,1.408
22,mlp.up_proj,0.0001028317,0.05000,1.960
22,mlp.gate_proj,0.0001130452,0.05000,1.982
22,mlp.down_proj,0.0000150741,0.05000,3.654
23,self_attn.q_proj,0.0001271593,0.05000,4.130
23,self_attn.k_proj,0.0000288629,0.05000,4.167
23,self_attn.v_proj,0.0000286624,0.05000,4.196
23,self_attn.o_proj,0.0000121074,0.05000,1.435
23,mlp.up_proj,0.0001123853,0.05000,1.978
23,mlp.gate_proj,0.0001318009,0.05000,2.002
23,mlp.down_proj,0.0000158443,0.05000,3.680
24,self_attn.k_proj,0.0000445231,0.05000,4.180
24,self_attn.v_proj,0.0000517156,0.05000,4.218
24,self_attn.q_proj,0.0001876024,0.05000,4.237
24,self_attn.o_proj,0.0000197756,0.05000,1.443
24,mlp.gate_proj,0.0001390896,0.05000,2.028
24,mlp.up_proj,0.0001163446,0.05000,2.052
24,mlp.down_proj,0.0000183784,0.05000,3.721
25,self_attn.k_proj,0.0000309183,0.05000,4.098
25,self_attn.v_proj,0.0000312976,0.05000,4.159
25,self_attn.q_proj,0.0001220958,0.05000,4.188
25,self_attn.o_proj,0.0000078953,0.05000,1.390
25,mlp.gate_proj,0.0001551162,0.05000,1.971
25,mlp.up_proj,0.0001274080,0.05000,1.993
25,mlp.down_proj,0.0000235486,0.05000,3.673
26,self_attn.v_proj,0.0000490624,0.05000,4.113
26,self_attn.k_proj,0.0000464167,0.05000,4.161
26,self_attn.q_proj,0.0001926069,0.05000,4.185
26,self_attn.o_proj,0.0000066098,0.05000,1.387
26,mlp.gate_proj,0.0001770693,0.05000,1.976
26,mlp.up_proj,0.0001508838,0.05000,1.975
26,mlp.down_proj,0.0000279487,0.05000,3.647
27,self_attn.k_proj,0.0000556290,0.05000,4.077
27,self_attn.q_proj,0.0002357567,0.05000,4.141
27,self_attn.v_proj,0.0000654981,0.05000,4.174
27,self_attn.o_proj,0.0000107555,0.05000,1.416
27,mlp.gate_proj,0.0001936240,0.05000,1.989
27,mlp.up_proj,0.0001708205,0.05000,2.008
27,mlp.down_proj,0.0000438858,0.05000,3.659
28,self_attn.k_proj,0.0000705007,0.05000,4.196
28,self_attn.v_proj,0.0000715719,0.05000,4.249
28,self_attn.q_proj,0.0002718625,0.05000,4.266
28,self_attn.o_proj,0.0000191249,0.05000,1.394
28,mlp.gate_proj,0.0002182023,0.05000,2.015
28,mlp.up_proj,0.0002019346,0.05000,2.031
28,mlp.down_proj,0.0000732407,0.05000,3.797
29,self_attn.k_proj,0.0001816301,0.05000,4.092
29,self_attn.q_proj,0.0007383766,0.05000,4.169
29,self_attn.v_proj,0.0002443326,0.05000,4.195
29,self_attn.o_proj,0.0000448207,0.05000,1.481
29,mlp.up_proj,0.0002562076,0.05000,1.942
29,mlp.gate_proj,0.0002613911,0.05000,1.958
29,mlp.down_proj,0.0000526463,0.05000,3.700
30,self_attn.v_proj,0.0002320336,0.05000,4.041
30,self_attn.k_proj,0.0001986943,0.05000,4.134
30,self_attn.q_proj,0.0007668271,0.05000,4.142
30,self_attn.o_proj,0.0000478573,0.05000,1.459
30,mlp.gate_proj,0.0002683302,0.05000,1.898
30,mlp.up_proj,0.0002727380,0.05000,1.920
30,mlp.down_proj,0.0000663494,0.05000,3.662
31,self_attn.q_proj,0.0010675234,0.05000,4.039
31,self_attn.k_proj,0.0003015756,0.05000,4.116
31,self_attn.v_proj,0.0003918752,0.05000,4.162
31,self_attn.o_proj,0.0000612622,0.05000,1.394
31,mlp.up_proj,0.0002870251,0.05000,2.027
31,mlp.gate_proj,0.0002682364,0.05000,2.032
31,mlp.down_proj,0.0000840589,0.05000,3.717
32,self_attn.q_proj,0.0016584295,0.05000,4.132
32,self_attn.v_proj,0.0006243234,0.05000,4.233
32,self_attn.k_proj,0.0004182623,0.05000,4.253
32,self_attn.o_proj,0.0001057172,0.05000,1.428
32,mlp.up_proj,0.0003151746,0.05000,1.983
32,mlp.gate_proj,0.0002878729,0.05000,2.006
32,mlp.down_proj,0.0001186975,0.05000,3.678
33,self_attn.v_proj,0.0016297800,0.05000,4.071
33,self_attn.k_proj,0.0008791048,0.05000,4.100
33,self_attn.q_proj,0.0041213692,0.05000,4.145
33,self_attn.o_proj,0.0001997127,0.05000,1.434
33,mlp.gate_proj,0.0003185476,0.05000,1.865
33,mlp.up_proj,0.0003529478,0.05000,1.881
33,mlp.down_proj,0.0001623388,0.05000,3.669
34,self_attn.q_proj,0.0027944569,0.05000,4.110
34,self_attn.k_proj,0.0006274358,0.05000,4.194
34,self_attn.v_proj,0.0009633384,0.05000,4.209
34,self_attn.o_proj,0.0002593519,0.05000,1.436
34,mlp.up_proj,0.0004195679,0.05000,1.947
34,mlp.gate_proj,0.0004068270,0.05000,1.970
34,mlp.down_proj,0.0003025797,0.05000,3.683
35,self_attn.v_proj,0.0003734207,0.05000,4.091
35,self_attn.k_proj,0.0003153036,0.05000,4.159
35,self_attn.q_proj,0.0011829730,0.05000,4.173
35,self_attn.o_proj,0.0001886140,0.05000,1.407
35,mlp.gate_proj,0.0009205786,0.05000,1.941
35,mlp.up_proj,0.0009714007,0.05000,1.939
35,mlp.down_proj,0.0008959190,0.05000,3.653