frankdarkluo's picture
Upload folder using huggingface_hub
1695c1e verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.0000000044,0.05000,2.464
0,self_attn.v_proj,0.0000000008,0.05000,2.488
0,self_attn.q_proj,0.0000000191,0.05000,2.543
0,self_attn.o_proj,0.0000000203,0.05000,0.861
0,mlp.up_proj,0.0000000307,0.05000,2.166
0,mlp.gate_proj,0.0000000795,0.05000,2.175
0,mlp.down_proj,0.0000000207,0.05000,5.497
1,self_attn.v_proj,0.0000000008,0.05000,3.146
1,self_attn.k_proj,0.0000000022,0.05000,3.175
1,self_attn.q_proj,0.0000000085,0.05000,3.193
1,self_attn.o_proj,0.0000000040,0.05000,0.825
1,mlp.up_proj,0.0000008692,0.05000,1.366
1,mlp.gate_proj,0.0000012902,0.05000,1.372
1,mlp.down_proj,0.0000000284,0.05000,5.618
2,self_attn.k_proj,0.0000000123,0.05000,3.202
2,self_attn.v_proj,0.0000000028,0.05000,3.210
2,self_attn.q_proj,0.0000000484,0.05000,3.295
2,self_attn.o_proj,0.0000000079,0.05000,0.838
2,mlp.up_proj,0.0000008670,0.05000,2.285
2,mlp.gate_proj,0.0000012831,0.05000,2.291
2,mlp.down_proj,0.0000000571,0.05000,5.648
3,self_attn.q_proj,0.0000000671,0.05000,3.347
3,self_attn.v_proj,0.0000000060,0.05000,3.451
3,self_attn.k_proj,0.0000000151,0.05000,3.490
3,self_attn.o_proj,0.0000000252,0.05000,0.890
3,mlp.up_proj,0.0000020149,0.05000,2.103
3,mlp.gate_proj,0.0000023558,0.05000,2.110
3,mlp.down_proj,0.0000006257,0.05000,5.511
4,self_attn.k_proj,0.0000000315,0.05000,2.993
4,self_attn.v_proj,0.0000000167,0.05000,3.009
4,self_attn.q_proj,0.0000001521,0.05000,3.086
4,self_attn.o_proj,0.0000000164,0.05000,0.890
4,mlp.gate_proj,0.0000023605,0.05000,2.241
4,mlp.up_proj,0.0000018879,0.05000,2.255
4,mlp.down_proj,0.0000002817,0.05000,5.677
5,self_attn.k_proj,0.0000000341,0.05000,3.653
5,self_attn.v_proj,0.0000000171,0.05000,3.675
5,self_attn.q_proj,0.0000001700,0.05000,3.707
5,self_attn.o_proj,0.0000000157,0.05000,0.918
5,mlp.up_proj,0.0000030345,0.05000,2.204
5,mlp.gate_proj,0.0000033247,0.05000,2.219
5,mlp.down_proj,0.0000000732,0.05000,5.558
6,self_attn.k_proj,0.0000000210,0.05000,2.998
6,self_attn.v_proj,0.0000000125,0.05000,3.003
6,self_attn.q_proj,0.0000001101,0.05000,3.088
6,self_attn.o_proj,0.0000000269,0.05000,0.896
6,mlp.up_proj,0.0000007844,0.05000,2.153
6,mlp.gate_proj,0.0000010371,0.05000,2.159
6,mlp.down_proj,0.0000001627,0.05000,5.748
7,self_attn.k_proj,0.0000000239,0.05000,3.633
7,self_attn.v_proj,0.0000000261,0.05000,3.659
7,self_attn.q_proj,0.0000001492,0.05000,3.664
7,self_attn.o_proj,0.0000000598,0.05000,0.844
7,mlp.up_proj,0.0000007770,0.05000,2.100
7,mlp.gate_proj,0.0000008227,0.05000,2.109
7,mlp.down_proj,0.0000002494,0.05000,5.609
8,self_attn.k_proj,0.0000000450,0.05000,3.464
8,self_attn.q_proj,0.0000002250,0.05000,3.475
8,self_attn.v_proj,0.0000000253,0.05000,3.480
8,self_attn.o_proj,0.0000000541,0.05000,0.843
8,mlp.up_proj,0.0000009107,0.05000,2.163
8,mlp.gate_proj,0.0000009393,0.05000,2.169
8,mlp.down_proj,0.0000002649,0.05000,5.567
9,self_attn.q_proj,0.0000002020,0.05000,2.928
9,self_attn.v_proj,0.0000000356,0.05000,2.950
9,self_attn.k_proj,0.0000000332,0.05000,3.041
9,self_attn.o_proj,0.0000000851,0.05000,0.852
9,mlp.up_proj,0.0000018742,0.05000,2.121
9,mlp.gate_proj,0.0000025099,0.05000,2.130
9,mlp.down_proj,0.0000003172,0.05000,5.574
10,self_attn.q_proj,0.0000001846,0.05000,2.718
10,self_attn.k_proj,0.0000000335,0.05000,2.737
10,self_attn.v_proj,0.0000000234,0.05000,2.836
10,self_attn.o_proj,0.0000000614,0.05000,0.838
10,mlp.gate_proj,0.0000010436,0.05000,2.127
10,mlp.up_proj,0.0000009895,0.05000,2.136
10,mlp.down_proj,0.0000002303,0.05000,5.724
11,self_attn.k_proj,0.0000000413,0.05000,3.974
11,self_attn.q_proj,0.0000002067,0.05000,3.992
11,self_attn.v_proj,0.0000000216,0.05000,4.085
11,self_attn.o_proj,0.0000000655,0.05000,0.886
11,mlp.up_proj,0.0000009311,0.05000,2.553
11,mlp.gate_proj,0.0000009437,0.05000,2.563
11,mlp.down_proj,0.0000002879,0.05000,5.553
12,self_attn.v_proj,0.0000000269,0.05000,4.333
12,self_attn.q_proj,0.0000002253,0.05000,4.347
12,self_attn.k_proj,0.0000000432,0.05000,4.384
12,self_attn.o_proj,0.0000000747,0.05000,0.874
12,mlp.gate_proj,0.0000009145,0.05000,2.833
12,mlp.up_proj,0.0000009364,0.05000,2.844
12,mlp.down_proj,0.0000002613,0.05000,5.630
13,self_attn.v_proj,0.0000000339,0.05000,2.604
13,self_attn.k_proj,0.0000000372,0.05000,2.632
13,self_attn.q_proj,0.0000002266,0.05000,2.640
13,self_attn.o_proj,0.0000001181,0.05000,0.857
13,mlp.up_proj,0.0000009420,0.05000,1.799
13,mlp.gate_proj,0.0000009377,0.05000,1.798
13,mlp.down_proj,0.0000002500,0.05000,5.592
14,self_attn.k_proj,0.0000000547,0.05000,3.282
14,self_attn.v_proj,0.0000000395,0.05000,3.297
14,self_attn.q_proj,0.0000003236,0.05000,3.427
14,self_attn.o_proj,0.0000000939,0.05000,0.851
14,mlp.gate_proj,0.0000010082,0.05000,1.820
14,mlp.up_proj,0.0000010460,0.05000,1.823
14,mlp.down_proj,0.0000002847,0.05000,5.866
15,self_attn.v_proj,0.0000000321,0.05000,3.789
15,self_attn.k_proj,0.0000000497,0.05000,3.805
15,self_attn.q_proj,0.0000002612,0.05000,3.890
15,self_attn.o_proj,0.0000000868,0.05000,0.862
15,mlp.up_proj,0.0000009975,0.05000,1.744
15,mlp.gate_proj,0.0000009431,0.05000,1.748
15,mlp.down_proj,0.0000003023,0.05000,5.621
16,self_attn.q_proj,0.0000002790,0.05000,2.622
16,self_attn.k_proj,0.0000000447,0.05000,2.629
16,self_attn.v_proj,0.0000000462,0.05000,2.644
16,self_attn.o_proj,0.0000001286,0.05000,0.839
16,mlp.up_proj,0.0000010595,0.05000,1.755
16,mlp.gate_proj,0.0000010016,0.05000,1.755
16,mlp.down_proj,0.0000003172,0.05000,5.590
17,self_attn.q_proj,0.0000003178,0.05000,2.550
17,self_attn.v_proj,0.0000000503,0.05000,2.574
17,self_attn.k_proj,0.0000000467,0.05000,2.594
17,self_attn.o_proj,0.0000001092,0.05000,0.865
17,mlp.up_proj,0.0000012212,0.05000,1.691
17,mlp.gate_proj,0.0000011384,0.05000,1.691
17,mlp.down_proj,0.0000004105,0.05000,5.573
18,self_attn.v_proj,0.0000000558,0.05000,2.441
18,self_attn.k_proj,0.0000000355,0.05000,2.474
18,self_attn.q_proj,0.0000002488,0.05000,2.482
18,self_attn.o_proj,0.0000002174,0.05000,0.858
18,mlp.up_proj,0.0000012998,0.05000,1.713
18,mlp.gate_proj,0.0000012134,0.05000,1.719
18,mlp.down_proj,0.0000004943,0.05000,5.604
19,self_attn.q_proj,0.0000002946,0.05000,2.463
19,self_attn.k_proj,0.0000000362,0.05000,2.486
19,self_attn.v_proj,0.0000000733,0.05000,2.516
19,self_attn.o_proj,0.0000002530,0.05000,0.848
19,mlp.up_proj,0.0000014108,0.05000,1.724
19,mlp.gate_proj,0.0000013564,0.05000,1.730
19,mlp.down_proj,0.0000006319,0.05000,5.626
20,self_attn.q_proj,0.0000002772,0.05000,2.549
20,self_attn.v_proj,0.0000000775,0.05000,2.581
20,self_attn.k_proj,0.0000000353,0.05000,2.595
20,self_attn.o_proj,0.0000001905,0.05000,0.848
20,mlp.gate_proj,0.0000017158,0.05000,1.712
20,mlp.up_proj,0.0000017782,0.05000,1.716
20,mlp.down_proj,0.0000011989,0.05000,5.666
21,self_attn.k_proj,0.0000000390,0.05000,2.589
21,self_attn.v_proj,0.0000001106,0.05000,2.622
21,self_attn.q_proj,0.0000003375,0.05000,2.633
21,self_attn.o_proj,0.0000003695,0.05000,0.867
21,mlp.up_proj,0.0000022832,0.05000,1.698
21,mlp.gate_proj,0.0000022574,0.05000,1.705
21,mlp.down_proj,0.0000017943,0.05000,5.606
22,self_attn.q_proj,0.0000005025,0.05000,2.727
22,self_attn.k_proj,0.0000000550,0.05000,2.731
22,self_attn.v_proj,0.0000001965,0.05000,2.739
22,self_attn.o_proj,0.0000003003,0.05000,0.861
22,mlp.up_proj,0.0000031518,0.05000,1.768
22,mlp.gate_proj,0.0000030812,0.05000,1.776
22,mlp.down_proj,0.0000031401,0.05000,5.648
23,self_attn.k_proj,0.0000000747,0.05000,2.695
23,self_attn.v_proj,0.0000002885,0.05000,2.705
23,self_attn.q_proj,0.0000006291,0.05000,2.714
23,self_attn.o_proj,0.0000006152,0.05000,0.871
23,mlp.up_proj,0.0000041236,0.05000,1.787
23,mlp.gate_proj,0.0000039755,0.05000,1.794
23,mlp.down_proj,0.0000037470,0.05000,5.645
24,self_attn.q_proj,0.0000005010,0.05000,3.537
24,self_attn.v_proj,0.0000002462,0.05000,3.574
24,self_attn.k_proj,0.0000000591,0.05000,3.643
24,self_attn.o_proj,0.0000004400,0.05000,0.855
24,mlp.gate_proj,0.0000040475,0.05000,1.760
24,mlp.up_proj,0.0000044454,0.05000,1.770
24,mlp.down_proj,0.0000049576,0.05000,5.640
25,self_attn.v_proj,0.0000003608,0.05000,2.477
25,self_attn.q_proj,0.0000005041,0.05000,2.507
25,self_attn.k_proj,0.0000000499,0.05000,2.533
25,self_attn.o_proj,0.0000006603,0.05000,0.887
25,mlp.up_proj,0.0000053732,0.05000,1.737
25,mlp.gate_proj,0.0000047783,0.05000,1.737
25,mlp.down_proj,0.0000070089,0.05000,5.685
26,self_attn.q_proj,0.0000007222,0.05000,3.921
26,self_attn.v_proj,0.0000006790,0.05000,3.977
26,self_attn.k_proj,0.0000000789,0.05000,4.082
26,self_attn.o_proj,0.0000011606,0.05000,0.862
26,mlp.up_proj,0.0000056787,0.05000,2.722
26,mlp.gate_proj,0.0000050093,0.05000,2.732
26,mlp.down_proj,0.0000140491,0.05000,5.705
27,self_attn.v_proj,0.0000007066,0.05000,2.857
27,self_attn.q_proj,0.0000010869,0.05000,2.898
27,self_attn.k_proj,0.0000001030,0.05000,2.932
27,self_attn.o_proj,0.0000015821,0.05000,0.909
27,mlp.up_proj,0.0000063775,0.05000,1.905
27,mlp.gate_proj,0.0000059692,0.05000,1.912
27,mlp.down_proj,0.0000325339,0.05000,5.683