frankdarkluo's picture
Upload folder using huggingface_hub
2ba16d4 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.0000000074,0.05000,4.076
0,self_attn.q_proj,0.0000000206,0.05000,4.106
0,self_attn.v_proj,0.0000000015,0.05000,4.122
0,self_attn.o_proj,0.0000000157,0.05000,1.158
0,mlp.up_proj,0.0000000114,0.05000,3.470
0,mlp.gate_proj,0.0000000133,0.05000,3.490
0,mlp.down_proj,0.0000000193,0.05000,3.869
1,self_attn.q_proj,0.0000000006,0.05000,4.900
1,self_attn.k_proj,0.0000000002,0.05000,4.926
1,self_attn.v_proj,0.0000000001,0.05000,4.943
1,self_attn.o_proj,0.0000000002,0.05000,1.201
1,mlp.up_proj,0.0000000479,0.05000,3.198
1,mlp.gate_proj,0.0000001445,0.05000,3.210
1,mlp.down_proj,0.0000000009,0.05000,3.574
2,self_attn.v_proj,0.0000000004,0.05000,4.326
2,self_attn.q_proj,0.0000000029,0.05000,4.358
2,self_attn.k_proj,0.0000000011,0.05000,4.433
2,self_attn.o_proj,0.0000000015,0.05000,1.285
2,mlp.gate_proj,0.0000002588,0.05000,3.458
2,mlp.up_proj,0.0000001298,0.05000,3.476
2,mlp.down_proj,0.0000000050,0.05000,3.544
3,self_attn.k_proj,0.0000000071,0.05000,3.937
3,self_attn.q_proj,0.0000000193,0.05000,3.959
3,self_attn.v_proj,0.0000000026,0.05000,3.972
3,self_attn.o_proj,0.0000000043,0.05000,1.206
3,mlp.gate_proj,0.0000003206,0.05000,3.242
3,mlp.up_proj,0.0000001479,0.05000,3.252
3,mlp.down_proj,0.0000000121,0.05000,3.914
4,self_attn.q_proj,0.0000000231,0.05000,4.343
4,self_attn.v_proj,0.0000000033,0.05000,4.405
4,self_attn.k_proj,0.0000000086,0.05000,4.416
4,self_attn.o_proj,0.0000000077,0.05000,1.169
4,mlp.up_proj,0.0000002798,0.05000,3.357
4,mlp.gate_proj,0.0000005087,0.05000,3.379
4,mlp.down_proj,0.0001496382,0.05000,3.528
5,self_attn.k_proj,0.0000000318,0.05000,3.794
5,self_attn.q_proj,0.0000001019,0.05000,3.870
5,self_attn.v_proj,0.0000000151,0.05000,3.907
5,self_attn.o_proj,0.0000000132,0.05000,1.150
5,mlp.up_proj,0.0000004159,0.05000,2.522
5,mlp.gate_proj,0.0000007649,0.05000,2.546
5,mlp.down_proj,0.0000001460,0.05000,3.541
6,self_attn.q_proj,0.0000001069,0.05000,3.811
6,self_attn.k_proj,0.0000000310,0.05000,3.860
6,self_attn.v_proj,0.0000000184,0.05000,3.866
6,self_attn.o_proj,0.0000000110,0.05000,1.143
6,mlp.up_proj,0.0000006236,0.05000,2.564
6,mlp.gate_proj,0.0000011021,0.05000,2.570
6,mlp.down_proj,0.0000001073,0.05000,3.539
7,self_attn.k_proj,0.0000000430,0.05000,3.557
7,self_attn.v_proj,0.0000000261,0.05000,3.639
7,self_attn.q_proj,0.0000001502,0.05000,3.650
7,self_attn.o_proj,0.0000000111,0.05000,1.151
7,mlp.up_proj,0.0000007642,0.05000,2.499
7,mlp.gate_proj,0.0000013492,0.05000,2.508
7,mlp.down_proj,0.0000000492,0.05000,3.530
8,self_attn.q_proj,0.0000001647,0.05000,3.726
8,self_attn.k_proj,0.0000000498,0.05000,3.742
8,self_attn.v_proj,0.0000000280,0.05000,3.749
8,self_attn.o_proj,0.0000000091,0.05000,1.195
8,mlp.gate_proj,0.0000008816,0.05000,2.494
8,mlp.up_proj,0.0000005125,0.05000,2.498
8,mlp.down_proj,0.0000000619,0.05000,3.521
9,self_attn.k_proj,0.0000000422,0.05000,3.545
9,self_attn.v_proj,0.0000000267,0.05000,3.561
9,self_attn.q_proj,0.0000001460,0.05000,3.581
9,self_attn.o_proj,0.0000000168,0.05000,1.141
9,mlp.up_proj,0.0000003213,0.05000,2.513
9,mlp.gate_proj,0.0000003591,0.05000,2.522
9,mlp.down_proj,0.0000000803,0.05000,3.551
10,self_attn.q_proj,0.0000002188,0.05000,3.755
10,self_attn.k_proj,0.0000000617,0.05000,3.799
10,self_attn.v_proj,0.0000000361,0.05000,3.813
10,self_attn.o_proj,0.0000000154,0.05000,1.153
10,mlp.up_proj,0.0000003657,0.05000,2.443
10,mlp.gate_proj,0.0000004093,0.05000,2.448
10,mlp.down_proj,0.0000000965,0.05000,3.616
11,self_attn.k_proj,0.0000000474,0.05000,3.524
11,self_attn.v_proj,0.0000000273,0.05000,3.604
11,self_attn.q_proj,0.0000001692,0.05000,3.612
11,self_attn.o_proj,0.0000000241,0.05000,1.142
11,mlp.up_proj,0.0000004200,0.05000,2.538
11,mlp.gate_proj,0.0000005279,0.05000,2.555
11,mlp.down_proj,0.0000000851,0.05000,3.562
12,self_attn.q_proj,0.0000002061,0.05000,3.418
12,self_attn.v_proj,0.0000000328,0.05000,3.534
12,self_attn.k_proj,0.0000000577,0.05000,3.571
12,self_attn.o_proj,0.0000000278,0.05000,1.146
12,mlp.gate_proj,0.0000004661,0.05000,2.530
12,mlp.up_proj,0.0000004365,0.05000,2.534
12,mlp.down_proj,0.0000001030,0.05000,3.555
13,self_attn.q_proj,0.0000002177,0.05000,3.406
13,self_attn.k_proj,0.0000000620,0.05000,3.407
13,self_attn.v_proj,0.0000000392,0.05000,3.455
13,self_attn.o_proj,0.0000000293,0.05000,1.144
13,mlp.up_proj,0.0000004977,0.05000,2.513
13,mlp.gate_proj,0.0000005316,0.05000,2.535
13,mlp.down_proj,0.0000001189,0.05000,3.533
14,self_attn.q_proj,0.0000002546,0.05000,3.494
14,self_attn.v_proj,0.0000000387,0.05000,3.545
14,self_attn.k_proj,0.0000000740,0.05000,3.582
14,self_attn.o_proj,0.0000000303,0.05000,1.150
14,mlp.up_proj,0.0000005113,0.05000,2.471
14,mlp.gate_proj,0.0000005438,0.05000,2.477
14,mlp.down_proj,0.0000001245,0.05000,3.503
15,self_attn.k_proj,0.0000000593,0.05000,3.810
15,self_attn.q_proj,0.0000002137,0.05000,3.904
15,self_attn.v_proj,0.0000000407,0.05000,3.915
15,self_attn.o_proj,0.0000000397,0.05000,1.140
15,mlp.up_proj,0.0000005303,0.05000,2.377
15,mlp.gate_proj,0.0000005843,0.05000,2.391
15,mlp.down_proj,0.0000001302,0.05000,3.542
16,self_attn.q_proj,0.0000002011,0.05000,3.929
16,self_attn.v_proj,0.0000000299,0.05000,3.952
16,self_attn.k_proj,0.0000000633,0.05000,3.954
16,self_attn.o_proj,0.0000000320,0.05000,1.149
16,mlp.gate_proj,0.0000005026,0.05000,2.592
16,mlp.up_proj,0.0000004937,0.05000,2.598
16,mlp.down_proj,0.0000001260,0.05000,3.540
17,self_attn.k_proj,0.0000000676,0.05000,3.510
17,self_attn.v_proj,0.0000000323,0.05000,3.521
17,self_attn.q_proj,0.0000002323,0.05000,3.567
17,self_attn.o_proj,0.0000000340,0.05000,1.144
17,mlp.up_proj,0.0000004876,0.05000,2.553
17,mlp.gate_proj,0.0000004806,0.05000,2.580
17,mlp.down_proj,0.0000001191,0.05000,3.525
18,self_attn.q_proj,0.0000002289,0.05000,4.095
18,self_attn.v_proj,0.0000000371,0.05000,4.126
18,self_attn.k_proj,0.0000000658,0.05000,4.139
18,self_attn.o_proj,0.0000000409,0.05000,1.130
18,mlp.gate_proj,0.0000004643,0.05000,2.561
18,mlp.up_proj,0.0000004858,0.05000,2.569
18,mlp.down_proj,0.0000001185,0.05000,3.517
19,self_attn.q_proj,0.0000002764,0.05000,3.542
19,self_attn.v_proj,0.0000000402,0.05000,3.615
19,self_attn.k_proj,0.0000000741,0.05000,3.641
19,self_attn.o_proj,0.0000000308,0.05000,1.134
19,mlp.up_proj,0.0000005025,0.05000,2.549
19,mlp.gate_proj,0.0000004797,0.05000,2.579
19,mlp.down_proj,0.0000001231,0.05000,3.523
20,self_attn.q_proj,0.0000002709,0.05000,3.825
20,self_attn.v_proj,0.0000000383,0.05000,3.901
20,self_attn.k_proj,0.0000000785,0.05000,3.915
20,self_attn.o_proj,0.0000000425,0.05000,1.137
20,mlp.gate_proj,0.0000004417,0.05000,2.506
20,mlp.up_proj,0.0000004883,0.05000,2.505
20,mlp.down_proj,0.0000001268,0.05000,3.520
21,self_attn.k_proj,0.0000000683,0.05000,3.726
21,self_attn.q_proj,0.0000002360,0.05000,3.801
21,self_attn.v_proj,0.0000000327,0.05000,3.827
21,self_attn.o_proj,0.0000000444,0.05000,1.143
21,mlp.up_proj,0.0000004921,0.05000,2.515
21,mlp.gate_proj,0.0000004432,0.05000,2.532
21,mlp.down_proj,0.0000001214,0.05000,3.528
22,self_attn.v_proj,0.0000000495,0.05000,3.738
22,self_attn.k_proj,0.0000000745,0.05000,3.762
22,self_attn.q_proj,0.0000002610,0.05000,3.799
22,self_attn.o_proj,0.0000000528,0.05000,1.136
22,mlp.up_proj,0.0000004986,0.05000,2.533
22,mlp.gate_proj,0.0000004491,0.05000,2.540
22,mlp.down_proj,0.0000001492,0.05000,3.513
23,self_attn.k_proj,0.0000000683,0.05000,3.437
23,self_attn.v_proj,0.0000000480,0.05000,3.463
23,self_attn.q_proj,0.0000002551,0.05000,3.499
23,self_attn.o_proj,0.0000000544,0.05000,1.134
23,mlp.up_proj,0.0000005058,0.05000,2.529
23,mlp.gate_proj,0.0000004802,0.05000,2.532
23,mlp.down_proj,0.0000001372,0.05000,3.507
24,self_attn.q_proj,0.0000002997,0.05000,3.422
24,self_attn.k_proj,0.0000000956,0.05000,3.438
24,self_attn.v_proj,0.0000000430,0.05000,3.493
24,self_attn.o_proj,0.0000000590,0.05000,1.137
24,mlp.gate_proj,0.0000004554,0.05000,2.581
24,mlp.up_proj,0.0000004873,0.05000,2.587
24,mlp.down_proj,0.0000001235,0.05000,3.525
25,self_attn.k_proj,0.0000000914,0.05000,3.659
25,self_attn.v_proj,0.0000000552,0.05000,3.760
25,self_attn.q_proj,0.0000003244,0.05000,3.775
25,self_attn.o_proj,0.0000000401,0.05000,1.152
25,mlp.up_proj,0.0000004959,0.05000,2.504
25,mlp.gate_proj,0.0000004476,0.05000,2.527
25,mlp.down_proj,0.0000001325,0.05000,3.525
26,self_attn.q_proj,0.0000002927,0.05000,3.843
26,self_attn.v_proj,0.0000000365,0.05000,3.916
26,self_attn.k_proj,0.0000000829,0.05000,3.932
26,self_attn.o_proj,0.0000000480,0.05000,1.141
26,mlp.gate_proj,0.0000004655,0.05000,2.653
26,mlp.up_proj,0.0000005360,0.05000,2.661
26,mlp.down_proj,0.0000001535,0.05000,3.544
27,self_attn.k_proj,0.0000000845,0.05000,3.682
27,self_attn.q_proj,0.0000002836,0.05000,3.766
27,self_attn.v_proj,0.0000000448,0.05000,3.771
27,self_attn.o_proj,0.0000000720,0.05000,1.142
27,mlp.up_proj,0.0000005640,0.05000,2.558
27,mlp.gate_proj,0.0000004908,0.05000,2.587
27,mlp.down_proj,0.0000001856,0.05000,3.556
28,self_attn.q_proj,0.0000002748,0.05000,3.603
28,self_attn.v_proj,0.0000000634,0.05000,3.624
28,self_attn.k_proj,0.0000000678,0.05000,3.634
28,self_attn.o_proj,0.0000000759,0.05000,1.132
28,mlp.gate_proj,0.0000004960,0.05000,2.536
28,mlp.up_proj,0.0000005713,0.05000,2.547
28,mlp.down_proj,0.0000002030,0.05000,3.496
29,self_attn.q_proj,0.0000003218,0.05000,3.824
29,self_attn.k_proj,0.0000000896,0.05000,3.852
29,self_attn.v_proj,0.0000000643,0.05000,3.875
29,self_attn.o_proj,0.0000000759,0.05000,1.173
29,mlp.up_proj,0.0000005743,0.05000,2.581
29,mlp.gate_proj,0.0000005014,0.05000,2.612
29,mlp.down_proj,0.0000002231,0.05000,3.538
30,self_attn.k_proj,0.0000000758,0.05000,3.898
30,self_attn.v_proj,0.0000000699,0.05000,3.898
30,self_attn.q_proj,0.0000002911,0.05000,3.909
30,self_attn.o_proj,0.0000000963,0.05000,1.151
30,mlp.gate_proj,0.0000005358,0.05000,2.578
30,mlp.up_proj,0.0000006059,0.05000,2.588
30,mlp.down_proj,0.0000002535,0.05000,3.543
31,self_attn.k_proj,0.0000000760,0.05000,3.357
31,self_attn.v_proj,0.0000000656,0.05000,3.472
31,self_attn.q_proj,0.0000002968,0.05000,3.484
31,self_attn.o_proj,0.0000000876,0.05000,1.145
31,mlp.up_proj,0.0000006837,0.05000,2.533
31,mlp.gate_proj,0.0000006198,0.05000,2.561
31,mlp.down_proj,0.0000003191,0.05000,3.539
32,self_attn.v_proj,0.0000000970,0.05000,3.365
32,self_attn.k_proj,0.0000000867,0.05000,3.400
32,self_attn.q_proj,0.0000003585,0.05000,3.454
32,self_attn.o_proj,0.0000000881,0.05000,1.140
32,mlp.up_proj,0.0000007260,0.05000,2.497
32,mlp.gate_proj,0.0000006735,0.05000,2.508
32,mlp.down_proj,0.0000003660,0.05000,3.544
33,self_attn.q_proj,0.0000003616,0.05000,3.409
33,self_attn.v_proj,0.0000000883,0.05000,3.419
33,self_attn.k_proj,0.0000000866,0.05000,3.445
33,self_attn.o_proj,0.0000001073,0.05000,1.146
33,mlp.up_proj,0.0000008888,0.05000,2.491
33,mlp.gate_proj,0.0000008382,0.05000,2.503
33,mlp.down_proj,0.0000005407,0.05000,3.533
34,self_attn.q_proj,0.0000004201,0.05000,4.001
34,self_attn.v_proj,0.0000001121,0.05000,4.025
34,self_attn.k_proj,0.0000000911,0.05000,4.040
34,self_attn.o_proj,0.0000000971,0.05000,1.147
34,mlp.gate_proj,0.0000010043,0.05000,2.583
34,mlp.up_proj,0.0000010385,0.05000,2.590
34,mlp.down_proj,0.0000006755,0.05000,3.535
35,self_attn.k_proj,0.0000000967,0.05000,3.599
35,self_attn.v_proj,0.0000001044,0.05000,3.693
35,self_attn.q_proj,0.0000003993,0.05000,3.725
35,self_attn.o_proj,0.0000001738,0.05000,1.149
35,mlp.up_proj,0.0000011876,0.05000,2.531
35,mlp.gate_proj,0.0000011666,0.05000,2.562
35,mlp.down_proj,0.0000008386,0.05000,3.509
36,self_attn.q_proj,0.0000004909,0.05000,3.529
36,self_attn.v_proj,0.0000001891,0.05000,3.537
36,self_attn.k_proj,0.0000001019,0.05000,3.595
36,self_attn.o_proj,0.0000001320,0.05000,1.139
36,mlp.up_proj,0.0000012988,0.05000,2.582
36,mlp.gate_proj,0.0000012655,0.05000,2.586
36,mlp.down_proj,0.0000010114,0.05000,3.563
37,self_attn.k_proj,0.0000001170,0.05000,3.401
37,self_attn.q_proj,0.0000005350,0.05000,3.436
37,self_attn.v_proj,0.0000001738,0.05000,3.502
37,self_attn.o_proj,0.0000001674,0.05000,1.149
37,mlp.up_proj,0.0000014454,0.05000,2.447
37,mlp.gate_proj,0.0000014013,0.05000,2.463
37,mlp.down_proj,0.0000011469,0.05000,3.576
38,self_attn.v_proj,0.0000001754,0.05000,3.757
38,self_attn.k_proj,0.0000001155,0.05000,3.769
38,self_attn.q_proj,0.0000005264,0.05000,3.782
38,self_attn.o_proj,0.0000001730,0.05000,1.162
38,mlp.up_proj,0.0000016110,0.05000,2.521
38,mlp.gate_proj,0.0000015450,0.05000,2.527
38,mlp.down_proj,0.0000013149,0.05000,3.546
39,self_attn.k_proj,0.0000001116,0.05000,3.312
39,self_attn.v_proj,0.0000001994,0.05000,3.365
39,self_attn.q_proj,0.0000005239,0.05000,3.436
39,self_attn.o_proj,0.0000002415,0.05000,1.161
39,mlp.up_proj,0.0000017928,0.05000,2.457
39,mlp.gate_proj,0.0000017018,0.05000,2.480
39,mlp.down_proj,0.0000015803,0.05000,3.542
40,self_attn.k_proj,0.0000001218,0.05000,3.695
40,self_attn.v_proj,0.0000002551,0.05000,3.695
40,self_attn.q_proj,0.0000005873,0.05000,3.705
40,self_attn.o_proj,0.0000002292,0.05000,1.161
40,mlp.up_proj,0.0000019417,0.05000,2.560
40,mlp.gate_proj,0.0000018318,0.05000,2.565
40,mlp.down_proj,0.0000018159,0.05000,3.546
41,self_attn.k_proj,0.0000001183,0.05000,3.569
41,self_attn.q_proj,0.0000005899,0.05000,3.615
41,self_attn.v_proj,0.0000002547,0.05000,3.669
41,self_attn.o_proj,0.0000001957,0.05000,1.160
41,mlp.up_proj,0.0000020936,0.05000,2.531
41,mlp.gate_proj,0.0000019421,0.05000,2.559
41,mlp.down_proj,0.0000020503,0.05000,3.620
42,self_attn.q_proj,0.0000006111,0.05000,4.035
42,self_attn.k_proj,0.0000001178,0.05000,4.064
42,self_attn.v_proj,0.0000002594,0.05000,4.076
42,self_attn.o_proj,0.0000002111,0.05000,1.154
42,mlp.up_proj,0.0000022532,0.05000,2.615
42,mlp.gate_proj,0.0000020654,0.05000,2.621
42,mlp.down_proj,0.0000024288,0.05000,3.587
43,self_attn.k_proj,0.0000001174,0.05000,3.388
43,self_attn.v_proj,0.0000004101,0.05000,3.428
43,self_attn.q_proj,0.0000006248,0.05000,3.506
43,self_attn.o_proj,0.0000003921,0.05000,1.144
43,mlp.up_proj,0.0000024706,0.05000,2.569
43,mlp.gate_proj,0.0000022215,0.05000,2.600
43,mlp.down_proj,0.0000029538,0.05000,3.545
44,self_attn.v_proj,0.0000004372,0.05000,3.535
44,self_attn.q_proj,0.0000005866,0.05000,3.572
44,self_attn.k_proj,0.0000001027,0.05000,3.589
44,self_attn.o_proj,0.0000005251,0.05000,1.141
44,mlp.gate_proj,0.0000023094,0.05000,2.631
44,mlp.up_proj,0.0000026141,0.05000,2.639
44,mlp.down_proj,0.0000044741,0.05000,3.559
45,self_attn.k_proj,0.0000001031,0.05000,3.699
45,self_attn.v_proj,0.0000005164,0.05000,3.829
45,self_attn.q_proj,0.0000006073,0.05000,3.843
45,self_attn.o_proj,0.0000005373,0.05000,1.156
45,mlp.up_proj,0.0000027213,0.05000,2.508
45,mlp.gate_proj,0.0000024398,0.05000,2.544
45,mlp.down_proj,0.0000050870,0.05000,3.565
46,self_attn.q_proj,0.0000005609,0.05000,4.140
46,self_attn.k_proj,0.0000000954,0.05000,4.193
46,self_attn.v_proj,0.0000005434,0.05000,4.204
46,self_attn.o_proj,0.0000009439,0.05000,1.152
46,mlp.up_proj,0.0000027407,0.05000,2.600
46,mlp.gate_proj,0.0000025642,0.05000,2.607
46,mlp.down_proj,0.0000072006,0.05000,3.551
47,self_attn.k_proj,0.0000000795,0.05000,3.488
47,self_attn.v_proj,0.0000002801,0.05000,3.552
47,self_attn.q_proj,0.0000004749,0.05000,3.603
47,self_attn.o_proj,0.0000004404,0.05000,1.152
47,mlp.up_proj,0.0000028646,0.05000,2.518
47,mlp.gate_proj,0.0000027463,0.05000,2.543
47,mlp.down_proj,0.0000116770,0.05000,3.533