Llama_3_2_1B_GPTQ_4bit / quant_log.csv
dhdbsrlw's picture
Upload checkpoint folder
29cd4ae verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.0000015231,0.05000,2.649
0,self_attn.q_proj,0.0000032633,0.05000,2.865
0,self_attn.v_proj,0.0000000485,0.05000,2.876
0,self_attn.o_proj,0.0000000048,0.05000,0.521
0,mlp.up_proj,0.0000023772,0.05000,1.145
0,mlp.gate_proj,0.0000030530,0.05000,1.156
0,mlp.down_proj,0.0000000174,0.05000,1.825
1,self_attn.k_proj,0.0000033035,0.05000,3.590
1,self_attn.v_proj,0.0000002005,0.05000,3.655
1,self_attn.q_proj,0.0000065693,0.05000,3.670
1,self_attn.o_proj,0.0000000153,0.05000,0.519
1,mlp.gate_proj,0.0000053029,0.05000,1.177
1,mlp.up_proj,0.0000038697,0.05000,1.184
1,mlp.down_proj,0.0000010461,0.05000,1.814
2,self_attn.q_proj,0.0000140619,0.05000,2.400
2,self_attn.k_proj,0.0000069570,0.05000,2.432
2,self_attn.v_proj,0.0000005373,0.05000,2.445
2,self_attn.o_proj,0.0000000230,0.05000,0.498
2,mlp.up_proj,0.0000052275,0.05000,1.069
2,mlp.gate_proj,0.0000083361,0.05000,1.086
2,mlp.down_proj,0.0000000661,0.05000,1.822
3,self_attn.k_proj,0.0000039491,0.05000,3.246
3,self_attn.v_proj,0.0000005910,0.05000,3.304
3,self_attn.q_proj,0.0000087343,0.05000,3.311
3,self_attn.o_proj,0.0000000422,0.05000,0.510
3,mlp.gate_proj,0.0000128088,0.05000,1.226
3,mlp.up_proj,0.0000064482,0.05000,1.236
3,mlp.down_proj,0.0000000967,0.05000,1.870
4,self_attn.q_proj,0.0000093078,0.05000,2.659
4,self_attn.v_proj,0.0000005821,0.05000,2.708
4,self_attn.k_proj,0.0000045687,0.05000,2.790
4,self_attn.o_proj,0.0000000687,0.05000,0.517
4,mlp.gate_proj,0.0000141758,0.05000,1.119
4,mlp.up_proj,0.0000066277,0.05000,1.129
4,mlp.down_proj,0.0000001093,0.05000,1.827
5,self_attn.v_proj,0.0000005532,0.05000,3.302
5,self_attn.k_proj,0.0000067406,0.05000,3.330
5,self_attn.q_proj,0.0000127724,0.05000,3.383
5,self_attn.o_proj,0.0000000714,0.05000,0.476
5,mlp.gate_proj,0.0000129943,0.05000,2.022
5,mlp.up_proj,0.0000070792,0.05000,2.055
5,mlp.down_proj,0.0000001317,0.05000,1.859
6,self_attn.k_proj,0.0000053446,0.05000,4.033
6,self_attn.q_proj,0.0000086090,0.05000,4.139
6,self_attn.v_proj,0.0000006527,0.05000,4.209
6,self_attn.o_proj,0.0000001050,0.05000,0.503
6,mlp.up_proj,0.0000074241,0.05000,1.226
6,mlp.gate_proj,0.0000134288,0.05000,1.230
6,mlp.down_proj,0.0000001399,0.05000,2.160
7,self_attn.v_proj,0.0000007160,0.05000,3.509
7,self_attn.k_proj,0.0000053550,0.05000,3.564
7,self_attn.q_proj,0.0000100636,0.05000,3.571
7,self_attn.o_proj,0.0000001051,0.05000,0.516
7,mlp.gate_proj,0.0000131917,0.05000,1.253
7,mlp.up_proj,0.0000080153,0.05000,1.253
7,mlp.down_proj,0.0000001663,0.05000,1.868
8,self_attn.k_proj,0.0000072736,0.05000,3.180
8,self_attn.q_proj,0.0000120220,0.05000,3.234
8,self_attn.v_proj,0.0000007166,0.05000,3.278
8,self_attn.o_proj,0.0000001545,0.05000,0.509
8,mlp.gate_proj,0.0000156649,0.05000,1.268
8,mlp.up_proj,0.0000095675,0.05000,1.273
8,mlp.down_proj,0.0000002313,0.05000,1.829
9,self_attn.k_proj,0.0000051501,0.05000,3.377
9,self_attn.q_proj,0.0000128264,0.05000,3.396
9,self_attn.v_proj,0.0000008294,0.05000,3.415
9,self_attn.o_proj,0.0000001717,0.05000,0.502
9,mlp.gate_proj,0.0000162905,0.05000,1.234
9,mlp.up_proj,0.0000097715,0.05000,1.238
9,mlp.down_proj,0.0000002682,0.05000,1.827
10,self_attn.v_proj,0.0000011443,0.05000,3.313
10,self_attn.q_proj,0.0000139861,0.05000,3.381
10,self_attn.k_proj,0.0000061532,0.05000,3.411
10,self_attn.o_proj,0.0000001267,0.05000,0.493
10,mlp.gate_proj,0.0000173171,0.05000,1.220
10,mlp.up_proj,0.0000108839,0.05000,1.223
10,mlp.down_proj,0.0000003280,0.05000,1.864
11,self_attn.k_proj,0.0000066866,0.05000,2.985
11,self_attn.v_proj,0.0000009090,0.05000,3.134
11,self_attn.q_proj,0.0000124617,0.05000,3.157
11,self_attn.o_proj,0.0000000955,0.05000,0.526
11,mlp.gate_proj,0.0000174840,0.05000,1.241
11,mlp.up_proj,0.0000111882,0.05000,1.240
11,mlp.down_proj,0.0000003564,0.05000,1.859
12,self_attn.q_proj,0.0000122400,0.05000,2.690
12,self_attn.v_proj,0.0000009516,0.05000,2.745
12,self_attn.k_proj,0.0000063789,0.05000,2.766
12,self_attn.o_proj,0.0000000996,0.05000,0.490
12,mlp.gate_proj,0.0000166709,0.05000,1.183
12,mlp.up_proj,0.0000111118,0.05000,1.190
12,mlp.down_proj,0.0000003938,0.05000,1.853
13,self_attn.q_proj,0.0000141233,0.05000,3.080
13,self_attn.v_proj,0.0000016864,0.05000,3.151
13,self_attn.k_proj,0.0000064695,0.05000,3.185
13,self_attn.o_proj,0.0000001103,0.05000,0.499
13,mlp.gate_proj,0.0000172082,0.05000,1.233
13,mlp.up_proj,0.0000123625,0.05000,1.240
13,mlp.down_proj,0.0000005548,0.05000,1.880
14,self_attn.v_proj,0.0000036409,0.05000,3.412
14,self_attn.k_proj,0.0000066772,0.05000,3.422
14,self_attn.q_proj,0.0000137069,0.05000,3.440
14,self_attn.o_proj,0.0000002190,0.05000,0.501
14,mlp.up_proj,0.0000129504,0.05000,1.224
14,mlp.gate_proj,0.0000192394,0.05000,1.234
14,mlp.down_proj,0.0000007553,0.05000,1.884
15,self_attn.q_proj,0.0000123336,0.05000,3.152
15,self_attn.k_proj,0.0000072337,0.05000,3.281
15,self_attn.v_proj,0.0000035618,0.05000,3.288
15,self_attn.o_proj,0.0000011874,0.05000,0.511
15,mlp.up_proj,0.0000154439,0.05000,1.126
15,mlp.gate_proj,0.0000206278,0.05000,1.132
15,mlp.down_proj,0.0000024395,0.05000,1.842