8B-instruct-int4 / quant_log.csv
Matt300209's picture
Upload folder using huggingface_hub
e33a532 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.36111963,0.01000,1.132
0,self_attn.v_proj,0.00330429,0.01000,0.942
0,self_attn.q_proj,0.52731681,0.01000,0.963
0,self_attn.o_proj,0.00026867,0.01000,0.983
0,mlp.up_proj,0.23463088,0.01000,0.968
0,mlp.gate_proj,0.28276342,0.01000,0.967
0,mlp.down_proj,0.00119561,0.01000,4.012
1,self_attn.k_proj,0.24816991,0.01000,0.951
1,self_attn.v_proj,0.00948147,0.01000,0.942
1,self_attn.q_proj,0.44486734,0.01000,0.962
1,self_attn.o_proj,0.00069429,0.01000,0.968
1,mlp.up_proj,0.44346130,0.01000,0.977
1,mlp.gate_proj,0.52371848,0.01000,0.978
1,mlp.down_proj,0.16304456,0.01000,4.006
2,self_attn.k_proj,1.27576137,0.01000,0.947
2,self_attn.v_proj,0.05388402,0.01000,0.972
2,self_attn.q_proj,1.91546702,0.01000,0.963
2,self_attn.o_proj,0.00095444,0.01000,0.962
2,mlp.up_proj,0.75267899,0.01000,0.978
2,mlp.gate_proj,0.93858600,0.01000,0.971
2,mlp.down_proj,0.00534942,0.01000,4.054
3,self_attn.k_proj,1.07618117,0.01000,0.951
3,self_attn.v_proj,0.09808896,0.01000,0.966
3,self_attn.q_proj,1.91644359,0.01000,0.963
3,self_attn.o_proj,0.00214759,0.01000,0.961
3,mlp.up_proj,1.06110489,0.01000,0.982
3,mlp.gate_proj,1.51582575,0.01000,0.989
3,mlp.down_proj,0.01012792,0.01000,3.993
4,self_attn.k_proj,1.03121889,0.01000,0.952
4,self_attn.v_proj,0.09737435,0.01000,0.943
4,self_attn.q_proj,1.78057146,0.01000,0.967
4,self_attn.o_proj,0.00524764,0.01000,0.964
4,mlp.up_proj,1.38912082,0.01000,0.981
4,mlp.gate_proj,2.25040221,0.01000,0.976
4,mlp.down_proj,0.01820908,0.01000,4.032
5,self_attn.k_proj,1.77245164,0.01000,0.949
5,self_attn.v_proj,0.10094162,0.01000,0.958
5,self_attn.q_proj,2.76073647,0.01000,0.963
5,self_attn.o_proj,0.00572381,0.01000,0.962
5,mlp.up_proj,1.76203442,0.01000,0.984
5,mlp.gate_proj,2.82282686,0.01000,0.978
5,mlp.down_proj,0.02650169,0.01000,4.003
6,self_attn.k_proj,1.46186721,0.01000,0.951
6,self_attn.v_proj,0.11557909,0.01000,0.950
6,self_attn.q_proj,2.57779884,0.01000,0.960
6,self_attn.o_proj,0.01030868,0.01000,0.965
6,mlp.up_proj,1.95960164,0.01000,0.987
6,mlp.gate_proj,3.18044949,0.01000,0.982
6,mlp.down_proj,0.03279492,0.01000,4.409
7,self_attn.k_proj,1.48253345,0.01000,0.948
7,self_attn.v_proj,0.12368202,0.01000,0.944
7,self_attn.q_proj,2.45336533,0.01000,0.955
7,self_attn.o_proj,0.01420613,0.01000,0.970
7,mlp.up_proj,2.13492918,0.01000,0.988
7,mlp.gate_proj,3.24488592,0.01000,0.983
7,mlp.down_proj,0.03850950,0.01000,4.023
8,self_attn.k_proj,1.93849897,0.01000,0.954
8,self_attn.v_proj,0.16590264,0.01000,0.950
8,self_attn.q_proj,3.13656378,0.01000,0.970
8,self_attn.o_proj,0.01967191,0.01000,0.958
8,mlp.up_proj,2.29845905,0.01000,0.982
8,mlp.gate_proj,3.54030752,0.01000,0.982
8,mlp.down_proj,0.04251836,0.01000,4.048
9,self_attn.k_proj,1.89687407,0.01000,0.955
9,self_attn.v_proj,0.23918010,0.01000,0.973
9,self_attn.q_proj,3.16648197,0.01000,0.965
9,self_attn.o_proj,0.02422045,0.01000,0.962
9,mlp.up_proj,2.43423367,0.01000,1.343
9,mlp.gate_proj,3.77251744,0.01000,0.981
9,mlp.down_proj,0.04667648,0.01000,4.252
10,self_attn.k_proj,2.30144119,0.01000,0.954
10,self_attn.v_proj,0.18498819,0.01000,0.965
10,self_attn.q_proj,3.73618531,0.01000,0.973
10,self_attn.o_proj,0.02161483,0.01000,0.963
10,mlp.up_proj,2.54761338,0.01000,0.989
10,mlp.gate_proj,3.68303084,0.01000,0.980
10,mlp.down_proj,0.04879866,0.01000,4.002
11,self_attn.k_proj,2.10925364,0.01000,0.953
11,self_attn.v_proj,0.19330561,0.01000,0.947
11,self_attn.q_proj,3.28746176,0.01000,0.961
11,self_attn.o_proj,0.02294213,0.01000,0.965
11,mlp.up_proj,2.67688942,0.01000,0.983
11,mlp.gate_proj,3.74871111,0.01000,0.980
11,mlp.down_proj,0.05176591,0.01000,4.099
12,self_attn.k_proj,1.64494085,0.01000,0.949
12,self_attn.v_proj,0.22913060,0.01000,0.956
12,self_attn.q_proj,2.86509371,0.01000,0.969
12,self_attn.o_proj,0.02996064,0.01000,0.961
12,mlp.up_proj,2.74297428,0.01000,0.989
12,mlp.gate_proj,3.63758588,0.01000,0.985
12,mlp.down_proj,0.05879739,0.01000,4.043
13,self_attn.k_proj,2.44561863,0.01000,0.956
13,self_attn.v_proj,0.25090086,0.01000,0.978
13,self_attn.q_proj,3.72013021,0.01000,0.972
13,self_attn.o_proj,0.03329192,0.01000,0.967
13,mlp.up_proj,2.89052248,0.01000,0.989
13,mlp.gate_proj,3.83109856,0.01000,1.001
13,mlp.down_proj,0.06681926,0.01000,4.075
14,self_attn.k_proj,2.59889841,0.01000,0.956
14,self_attn.v_proj,0.25943100,0.01000,0.980
14,self_attn.q_proj,3.71864319,0.01000,0.979
14,self_attn.o_proj,0.03607188,0.01000,0.963
14,mlp.up_proj,3.16311407,0.01000,0.986
14,mlp.gate_proj,4.43673038,0.01000,0.983
14,mlp.down_proj,0.08331311,0.01000,4.020
15,self_attn.k_proj,2.41041493,0.01000,0.961
15,self_attn.v_proj,0.32465303,0.01000,0.970
15,self_attn.q_proj,4.43637896,0.01000,0.982
15,self_attn.o_proj,0.04316147,0.01000,0.970
15,mlp.up_proj,3.33997822,0.01000,0.988
15,mlp.gate_proj,4.94344902,0.01000,1.021
15,mlp.down_proj,0.10118946,0.01000,4.714
16,self_attn.k_proj,2.50961113,0.01000,0.965
16,self_attn.v_proj,0.29429543,0.01000,0.957
16,self_attn.q_proj,4.07947636,0.01000,0.968
16,self_attn.o_proj,0.03333106,0.01000,0.975
16,mlp.up_proj,3.60199404,0.01000,0.984
16,mlp.gate_proj,5.63074589,0.01000,0.976
16,mlp.down_proj,0.11140943,0.01000,4.086
17,self_attn.k_proj,2.74082637,0.01000,0.961
17,self_attn.v_proj,0.32146555,0.01000,0.955
17,self_attn.q_proj,4.31714869,0.01000,0.977
17,self_attn.o_proj,0.03052786,0.01000,0.967
17,mlp.up_proj,3.74027133,0.01000,0.986
17,mlp.gate_proj,5.97789478,0.01000,0.992
17,mlp.down_proj,0.12818229,0.01000,4.005
18,self_attn.k_proj,3.02894711,0.01000,0.957
18,self_attn.v_proj,0.33139157,0.01000,0.962
18,self_attn.q_proj,4.38174438,0.01000,1.187
18,self_attn.o_proj,0.02073601,0.01000,0.973
18,mlp.up_proj,3.95718646,0.01000,1.081
18,mlp.gate_proj,6.38988972,0.01000,1.134
18,mlp.down_proj,0.12699364,0.01000,4.431
19,self_attn.k_proj,2.72588944,0.01000,1.079
19,self_attn.v_proj,0.36277997,0.01000,1.053
19,self_attn.q_proj,4.48861694,0.01000,1.078
19,self_attn.o_proj,0.01849649,0.01000,1.106
19,mlp.up_proj,4.11148834,0.01000,1.104
19,mlp.gate_proj,6.76255035,0.01000,1.077
19,mlp.down_proj,0.13344963,0.01000,4.397
20,self_attn.k_proj,2.99772930,0.01000,1.048
20,self_attn.v_proj,0.39009190,0.01000,1.045
20,self_attn.q_proj,4.62490082,0.01000,1.075
20,self_attn.o_proj,0.02120636,0.01000,1.091
20,mlp.up_proj,4.43619490,0.01000,1.133
20,mlp.gate_proj,7.22839403,0.01000,1.113
20,mlp.down_proj,0.14441478,0.01000,4.425
21,self_attn.k_proj,2.94480252,0.01000,1.066
21,self_attn.v_proj,0.42260897,0.01000,1.056
21,self_attn.q_proj,4.43837166,0.01000,1.074
21,self_attn.o_proj,0.02850885,0.01000,1.062
21,mlp.up_proj,4.73225355,0.01000,1.021
21,mlp.gate_proj,7.77117300,0.01000,1.070
21,mlp.down_proj,0.16843449,0.01000,5.555
22,self_attn.k_proj,3.09630203,0.01000,0.971
22,self_attn.v_proj,0.49371791,0.01000,1.004
22,self_attn.q_proj,4.48650932,0.01000,0.987
22,self_attn.o_proj,0.02654779,0.01000,0.978
22,mlp.up_proj,4.93645144,0.01000,1.015
22,mlp.gate_proj,8.03310680,0.01000,1.009
22,mlp.down_proj,0.17289530,0.01000,4.040
23,self_attn.k_proj,2.98398399,0.01000,0.954
23,self_attn.v_proj,0.53825200,0.01000,0.972
23,self_attn.q_proj,4.67381859,0.01000,0.961
23,self_attn.o_proj,0.02713704,0.01000,0.963
23,mlp.up_proj,5.21848965,0.01000,0.993
23,mlp.gate_proj,8.43232536,0.01000,0.997
23,mlp.down_proj,0.18386570,0.01000,4.056
24,self_attn.k_proj,2.98328638,0.01000,0.953
24,self_attn.v_proj,0.67641538,0.01000,0.944
24,self_attn.q_proj,4.71260357,0.01000,0.964
24,self_attn.o_proj,0.02995079,0.01000,0.968
24,mlp.up_proj,5.57473373,0.01000,0.982
24,mlp.gate_proj,9.01408386,0.01000,0.981
24,mlp.down_proj,0.19735718,0.01000,4.019
25,self_attn.k_proj,2.80995131,0.01000,0.971
25,self_attn.v_proj,0.70912492,0.01000,0.987
25,self_attn.q_proj,4.73544788,0.01000,0.968
25,self_attn.o_proj,0.03377030,0.01000,0.962
25,mlp.up_proj,5.95643902,0.01000,0.983
25,mlp.gate_proj,9.63203812,0.01000,0.981
25,mlp.down_proj,0.21878015,0.01000,4.016
26,self_attn.k_proj,2.99053884,0.01000,0.956
26,self_attn.v_proj,0.65835601,0.01000,0.969
26,self_attn.q_proj,4.58326244,0.01000,0.982
26,self_attn.o_proj,0.04630172,0.01000,0.966
26,mlp.up_proj,6.38272285,0.01000,0.983
26,mlp.gate_proj,10.33224392,0.01000,0.979
26,mlp.down_proj,0.24722236,0.01000,4.049
27,self_attn.k_proj,3.26289296,0.01000,0.950
27,self_attn.v_proj,0.95175558,0.01000,0.966
27,self_attn.q_proj,4.78752518,0.01000,0.960
27,self_attn.o_proj,0.06208333,0.01000,0.982
27,mlp.up_proj,7.02820301,0.01000,0.990
27,mlp.gate_proj,11.29987144,0.01000,0.986
27,mlp.down_proj,0.29721794,0.01000,4.009
28,self_attn.k_proj,2.59787798,0.01000,0.953
28,self_attn.v_proj,0.84426367,0.01000,0.946
28,self_attn.q_proj,4.46915436,0.01000,0.964
28,self_attn.o_proj,0.09729099,0.01000,0.970
28,mlp.up_proj,7.81499147,0.01000,0.996
28,mlp.gate_proj,11.99997711,0.01000,0.981
28,mlp.down_proj,0.38746351,0.01000,4.051
29,self_attn.k_proj,2.69152451,0.01000,0.954
29,self_attn.v_proj,1.02270174,0.01000,0.950
29,self_attn.q_proj,4.71809244,0.01000,0.973
29,self_attn.o_proj,0.08194697,0.01000,0.969
29,mlp.up_proj,8.35252285,0.01000,0.995
29,mlp.gate_proj,12.24577141,0.01000,1.003
29,mlp.down_proj,0.53259313,0.01000,4.059
30,self_attn.k_proj,2.70090246,0.01000,0.956
30,self_attn.v_proj,1.38668847,0.01000,1.731
30,self_attn.q_proj,4.37570143,0.01000,1.174
30,self_attn.o_proj,0.16421506,0.01000,0.969
30,mlp.up_proj,8.91942406,0.01000,0.990
30,mlp.gate_proj,13.37013245,0.01000,0.986
30,mlp.down_proj,0.85872936,0.01000,4.022
31,self_attn.k_proj,1.97329688,0.01000,0.959
31,self_attn.v_proj,0.84535497,0.01000,0.967
31,self_attn.q_proj,3.81004381,0.01000,1.001
31,self_attn.o_proj,0.26083553,0.01000,0.969
31,mlp.up_proj,8.20458317,0.01000,0.988
31,mlp.gate_proj,11.96145439,0.01000,0.987
31,mlp.down_proj,2.20310783,0.01000,4.006