phi-2-gptq-4bit / quant_log.csv
Crusadersk's picture
Self-quantized phi-2-gptq 4-bit (group_size=128, seed=42)
4d7ab2b verified
layer,module,loss,damp,time
0,self_attn.q_proj,0.0000858512,0.05000,1.097
0,self_attn.k_proj,0.0001029116,0.05000,1.129
0,self_attn.v_proj,0.0000302286,0.05000,0.869
0,self_attn.dense,0.0000123729,0.05000,0.857
0,mlp.fc1,0.0001053048,0.05000,0.953
0,mlp.fc2,0.0000069301,0.05000,4.047
1,self_attn.q_proj,0.0000778551,0.05000,0.913
1,self_attn.k_proj,0.0000812629,0.05000,0.925
1,self_attn.v_proj,0.0000198182,0.05000,0.865
1,self_attn.dense,0.0000046095,0.05000,0.893
1,mlp.fc1,0.0002500907,0.05000,0.915
1,mlp.fc2,0.0000168595,0.05000,3.982
2,self_attn.q_proj,0.0001165650,0.05000,0.969
2,self_attn.k_proj,0.0001173934,0.05000,0.950
2,self_attn.v_proj,0.0000463347,0.05000,0.882
2,self_attn.dense,0.0000052613,0.05000,0.881
2,mlp.fc1,0.0004108166,0.05000,1.135
2,mlp.fc2,0.0000199922,0.05000,4.276
3,self_attn.q_proj,0.0001364429,0.05000,0.991
3,self_attn.k_proj,0.0001284486,0.05000,0.984
3,self_attn.v_proj,0.0000970313,0.05000,0.888
3,self_attn.dense,0.0000050054,0.05000,0.920
3,mlp.fc1,0.0006537699,0.05000,0.965
3,mlp.fc2,0.0000279560,0.05000,4.165
4,self_attn.q_proj,0.0001806877,0.05000,1.029
4,self_attn.k_proj,0.0001703575,0.05000,0.915
4,self_attn.v_proj,0.0001177177,0.05000,0.927
4,self_attn.dense,0.0000071838,0.05000,0.914
4,mlp.fc1,0.0006948134,0.05000,0.997
4,mlp.fc2,0.0000382566,0.05000,4.367
5,self_attn.q_proj,0.0001677401,0.05000,1.003
5,self_attn.k_proj,0.0001583099,0.05000,0.936
5,self_attn.v_proj,0.0001066596,0.05000,0.892
5,self_attn.dense,0.0000078510,0.05000,0.975
5,mlp.fc1,0.0006093672,0.05000,1.055
5,mlp.fc2,0.0000421267,0.05000,4.136
6,self_attn.q_proj,0.0002005054,0.05000,1.016
6,self_attn.k_proj,0.0001911783,0.05000,0.982
6,self_attn.v_proj,0.0001320928,0.05000,0.967
6,self_attn.dense,0.0000092071,0.05000,0.945
6,mlp.fc1,0.0006585670,0.05000,0.935
6,mlp.fc2,0.0000462386,0.05000,4.468
7,self_attn.q_proj,0.0002163916,0.05000,1.070
7,self_attn.k_proj,0.0002072118,0.05000,0.937
7,self_attn.v_proj,0.0001352158,0.05000,0.978
7,self_attn.dense,0.0000117110,0.05000,0.970
7,mlp.fc1,0.0006694943,0.05000,0.943
7,mlp.fc2,0.0000498323,0.05000,4.157
8,self_attn.q_proj,0.0002109012,0.05000,0.949
8,self_attn.k_proj,0.0002039318,0.05000,1.241
8,self_attn.v_proj,0.0001560394,0.05000,0.996
8,self_attn.dense,0.0000082801,0.05000,0.990
8,mlp.fc1,0.0006576708,0.05000,1.030
8,mlp.fc2,0.0000524794,0.05000,4.458
9,self_attn.q_proj,0.0002133507,0.05000,1.027
9,self_attn.k_proj,0.0002043295,0.05000,0.955
9,self_attn.v_proj,0.0001553389,0.05000,0.979
9,self_attn.dense,0.0000089070,0.05000,0.967
9,mlp.fc1,0.0006463157,0.05000,1.011
9,mlp.fc2,0.0000528918,0.05000,4.181
10,self_attn.q_proj,0.0002181723,0.05000,0.950
10,self_attn.k_proj,0.0002149413,0.05000,0.952
10,self_attn.v_proj,0.0001367607,0.05000,0.928
10,self_attn.dense,0.0000134973,0.05000,0.896
10,mlp.fc1,0.0006295212,0.05000,0.923
10,mlp.fc2,0.0000522401,0.05000,4.083
11,self_attn.q_proj,0.0002261469,0.05000,0.958
11,self_attn.k_proj,0.0002225379,0.05000,0.977
11,self_attn.v_proj,0.0001492103,0.05000,0.945
11,self_attn.dense,0.0000167664,0.05000,0.914
11,mlp.fc1,0.0006092769,0.05000,0.930
11,mlp.fc2,0.0000528684,0.05000,5.138
12,self_attn.q_proj,0.0002321886,0.05000,0.974
12,self_attn.k_proj,0.0002303848,0.05000,0.891
12,self_attn.v_proj,0.0001530323,0.05000,0.908
12,self_attn.dense,0.0000169518,0.05000,0.920
12,mlp.fc1,0.0006060201,0.05000,0.973
12,mlp.fc2,0.0000549961,0.05000,4.304
13,self_attn.q_proj,0.0002252652,0.05000,0.972
13,self_attn.k_proj,0.0002252355,0.05000,1.009
13,self_attn.v_proj,0.0001491018,0.05000,0.952
13,self_attn.dense,0.0000157061,0.05000,0.996
13,mlp.fc1,0.0006169498,0.05000,1.020
13,mlp.fc2,0.0000539558,0.05000,4.684
14,self_attn.q_proj,0.0002650832,0.05000,1.065
14,self_attn.k_proj,0.0002238111,0.05000,0.999
14,self_attn.v_proj,0.0001467716,0.05000,0.949
14,self_attn.dense,0.0000165920,0.05000,0.983
14,mlp.fc1,0.0006014784,0.05000,0.989
14,mlp.fc2,0.0000545418,0.05000,4.357
15,self_attn.q_proj,0.0002222408,0.05000,0.952
15,self_attn.k_proj,0.0002214731,0.05000,0.935
15,self_attn.v_proj,0.0001403913,0.05000,0.971
15,self_attn.dense,0.0000169734,0.05000,0.912
15,mlp.fc1,0.0005749508,0.05000,0.944
15,mlp.fc2,0.0000612357,0.05000,4.166
16,self_attn.q_proj,0.0002301284,0.05000,1.015
16,self_attn.k_proj,0.0002283591,0.05000,0.881
16,self_attn.v_proj,0.0001480706,0.05000,0.896
16,self_attn.dense,0.0000156473,0.05000,0.876
16,mlp.fc1,0.0005911736,0.05000,0.936
16,mlp.fc2,0.0000615094,0.05000,4.146
17,self_attn.q_proj,0.0002169144,0.05000,0.949
17,self_attn.k_proj,0.0002164072,0.05000,0.980
17,self_attn.v_proj,0.0001373301,0.05000,0.942
17,self_attn.dense,0.0000168942,0.05000,0.929
17,mlp.fc1,0.0005453525,0.05000,0.907
17,mlp.fc2,0.0000619073,0.05000,4.035
18,self_attn.q_proj,0.0002519506,0.05000,0.997
18,self_attn.k_proj,0.0002533842,0.05000,0.974
18,self_attn.v_proj,0.0001425683,0.05000,0.953
18,self_attn.dense,0.0000179922,0.05000,0.886
18,mlp.fc1,0.0005474294,0.05000,0.933
18,mlp.fc2,0.0000634956,0.05000,4.298
19,self_attn.q_proj,0.0002300704,0.05000,1.044
19,self_attn.k_proj,0.0002330887,0.05000,0.926
19,self_attn.v_proj,0.0001444852,0.05000,0.995
19,self_attn.dense,0.0000164025,0.05000,1.168
19,mlp.fc1,0.0005811269,0.05000,1.058
19,mlp.fc2,0.0000723687,0.05000,4.503
20,self_attn.q_proj,0.0002827060,0.05000,1.040
20,self_attn.k_proj,0.0002414499,0.05000,0.943
20,self_attn.v_proj,0.0001363139,0.05000,0.986
20,self_attn.dense,0.0000187169,0.05000,1.034
20,mlp.fc1,0.0005760693,0.05000,1.011
20,mlp.fc2,0.0000753935,0.05000,4.585
21,self_attn.q_proj,0.0002291035,0.05000,1.085
21,self_attn.k_proj,0.0002217587,0.05000,0.947
21,self_attn.v_proj,0.0001625256,0.05000,0.968
21,self_attn.dense,0.0000147600,0.05000,0.959
21,mlp.fc1,0.0006096665,0.05000,1.005
21,mlp.fc2,0.0000837082,0.05000,4.373
22,self_attn.q_proj,0.0002641166,0.05000,1.019
22,self_attn.k_proj,0.0002266009,0.05000,1.127
22,self_attn.v_proj,0.0001701314,0.05000,0.935
22,self_attn.dense,0.0000122861,0.05000,0.906
22,mlp.fc1,0.0006319354,0.05000,0.929
22,mlp.fc2,0.0000845768,0.05000,4.132
23,self_attn.q_proj,0.0002803879,0.05000,0.939
23,self_attn.k_proj,0.0002535842,0.05000,0.996
23,self_attn.v_proj,0.0001640246,0.05000,0.914
23,self_attn.dense,0.0000198861,0.05000,0.889
23,mlp.fc1,0.0006627535,0.05000,0.919
23,mlp.fc2,0.0000945106,0.05000,4.222
24,self_attn.q_proj,0.0002384906,0.05000,0.962
24,self_attn.k_proj,0.0002369107,0.05000,0.904
24,self_attn.v_proj,0.0001989545,0.05000,0.933
24,self_attn.dense,0.0000162029,0.05000,0.887
24,mlp.fc1,0.0007166684,0.05000,0.989
24,mlp.fc2,0.0001029097,0.05000,4.025
25,self_attn.q_proj,0.0003113051,0.05000,1.047
25,self_attn.k_proj,0.0002572589,0.05000,1.003
25,self_attn.v_proj,0.0002068744,0.05000,0.917
25,self_attn.dense,0.0000187007,0.05000,0.979
25,mlp.fc1,0.0007801538,0.05000,0.941
25,mlp.fc2,0.0001016458,0.05000,4.126
26,self_attn.q_proj,0.0003590267,0.05000,0.980
26,self_attn.k_proj,0.0002574304,0.05000,0.954
26,self_attn.v_proj,0.0002369789,0.05000,0.952
26,self_attn.dense,0.0000299120,0.05000,0.937
26,mlp.fc1,0.0007834066,0.05000,0.999
26,mlp.fc2,0.0001124531,0.05000,4.201
27,self_attn.q_proj,0.0003025899,0.05000,0.952
27,self_attn.k_proj,0.0003528239,0.05000,0.908
27,self_attn.v_proj,0.0002532654,0.05000,0.892
27,self_attn.dense,0.0000275395,0.05000,0.961
27,mlp.fc1,0.0008518580,0.05000,0.971
27,mlp.fc2,0.0001470365,0.05000,4.424
28,self_attn.q_proj,0.0002637209,0.05000,1.063
28,self_attn.k_proj,0.0002721585,0.05000,0.953
28,self_attn.v_proj,0.0002665452,0.05000,0.952
28,self_attn.dense,0.0000327637,0.05000,0.881
28,mlp.fc1,0.0008877072,0.05000,0.929
28,mlp.fc2,0.0001765151,0.05000,4.167
29,self_attn.q_proj,0.0037034005,0.05000,0.975
29,self_attn.k_proj,0.0030506286,0.05000,1.012
29,self_attn.v_proj,0.0001793814,0.05000,0.972
29,self_attn.dense,0.0000784153,0.05000,0.954
29,mlp.fc1,0.0012136550,0.05000,1.026
29,mlp.fc2,0.0001923476,0.05000,4.545
30,self_attn.q_proj,0.0124896431,0.05000,1.096
30,self_attn.k_proj,0.0038405387,0.05000,1.110
30,self_attn.v_proj,0.0001383956,0.05000,1.107
30,self_attn.dense,0.0000560131,0.05000,1.004
30,mlp.fc1,0.0013959989,0.05000,1.031
30,mlp.fc2,0.0001954762,0.05000,4.354
31,self_attn.q_proj,0.0038123704,0.05000,0.988
31,self_attn.k_proj,0.0006134240,0.05000,0.890
31,self_attn.v_proj,0.0000717409,0.05000,0.939
31,self_attn.dense,0.0000127410,0.05000,0.895
31,mlp.fc1,0.0007779660,0.05000,0.936
31,mlp.fc2,0.0001298984,0.05000,4.108