opt-1.3b-random-b / quant_log.csv
iproskurina's picture
Add files using upload-large-folder tool
5a2de59 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.00409379,0.01000,0.993
0,self_attn.v_proj,0.00072114,0.01000,1.013
0,self_attn.q_proj,0.00414090,0.01000,1.025
0,self_attn.out_proj,0.00001093,0.01000,0.995
0,fc1,0.01083721,0.01000,0.997
0,fc2,0.00014591,0.01000,4.290
1,self_attn.k_proj,0.00460731,0.01000,0.993
1,self_attn.v_proj,0.00057901,0.01000,0.989
1,self_attn.q_proj,0.00501648,0.01000,1.004
1,self_attn.out_proj,0.00000384,0.01000,0.980
1,fc1,0.01723385,0.01000,1.018
1,fc2,0.00027718,0.01000,4.274
2,self_attn.k_proj,0.00625587,0.01000,1.028
2,self_attn.v_proj,0.00100671,0.01000,0.992
2,self_attn.q_proj,0.00620751,0.01000,1.017
2,self_attn.out_proj,0.00001057,0.01000,0.986
2,fc1,0.01686204,0.01000,1.000
2,fc2,0.00013050,0.01000,4.262
3,self_attn.k_proj,0.00688523,0.01000,0.981
3,self_attn.v_proj,0.00138955,0.01000,0.989
3,self_attn.q_proj,0.00759731,0.01000,0.988
3,self_attn.out_proj,0.00001236,0.01000,0.998
3,fc1,0.01656991,0.01000,1.003
3,fc2,0.00012674,0.01000,4.207
4,self_attn.k_proj,0.01033037,0.01000,1.005
4,self_attn.v_proj,0.00170416,0.01000,0.988
4,self_attn.q_proj,0.01105807,0.01000,0.985
4,self_attn.out_proj,0.00002068,0.01000,0.996
4,fc1,0.01853193,0.01000,1.005
4,fc2,0.00013410,0.01000,4.235
5,self_attn.k_proj,0.01293353,0.01000,1.007
5,self_attn.v_proj,0.00222387,0.01000,0.989
5,self_attn.q_proj,0.01334210,0.01000,1.003
5,self_attn.out_proj,0.00002222,0.01000,1.007
5,fc1,0.02076346,0.01000,0.994
5,fc2,0.00014411,0.01000,4.170
6,self_attn.k_proj,0.01992640,0.01000,1.042
6,self_attn.v_proj,0.00283416,0.01000,1.005
6,self_attn.q_proj,0.01790950,0.01000,1.015
6,self_attn.out_proj,0.00004584,0.01000,0.994
6,fc1,0.02586313,0.01000,0.987
6,fc2,0.00019328,0.01000,4.243
7,self_attn.k_proj,0.02163527,0.01000,0.981
7,self_attn.v_proj,0.00339857,0.01000,0.978
7,self_attn.q_proj,0.01917062,0.01000,0.995
7,self_attn.out_proj,0.00005514,0.01000,0.994
7,fc1,0.03230386,0.01000,1.036
7,fc2,0.00027319,0.01000,4.248
8,self_attn.k_proj,0.02458253,0.01000,0.986
8,self_attn.v_proj,0.00393817,0.01000,0.977
8,self_attn.q_proj,0.02009545,0.01000,0.996
8,self_attn.out_proj,0.00007193,0.01000,0.990
8,fc1,0.03901298,0.01000,1.007
8,fc2,0.00036630,0.01000,4.221
9,self_attn.k_proj,0.02626408,0.01000,1.021
9,self_attn.v_proj,0.00449418,0.01000,0.980
9,self_attn.q_proj,0.02207199,0.01000,0.988
9,self_attn.out_proj,0.00009974,0.01000,0.992
9,fc1,0.04441365,0.01000,1.009
9,fc2,0.00049525,0.01000,4.350
10,self_attn.k_proj,0.02680579,0.01000,0.992
10,self_attn.v_proj,0.00567766,0.01000,0.980
10,self_attn.q_proj,0.02212340,0.01000,0.996
10,self_attn.out_proj,0.00013059,0.01000,0.977
10,fc1,0.05002769,0.01000,1.000
10,fc2,0.00073721,0.01000,4.189
11,self_attn.k_proj,0.02718079,0.01000,1.009
11,self_attn.v_proj,0.00700397,0.01000,0.978
11,self_attn.q_proj,0.02239926,0.01000,1.007
11,self_attn.out_proj,0.00017297,0.01000,1.003
11,fc1,0.05576458,0.01000,1.005
11,fc2,0.00095275,0.01000,4.233
12,self_attn.k_proj,0.03069451,0.01000,0.995
12,self_attn.v_proj,0.00774106,0.01000,0.989
12,self_attn.q_proj,0.02362737,0.01000,0.977
12,self_attn.out_proj,0.00025744,0.01000,0.994
12,fc1,0.05810564,0.01000,1.012
12,fc2,0.00123986,0.01000,4.256
13,self_attn.k_proj,0.03295046,0.01000,0.995
13,self_attn.v_proj,0.00860731,0.01000,0.977
13,self_attn.q_proj,0.02428213,0.01000,0.986
13,self_attn.out_proj,0.00027379,0.01000,1.068
13,fc1,0.06419239,0.01000,1.021
13,fc2,0.00162063,0.01000,4.230
14,self_attn.k_proj,0.03117430,0.01000,1.009
14,self_attn.v_proj,0.01099943,0.01000,0.983
14,self_attn.q_proj,0.02365817,0.01000,0.991
14,self_attn.out_proj,0.00030741,0.01000,0.996
14,fc1,0.07080662,0.01000,1.012
14,fc2,0.00221463,0.01000,4.206
15,self_attn.k_proj,0.02812890,0.01000,1.004
15,self_attn.v_proj,0.01401449,0.01000,0.977
15,self_attn.q_proj,0.02391200,0.01000,1.010
15,self_attn.out_proj,0.00029116,0.01000,0.986
15,fc1,0.07525838,0.01000,1.011
15,fc2,0.00280922,0.01000,4.259
16,self_attn.k_proj,0.02830217,0.01000,0.986
16,self_attn.v_proj,0.01540015,0.01000,0.994
16,self_attn.q_proj,0.02135721,0.01000,0.997
16,self_attn.out_proj,0.00044422,0.01000,0.996
16,fc1,0.08256883,0.01000,1.011
16,fc2,0.00352829,0.01000,4.263
17,self_attn.k_proj,0.02758769,0.01000,1.023
17,self_attn.v_proj,0.01700824,0.01000,0.972
17,self_attn.q_proj,0.02158560,0.01000,0.995
17,self_attn.out_proj,0.00051447,0.01000,0.989
17,fc1,0.09083328,0.01000,0.998
17,fc2,0.00448523,0.01000,4.202
18,self_attn.k_proj,0.02513609,0.01000,0.985
18,self_attn.v_proj,0.01950069,0.01000,0.998
18,self_attn.q_proj,0.02091608,0.01000,0.986
18,self_attn.out_proj,0.00059864,0.01000,1.026
18,fc1,0.09597015,0.01000,0.994
18,fc2,0.00544927,0.01000,4.187
19,self_attn.k_proj,0.02561334,0.01000,1.077
19,self_attn.v_proj,0.02522137,0.01000,1.002
19,self_attn.q_proj,0.02101323,0.01000,1.015
19,self_attn.out_proj,0.00087916,0.01000,0.984
19,fc1,0.10437368,0.01000,0.997
19,fc2,0.00673680,0.01000,4.163
20,self_attn.k_proj,0.02653702,0.01000,0.983
20,self_attn.v_proj,0.02878364,0.01000,0.993
20,self_attn.q_proj,0.02050654,0.01000,0.975
20,self_attn.out_proj,0.00057599,0.01000,0.986
20,fc1,0.10855858,0.01000,0.998
20,fc2,0.00745274,0.01000,4.255
21,self_attn.k_proj,0.02398171,0.01000,1.003
21,self_attn.v_proj,0.02851950,0.01000,0.985
21,self_attn.q_proj,0.02189942,0.01000,0.983
21,self_attn.out_proj,0.00025027,0.01000,0.998
21,fc1,0.10575759,0.01000,0.985
21,fc2,0.00817760,0.01000,4.237
22,self_attn.k_proj,0.02366718,0.01000,0.994
22,self_attn.v_proj,0.03047793,0.01000,0.985
22,self_attn.q_proj,0.02532681,0.01000,0.996
22,self_attn.out_proj,0.00129898,0.01000,1.022
22,fc1,0.10098480,0.01000,1.009
22,fc2,0.00862298,0.01000,4.217
23,self_attn.k_proj,0.02841244,0.01000,1.030
23,self_attn.v_proj,0.02046534,0.01000,1.014
23,self_attn.q_proj,0.05300370,0.01000,1.000
23,self_attn.out_proj,0.00440506,0.01000,0.987
23,fc1,0.09355172,0.01000,1.001
23,fc2,0.00552451,0.01000,4.275