opt-1.3b-test2 / quant_log.csv
iproskurina's picture
Add files using upload-large-folder tool
0ae92f3 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.01193101,0.01000,1.103
0,self_attn.v_proj,0.00204742,0.01000,0.744
0,self_attn.q_proj,0.01151794,0.01000,0.754
0,self_attn.out_proj,0.00000879,0.01000,0.743
0,fc1,0.07220605,0.01000,0.762
0,fc2,0.00009904,0.01000,3.275
1,self_attn.k_proj,0.02748547,0.01000,0.762
1,self_attn.v_proj,0.00377348,0.01000,0.761
1,self_attn.q_proj,0.03053766,0.01000,0.761
1,self_attn.out_proj,0.00000212,0.01000,0.765
1,fc1,0.10564113,0.01000,0.772
1,fc2,0.00011769,0.01000,3.326
2,self_attn.k_proj,0.03364365,0.01000,0.780
2,self_attn.v_proj,0.00638163,0.01000,0.773
2,self_attn.q_proj,0.03404787,0.01000,0.764
2,self_attn.out_proj,0.00000442,0.01000,0.764
2,fc1,0.10685527,0.01000,0.769
2,fc2,0.00007892,0.01000,3.315
3,self_attn.k_proj,0.03226093,0.01000,0.768
3,self_attn.v_proj,0.00772221,0.01000,0.770
3,self_attn.q_proj,0.03518277,0.01000,0.769
3,self_attn.out_proj,0.00000809,0.01000,0.762
3,fc1,0.09162843,0.01000,0.785
3,fc2,0.00007157,0.01000,3.323
4,self_attn.k_proj,0.03976664,0.01000,0.773
4,self_attn.v_proj,0.00833308,0.01000,0.757
4,self_attn.q_proj,0.04298474,0.01000,0.751
4,self_attn.out_proj,0.00001194,0.01000,0.764
4,fc1,0.08744164,0.01000,0.768
4,fc2,0.00008075,0.01000,3.306
5,self_attn.k_proj,0.04211287,0.01000,0.778
5,self_attn.v_proj,0.00969345,0.01000,0.761
5,self_attn.q_proj,0.04678004,0.01000,0.765
5,self_attn.out_proj,0.00001155,0.01000,0.761
5,fc1,0.08947679,0.01000,0.771
5,fc2,0.00009699,0.01000,3.314
6,self_attn.k_proj,0.06050922,0.01000,0.772
6,self_attn.v_proj,0.01090727,0.01000,0.778
6,self_attn.q_proj,0.05891616,0.01000,0.763
6,self_attn.out_proj,0.00003464,0.01000,0.765
6,fc1,0.09683321,0.01000,0.767
6,fc2,0.00013900,0.01000,3.308
7,self_attn.k_proj,0.06143640,0.01000,0.770
7,self_attn.v_proj,0.01166906,0.01000,0.755
7,self_attn.q_proj,0.05640485,0.01000,0.768
7,self_attn.out_proj,0.00004408,0.01000,0.767
7,fc1,0.10895248,0.01000,0.764
7,fc2,0.00020347,0.01000,3.324
8,self_attn.k_proj,0.06507521,0.01000,0.763
8,self_attn.v_proj,0.01208323,0.01000,0.767
8,self_attn.q_proj,0.05399566,0.01000,0.769
8,self_attn.out_proj,0.00005616,0.01000,0.763
8,fc1,0.11881161,0.01000,0.765
8,fc2,0.00026443,0.01000,3.316
9,self_attn.k_proj,0.06506123,0.01000,0.771
9,self_attn.v_proj,0.01248781,0.01000,0.764
9,self_attn.q_proj,0.05453248,0.01000,0.770
9,self_attn.out_proj,0.00007938,0.01000,0.764
9,fc1,0.12274915,0.01000,0.785
9,fc2,0.00035536,0.01000,3.319
10,self_attn.k_proj,0.06140727,0.01000,0.776
10,self_attn.v_proj,0.01420014,0.01000,0.780
10,self_attn.q_proj,0.05016806,0.01000,0.786
10,self_attn.out_proj,0.00011017,0.01000,0.762
10,fc1,0.12526228,0.01000,0.773
10,fc2,0.00056714,0.01000,3.312
11,self_attn.k_proj,0.05852431,0.01000,0.772
11,self_attn.v_proj,0.01596023,0.01000,0.753
11,self_attn.q_proj,0.04750057,0.01000,0.761
11,self_attn.out_proj,0.00014029,0.01000,0.755
11,fc1,0.12785329,0.01000,0.780
11,fc2,0.00075469,0.01000,3.314
12,self_attn.k_proj,0.06211779,0.01000,0.768
12,self_attn.v_proj,0.01650352,0.01000,0.770
12,self_attn.q_proj,0.04717031,0.01000,0.785
12,self_attn.out_proj,0.00022129,0.01000,0.764
12,fc1,0.12406510,0.01000,0.778
12,fc2,0.00102223,0.01000,3.306
13,self_attn.k_proj,0.06443056,0.01000,0.776
13,self_attn.v_proj,0.01726957,0.01000,0.753
13,self_attn.q_proj,0.04661303,0.01000,0.762
13,self_attn.out_proj,0.00023633,0.01000,0.757
13,fc1,0.13054048,0.01000,0.784
13,fc2,0.00139816,0.01000,3.359
14,self_attn.k_proj,0.05847587,0.01000,0.770
14,self_attn.v_proj,0.02090536,0.01000,0.769
14,self_attn.q_proj,0.04376426,0.01000,0.761
14,self_attn.out_proj,0.00027757,0.01000,0.763
14,fc1,0.13830929,0.01000,0.767
14,fc2,0.00192462,0.01000,3.332
15,self_attn.k_proj,0.05246258,0.01000,0.776
15,self_attn.v_proj,0.02610055,0.01000,0.768
15,self_attn.q_proj,0.04327298,0.01000,0.762
15,self_attn.out_proj,0.00027173,0.01000,0.762
15,fc1,0.14475755,0.01000,0.780
15,fc2,0.00244589,0.01000,3.317
16,self_attn.k_proj,0.05219132,0.01000,0.768
16,self_attn.v_proj,0.02799954,0.01000,0.759
16,self_attn.q_proj,0.03783621,0.01000,0.764
16,self_attn.out_proj,0.00039026,0.01000,0.765
16,fc1,0.15572587,0.01000,0.795
16,fc2,0.00316169,0.01000,3.313
17,self_attn.k_proj,0.05054565,0.01000,0.766
17,self_attn.v_proj,0.03031302,0.01000,0.769
17,self_attn.q_proj,0.03752312,0.01000,0.770
17,self_attn.out_proj,0.00044570,0.01000,0.768
17,fc1,0.16843134,0.01000,0.771
17,fc2,0.00403455,0.01000,3.313
18,self_attn.k_proj,0.04542822,0.01000,0.773
18,self_attn.v_proj,0.03442155,0.01000,0.762
18,self_attn.q_proj,0.03605321,0.01000,0.765
18,self_attn.out_proj,0.00050592,0.01000,0.759
18,fc1,0.17868196,0.01000,0.768
18,fc2,0.00501038,0.01000,3.326
19,self_attn.k_proj,0.04690968,0.01000,0.766
19,self_attn.v_proj,0.04475790,0.01000,0.766
19,self_attn.q_proj,0.03639612,0.01000,0.761
19,self_attn.out_proj,0.00078457,0.01000,0.748
19,fc1,0.19376262,0.01000,0.783
19,fc2,0.00626677,0.01000,3.340
20,self_attn.k_proj,0.04897357,0.01000,0.764
20,self_attn.v_proj,0.05148327,0.01000,0.758
20,self_attn.q_proj,0.03587547,0.01000,0.761
20,self_attn.out_proj,0.00091725,0.01000,0.764
20,fc1,0.20390676,0.01000,0.769
20,fc2,0.00819971,0.01000,3.323
21,self_attn.k_proj,0.04592828,0.01000,0.775
21,self_attn.v_proj,0.05410574,0.01000,0.763
21,self_attn.q_proj,0.04011959,0.01000,0.771
21,self_attn.out_proj,0.00081666,0.01000,0.768
21,fc1,0.20928091,0.01000,0.783
21,fc2,0.00960784,0.01000,3.343
22,self_attn.k_proj,0.04860422,0.01000,0.769
22,self_attn.v_proj,0.06308914,0.01000,0.767
22,self_attn.q_proj,0.05071734,0.01000,0.762
22,self_attn.out_proj,0.00084933,0.01000,0.756
22,fc1,0.21024571,0.01000,0.760
22,fc2,0.01009148,0.01000,3.305
23,self_attn.k_proj,0.07043971,0.01000,0.771
23,self_attn.v_proj,0.04643616,0.01000,0.758
23,self_attn.q_proj,0.11800774,0.01000,0.758
23,self_attn.out_proj,0.00239992,0.01000,0.768
23,fc1,0.20430349,0.01000,0.770
23,fc2,0.00738119,0.01000,3.345