File size: 6,025 Bytes
0ae92f3 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.01193101,0.01000,1.103
0,self_attn.v_proj,0.00204742,0.01000,0.744
0,self_attn.q_proj,0.01151794,0.01000,0.754
0,self_attn.out_proj,0.00000879,0.01000,0.743
0,fc1,0.07220605,0.01000,0.762
0,fc2,0.00009904,0.01000,3.275
1,self_attn.k_proj,0.02748547,0.01000,0.762
1,self_attn.v_proj,0.00377348,0.01000,0.761
1,self_attn.q_proj,0.03053766,0.01000,0.761
1,self_attn.out_proj,0.00000212,0.01000,0.765
1,fc1,0.10564113,0.01000,0.772
1,fc2,0.00011769,0.01000,3.326
2,self_attn.k_proj,0.03364365,0.01000,0.780
2,self_attn.v_proj,0.00638163,0.01000,0.773
2,self_attn.q_proj,0.03404787,0.01000,0.764
2,self_attn.out_proj,0.00000442,0.01000,0.764
2,fc1,0.10685527,0.01000,0.769
2,fc2,0.00007892,0.01000,3.315
3,self_attn.k_proj,0.03226093,0.01000,0.768
3,self_attn.v_proj,0.00772221,0.01000,0.770
3,self_attn.q_proj,0.03518277,0.01000,0.769
3,self_attn.out_proj,0.00000809,0.01000,0.762
3,fc1,0.09162843,0.01000,0.785
3,fc2,0.00007157,0.01000,3.323
4,self_attn.k_proj,0.03976664,0.01000,0.773
4,self_attn.v_proj,0.00833308,0.01000,0.757
4,self_attn.q_proj,0.04298474,0.01000,0.751
4,self_attn.out_proj,0.00001194,0.01000,0.764
4,fc1,0.08744164,0.01000,0.768
4,fc2,0.00008075,0.01000,3.306
5,self_attn.k_proj,0.04211287,0.01000,0.778
5,self_attn.v_proj,0.00969345,0.01000,0.761
5,self_attn.q_proj,0.04678004,0.01000,0.765
5,self_attn.out_proj,0.00001155,0.01000,0.761
5,fc1,0.08947679,0.01000,0.771
5,fc2,0.00009699,0.01000,3.314
6,self_attn.k_proj,0.06050922,0.01000,0.772
6,self_attn.v_proj,0.01090727,0.01000,0.778
6,self_attn.q_proj,0.05891616,0.01000,0.763
6,self_attn.out_proj,0.00003464,0.01000,0.765
6,fc1,0.09683321,0.01000,0.767
6,fc2,0.00013900,0.01000,3.308
7,self_attn.k_proj,0.06143640,0.01000,0.770
7,self_attn.v_proj,0.01166906,0.01000,0.755
7,self_attn.q_proj,0.05640485,0.01000,0.768
7,self_attn.out_proj,0.00004408,0.01000,0.767
7,fc1,0.10895248,0.01000,0.764
7,fc2,0.00020347,0.01000,3.324
8,self_attn.k_proj,0.06507521,0.01000,0.763
8,self_attn.v_proj,0.01208323,0.01000,0.767
8,self_attn.q_proj,0.05399566,0.01000,0.769
8,self_attn.out_proj,0.00005616,0.01000,0.763
8,fc1,0.11881161,0.01000,0.765
8,fc2,0.00026443,0.01000,3.316
9,self_attn.k_proj,0.06506123,0.01000,0.771
9,self_attn.v_proj,0.01248781,0.01000,0.764
9,self_attn.q_proj,0.05453248,0.01000,0.770
9,self_attn.out_proj,0.00007938,0.01000,0.764
9,fc1,0.12274915,0.01000,0.785
9,fc2,0.00035536,0.01000,3.319
10,self_attn.k_proj,0.06140727,0.01000,0.776
10,self_attn.v_proj,0.01420014,0.01000,0.780
10,self_attn.q_proj,0.05016806,0.01000,0.786
10,self_attn.out_proj,0.00011017,0.01000,0.762
10,fc1,0.12526228,0.01000,0.773
10,fc2,0.00056714,0.01000,3.312
11,self_attn.k_proj,0.05852431,0.01000,0.772
11,self_attn.v_proj,0.01596023,0.01000,0.753
11,self_attn.q_proj,0.04750057,0.01000,0.761
11,self_attn.out_proj,0.00014029,0.01000,0.755
11,fc1,0.12785329,0.01000,0.780
11,fc2,0.00075469,0.01000,3.314
12,self_attn.k_proj,0.06211779,0.01000,0.768
12,self_attn.v_proj,0.01650352,0.01000,0.770
12,self_attn.q_proj,0.04717031,0.01000,0.785
12,self_attn.out_proj,0.00022129,0.01000,0.764
12,fc1,0.12406510,0.01000,0.778
12,fc2,0.00102223,0.01000,3.306
13,self_attn.k_proj,0.06443056,0.01000,0.776
13,self_attn.v_proj,0.01726957,0.01000,0.753
13,self_attn.q_proj,0.04661303,0.01000,0.762
13,self_attn.out_proj,0.00023633,0.01000,0.757
13,fc1,0.13054048,0.01000,0.784
13,fc2,0.00139816,0.01000,3.359
14,self_attn.k_proj,0.05847587,0.01000,0.770
14,self_attn.v_proj,0.02090536,0.01000,0.769
14,self_attn.q_proj,0.04376426,0.01000,0.761
14,self_attn.out_proj,0.00027757,0.01000,0.763
14,fc1,0.13830929,0.01000,0.767
14,fc2,0.00192462,0.01000,3.332
15,self_attn.k_proj,0.05246258,0.01000,0.776
15,self_attn.v_proj,0.02610055,0.01000,0.768
15,self_attn.q_proj,0.04327298,0.01000,0.762
15,self_attn.out_proj,0.00027173,0.01000,0.762
15,fc1,0.14475755,0.01000,0.780
15,fc2,0.00244589,0.01000,3.317
16,self_attn.k_proj,0.05219132,0.01000,0.768
16,self_attn.v_proj,0.02799954,0.01000,0.759
16,self_attn.q_proj,0.03783621,0.01000,0.764
16,self_attn.out_proj,0.00039026,0.01000,0.765
16,fc1,0.15572587,0.01000,0.795
16,fc2,0.00316169,0.01000,3.313
17,self_attn.k_proj,0.05054565,0.01000,0.766
17,self_attn.v_proj,0.03031302,0.01000,0.769
17,self_attn.q_proj,0.03752312,0.01000,0.770
17,self_attn.out_proj,0.00044570,0.01000,0.768
17,fc1,0.16843134,0.01000,0.771
17,fc2,0.00403455,0.01000,3.313
18,self_attn.k_proj,0.04542822,0.01000,0.773
18,self_attn.v_proj,0.03442155,0.01000,0.762
18,self_attn.q_proj,0.03605321,0.01000,0.765
18,self_attn.out_proj,0.00050592,0.01000,0.759
18,fc1,0.17868196,0.01000,0.768
18,fc2,0.00501038,0.01000,3.326
19,self_attn.k_proj,0.04690968,0.01000,0.766
19,self_attn.v_proj,0.04475790,0.01000,0.766
19,self_attn.q_proj,0.03639612,0.01000,0.761
19,self_attn.out_proj,0.00078457,0.01000,0.748
19,fc1,0.19376262,0.01000,0.783
19,fc2,0.00626677,0.01000,3.340
20,self_attn.k_proj,0.04897357,0.01000,0.764
20,self_attn.v_proj,0.05148327,0.01000,0.758
20,self_attn.q_proj,0.03587547,0.01000,0.761
20,self_attn.out_proj,0.00091725,0.01000,0.764
20,fc1,0.20390676,0.01000,0.769
20,fc2,0.00819971,0.01000,3.323
21,self_attn.k_proj,0.04592828,0.01000,0.775
21,self_attn.v_proj,0.05410574,0.01000,0.763
21,self_attn.q_proj,0.04011959,0.01000,0.771
21,self_attn.out_proj,0.00081666,0.01000,0.768
21,fc1,0.20928091,0.01000,0.783
21,fc2,0.00960784,0.01000,3.343
22,self_attn.k_proj,0.04860422,0.01000,0.769
22,self_attn.v_proj,0.06308914,0.01000,0.767
22,self_attn.q_proj,0.05071734,0.01000,0.762
22,self_attn.out_proj,0.00084933,0.01000,0.756
22,fc1,0.21024571,0.01000,0.760
22,fc2,0.01009148,0.01000,3.305
23,self_attn.k_proj,0.07043971,0.01000,0.771
23,self_attn.v_proj,0.04643616,0.01000,0.758
23,self_attn.q_proj,0.11800774,0.01000,0.758
23,self_attn.out_proj,0.00239992,0.01000,0.768
23,fc1,0.20430349,0.01000,0.770
23,fc2,0.00738119,0.01000,3.345
|