File size: 6,025 Bytes
5a2de59 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00409379,0.01000,0.993
0,self_attn.v_proj,0.00072114,0.01000,1.013
0,self_attn.q_proj,0.00414090,0.01000,1.025
0,self_attn.out_proj,0.00001093,0.01000,0.995
0,fc1,0.01083721,0.01000,0.997
0,fc2,0.00014591,0.01000,4.290
1,self_attn.k_proj,0.00460731,0.01000,0.993
1,self_attn.v_proj,0.00057901,0.01000,0.989
1,self_attn.q_proj,0.00501648,0.01000,1.004
1,self_attn.out_proj,0.00000384,0.01000,0.980
1,fc1,0.01723385,0.01000,1.018
1,fc2,0.00027718,0.01000,4.274
2,self_attn.k_proj,0.00625587,0.01000,1.028
2,self_attn.v_proj,0.00100671,0.01000,0.992
2,self_attn.q_proj,0.00620751,0.01000,1.017
2,self_attn.out_proj,0.00001057,0.01000,0.986
2,fc1,0.01686204,0.01000,1.000
2,fc2,0.00013050,0.01000,4.262
3,self_attn.k_proj,0.00688523,0.01000,0.981
3,self_attn.v_proj,0.00138955,0.01000,0.989
3,self_attn.q_proj,0.00759731,0.01000,0.988
3,self_attn.out_proj,0.00001236,0.01000,0.998
3,fc1,0.01656991,0.01000,1.003
3,fc2,0.00012674,0.01000,4.207
4,self_attn.k_proj,0.01033037,0.01000,1.005
4,self_attn.v_proj,0.00170416,0.01000,0.988
4,self_attn.q_proj,0.01105807,0.01000,0.985
4,self_attn.out_proj,0.00002068,0.01000,0.996
4,fc1,0.01853193,0.01000,1.005
4,fc2,0.00013410,0.01000,4.235
5,self_attn.k_proj,0.01293353,0.01000,1.007
5,self_attn.v_proj,0.00222387,0.01000,0.989
5,self_attn.q_proj,0.01334210,0.01000,1.003
5,self_attn.out_proj,0.00002222,0.01000,1.007
5,fc1,0.02076346,0.01000,0.994
5,fc2,0.00014411,0.01000,4.170
6,self_attn.k_proj,0.01992640,0.01000,1.042
6,self_attn.v_proj,0.00283416,0.01000,1.005
6,self_attn.q_proj,0.01790950,0.01000,1.015
6,self_attn.out_proj,0.00004584,0.01000,0.994
6,fc1,0.02586313,0.01000,0.987
6,fc2,0.00019328,0.01000,4.243
7,self_attn.k_proj,0.02163527,0.01000,0.981
7,self_attn.v_proj,0.00339857,0.01000,0.978
7,self_attn.q_proj,0.01917062,0.01000,0.995
7,self_attn.out_proj,0.00005514,0.01000,0.994
7,fc1,0.03230386,0.01000,1.036
7,fc2,0.00027319,0.01000,4.248
8,self_attn.k_proj,0.02458253,0.01000,0.986
8,self_attn.v_proj,0.00393817,0.01000,0.977
8,self_attn.q_proj,0.02009545,0.01000,0.996
8,self_attn.out_proj,0.00007193,0.01000,0.990
8,fc1,0.03901298,0.01000,1.007
8,fc2,0.00036630,0.01000,4.221
9,self_attn.k_proj,0.02626408,0.01000,1.021
9,self_attn.v_proj,0.00449418,0.01000,0.980
9,self_attn.q_proj,0.02207199,0.01000,0.988
9,self_attn.out_proj,0.00009974,0.01000,0.992
9,fc1,0.04441365,0.01000,1.009
9,fc2,0.00049525,0.01000,4.350
10,self_attn.k_proj,0.02680579,0.01000,0.992
10,self_attn.v_proj,0.00567766,0.01000,0.980
10,self_attn.q_proj,0.02212340,0.01000,0.996
10,self_attn.out_proj,0.00013059,0.01000,0.977
10,fc1,0.05002769,0.01000,1.000
10,fc2,0.00073721,0.01000,4.189
11,self_attn.k_proj,0.02718079,0.01000,1.009
11,self_attn.v_proj,0.00700397,0.01000,0.978
11,self_attn.q_proj,0.02239926,0.01000,1.007
11,self_attn.out_proj,0.00017297,0.01000,1.003
11,fc1,0.05576458,0.01000,1.005
11,fc2,0.00095275,0.01000,4.233
12,self_attn.k_proj,0.03069451,0.01000,0.995
12,self_attn.v_proj,0.00774106,0.01000,0.989
12,self_attn.q_proj,0.02362737,0.01000,0.977
12,self_attn.out_proj,0.00025744,0.01000,0.994
12,fc1,0.05810564,0.01000,1.012
12,fc2,0.00123986,0.01000,4.256
13,self_attn.k_proj,0.03295046,0.01000,0.995
13,self_attn.v_proj,0.00860731,0.01000,0.977
13,self_attn.q_proj,0.02428213,0.01000,0.986
13,self_attn.out_proj,0.00027379,0.01000,1.068
13,fc1,0.06419239,0.01000,1.021
13,fc2,0.00162063,0.01000,4.230
14,self_attn.k_proj,0.03117430,0.01000,1.009
14,self_attn.v_proj,0.01099943,0.01000,0.983
14,self_attn.q_proj,0.02365817,0.01000,0.991
14,self_attn.out_proj,0.00030741,0.01000,0.996
14,fc1,0.07080662,0.01000,1.012
14,fc2,0.00221463,0.01000,4.206
15,self_attn.k_proj,0.02812890,0.01000,1.004
15,self_attn.v_proj,0.01401449,0.01000,0.977
15,self_attn.q_proj,0.02391200,0.01000,1.010
15,self_attn.out_proj,0.00029116,0.01000,0.986
15,fc1,0.07525838,0.01000,1.011
15,fc2,0.00280922,0.01000,4.259
16,self_attn.k_proj,0.02830217,0.01000,0.986
16,self_attn.v_proj,0.01540015,0.01000,0.994
16,self_attn.q_proj,0.02135721,0.01000,0.997
16,self_attn.out_proj,0.00044422,0.01000,0.996
16,fc1,0.08256883,0.01000,1.011
16,fc2,0.00352829,0.01000,4.263
17,self_attn.k_proj,0.02758769,0.01000,1.023
17,self_attn.v_proj,0.01700824,0.01000,0.972
17,self_attn.q_proj,0.02158560,0.01000,0.995
17,self_attn.out_proj,0.00051447,0.01000,0.989
17,fc1,0.09083328,0.01000,0.998
17,fc2,0.00448523,0.01000,4.202
18,self_attn.k_proj,0.02513609,0.01000,0.985
18,self_attn.v_proj,0.01950069,0.01000,0.998
18,self_attn.q_proj,0.02091608,0.01000,0.986
18,self_attn.out_proj,0.00059864,0.01000,1.026
18,fc1,0.09597015,0.01000,0.994
18,fc2,0.00544927,0.01000,4.187
19,self_attn.k_proj,0.02561334,0.01000,1.077
19,self_attn.v_proj,0.02522137,0.01000,1.002
19,self_attn.q_proj,0.02101323,0.01000,1.015
19,self_attn.out_proj,0.00087916,0.01000,0.984
19,fc1,0.10437368,0.01000,0.997
19,fc2,0.00673680,0.01000,4.163
20,self_attn.k_proj,0.02653702,0.01000,0.983
20,self_attn.v_proj,0.02878364,0.01000,0.993
20,self_attn.q_proj,0.02050654,0.01000,0.975
20,self_attn.out_proj,0.00057599,0.01000,0.986
20,fc1,0.10855858,0.01000,0.998
20,fc2,0.00745274,0.01000,4.255
21,self_attn.k_proj,0.02398171,0.01000,1.003
21,self_attn.v_proj,0.02851950,0.01000,0.985
21,self_attn.q_proj,0.02189942,0.01000,0.983
21,self_attn.out_proj,0.00025027,0.01000,0.998
21,fc1,0.10575759,0.01000,0.985
21,fc2,0.00817760,0.01000,4.237
22,self_attn.k_proj,0.02366718,0.01000,0.994
22,self_attn.v_proj,0.03047793,0.01000,0.985
22,self_attn.q_proj,0.02532681,0.01000,0.996
22,self_attn.out_proj,0.00129898,0.01000,1.022
22,fc1,0.10098480,0.01000,1.009
22,fc2,0.00862298,0.01000,4.217
23,self_attn.k_proj,0.02841244,0.01000,1.030
23,self_attn.v_proj,0.02046534,0.01000,1.014
23,self_attn.q_proj,0.05300370,0.01000,1.000
23,self_attn.out_proj,0.00440506,0.01000,0.987
23,fc1,0.09355172,0.01000,1.001
23,fc2,0.00552451,0.01000,4.275
|