File size: 6,025 Bytes
2c8413d | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00409379,0.01000,1.000
0,self_attn.v_proj,0.00072114,0.01000,1.006
0,self_attn.q_proj,0.00414090,0.01000,0.980
0,self_attn.out_proj,0.00001473,0.01000,1.009
0,fc1,0.00906052,0.01000,0.986
0,fc2,0.00011689,0.01000,4.245
1,self_attn.k_proj,0.00241560,0.01000,0.998
1,self_attn.v_proj,0.00030304,0.01000,0.979
1,self_attn.q_proj,0.00263582,0.01000,0.991
1,self_attn.out_proj,0.00001348,0.01000,0.990
1,fc1,0.00911925,0.01000,1.001
1,fc2,0.00113884,0.01000,4.272
2,self_attn.k_proj,0.00382860,0.01000,1.008
2,self_attn.v_proj,0.00054063,0.01000,0.996
2,self_attn.q_proj,0.00378607,0.01000,0.999
2,self_attn.out_proj,0.00000811,0.01000,0.978
2,fc1,0.01030087,0.01000,1.010
2,fc2,0.00010722,0.01000,4.167
3,self_attn.k_proj,0.00392859,0.01000,0.990
3,self_attn.v_proj,0.00063046,0.01000,0.989
3,self_attn.q_proj,0.00420090,0.01000,0.973
3,self_attn.out_proj,0.00001649,0.01000,1.002
3,fc1,0.00846032,0.01000,0.985
3,fc2,0.00012199,0.01000,4.221
4,self_attn.k_proj,0.00556619,0.01000,0.996
4,self_attn.v_proj,0.00072275,0.01000,0.987
4,self_attn.q_proj,0.00558837,0.01000,0.993
4,self_attn.out_proj,0.00001731,0.01000,1.013
4,fc1,0.00879328,0.01000,0.989
4,fc2,0.00011329,0.01000,4.202
5,self_attn.k_proj,0.00716568,0.01000,0.991
5,self_attn.v_proj,0.00093275,0.01000,0.987
5,self_attn.q_proj,0.00673818,0.01000,1.002
5,self_attn.out_proj,0.00003818,0.01000,1.005
5,fc1,0.01022671,0.01000,0.978
5,fc2,0.00017304,0.01000,4.199
6,self_attn.k_proj,0.01196123,0.01000,1.025
6,self_attn.v_proj,0.00122724,0.01000,1.007
6,self_attn.q_proj,0.00925438,0.01000,1.007
6,self_attn.out_proj,0.00006164,0.01000,1.004
6,fc1,0.01337742,0.01000,0.994
6,fc2,0.00021436,0.01000,4.231
7,self_attn.k_proj,0.01336243,0.01000,0.995
7,self_attn.v_proj,0.00149999,0.01000,0.978
7,self_attn.q_proj,0.01013738,0.01000,0.991
7,self_attn.out_proj,0.00006549,0.01000,0.991
7,fc1,0.01671198,0.01000,0.994
7,fc2,0.00019174,0.01000,4.216
8,self_attn.k_proj,0.01508483,0.01000,0.983
8,self_attn.v_proj,0.00175653,0.01000,1.034
8,self_attn.q_proj,0.01071484,0.01000,0.995
8,self_attn.out_proj,0.00006830,0.01000,0.985
8,fc1,0.01985171,0.01000,0.993
8,fc2,0.00024323,0.01000,4.181
9,self_attn.k_proj,0.01629625,0.01000,0.994
9,self_attn.v_proj,0.00207414,0.01000,0.989
9,self_attn.q_proj,0.01226537,0.01000,0.987
9,self_attn.out_proj,0.00007884,0.01000,1.017
9,fc1,0.02325909,0.01000,0.996
9,fc2,0.00029927,0.01000,4.260
10,self_attn.k_proj,0.01694436,0.01000,0.984
10,self_attn.v_proj,0.00279443,0.01000,1.003
10,self_attn.q_proj,0.01290223,0.01000,1.009
10,self_attn.out_proj,0.00008043,0.01000,0.984
10,fc1,0.02705885,0.01000,1.041
10,fc2,0.00040550,0.01000,4.158
11,self_attn.k_proj,0.01743016,0.01000,0.992
11,self_attn.v_proj,0.00366602,0.01000,0.991
11,self_attn.q_proj,0.01367142,0.01000,1.000
11,self_attn.out_proj,0.00010108,0.01000,0.988
11,fc1,0.03210959,0.01000,1.008
11,fc2,0.00055330,0.01000,4.275
12,self_attn.k_proj,0.02062906,0.01000,0.982
12,self_attn.v_proj,0.00437126,0.01000,0.979
12,self_attn.q_proj,0.01520991,0.01000,0.995
12,self_attn.out_proj,0.00014373,0.01000,0.980
12,fc1,0.03572238,0.01000,1.010
12,fc2,0.00066190,0.01000,4.168
13,self_attn.k_proj,0.02250100,0.01000,0.984
13,self_attn.v_proj,0.00493668,0.01000,1.048
13,self_attn.q_proj,0.01598719,0.01000,1.047
13,self_attn.out_proj,0.00015132,0.01000,0.999
13,fc1,0.03995991,0.01000,1.019
13,fc2,0.00083408,0.01000,4.255
14,self_attn.k_proj,0.02120009,0.01000,0.979
14,self_attn.v_proj,0.00648613,0.01000,0.987
14,self_attn.q_proj,0.01573154,0.01000,0.990
14,self_attn.out_proj,0.00017486,0.01000,1.005
14,fc1,0.04477219,0.01000,0.981
14,fc2,0.00120158,0.01000,4.182
15,self_attn.k_proj,0.01888706,0.01000,0.996
15,self_attn.v_proj,0.00828507,0.01000,0.989
15,self_attn.q_proj,0.01590251,0.01000,1.019
15,self_attn.out_proj,0.00018840,0.01000,1.015
15,fc1,0.04777357,0.01000,1.004
15,fc2,0.00149223,0.01000,4.271
16,self_attn.k_proj,0.01895629,0.01000,0.994
16,self_attn.v_proj,0.00919615,0.01000,0.988
16,self_attn.q_proj,0.01408941,0.01000,0.987
16,self_attn.out_proj,0.00027497,0.01000,0.993
16,fc1,0.05255585,0.01000,0.994
16,fc2,0.00180443,0.01000,4.196
17,self_attn.k_proj,0.01800555,0.01000,0.990
17,self_attn.v_proj,0.01010960,0.01000,0.976
17,self_attn.q_proj,0.01410830,0.01000,0.985
17,self_attn.out_proj,0.00029745,0.01000,0.998
17,fc1,0.05777301,0.01000,1.011
17,fc2,0.00218752,0.01000,4.182
18,self_attn.k_proj,0.01598491,0.01000,1.027
18,self_attn.v_proj,0.01118781,0.01000,0.995
18,self_attn.q_proj,0.01337853,0.01000,0.999
18,self_attn.out_proj,0.00052338,0.01000,0.985
18,fc1,0.05900865,0.01000,1.069
18,fc2,0.00268790,0.01000,4.194
19,self_attn.k_proj,0.01571657,0.01000,0.997
19,self_attn.v_proj,0.01393012,0.01000,1.016
19,self_attn.q_proj,0.01293182,0.01000,0.997
19,self_attn.out_proj,0.00089465,0.01000,1.000
19,fc1,0.06260797,0.01000,1.066
19,fc2,0.00281360,0.01000,4.196
20,self_attn.k_proj,0.01550068,0.01000,0.983
20,self_attn.v_proj,0.01531409,0.01000,0.990
20,self_attn.q_proj,0.01223863,0.01000,1.027
20,self_attn.out_proj,0.00108642,0.01000,1.043
20,fc1,0.06158617,0.01000,0.997
20,fc2,0.00320006,0.01000,4.245
21,self_attn.k_proj,0.01362426,0.01000,1.005
21,self_attn.v_proj,0.01469827,0.01000,0.990
21,self_attn.q_proj,0.01251260,0.01000,0.993
21,self_attn.out_proj,0.00081556,0.01000,0.997
21,fc1,0.05632990,0.01000,1.020
21,fc2,0.00376281,0.01000,4.198
22,self_attn.k_proj,0.01262085,0.01000,1.009
22,self_attn.v_proj,0.01517828,0.01000,1.001
22,self_attn.q_proj,0.01358408,0.01000,1.001
22,self_attn.out_proj,0.00131237,0.01000,1.007
22,fc1,0.04993823,0.01000,1.032
22,fc2,0.00548277,0.01000,4.281
23,self_attn.k_proj,0.01658067,0.01000,1.060
23,self_attn.v_proj,0.00926656,0.01000,0.979
23,self_attn.q_proj,0.02430908,0.01000,0.970
23,self_attn.out_proj,0.00185453,0.01000,1.000
23,fc1,0.03861813,0.01000,0.996
23,fc2,0.00391702,0.01000,4.238
|