File size: 11,328 Bytes
3ed573b | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00093500,0.01000,1.534
0,self_attn.v_proj,0.00075287,0.01000,1.058
0,self_attn.q_proj,0.00301158,0.01000,0.966
0,self_attn.o_proj,0.01636044,0.01000,1.097
0,mlp.up_proj,0.55349815,0.01000,1.074
0,mlp.gate_proj,0.63002926,0.01000,0.989
0,mlp.down_proj,0.18759912,0.01000,3.718
1,self_attn.k_proj,0.00388462,0.01000,1.037
1,self_attn.v_proj,0.00418270,0.01000,1.124
1,self_attn.q_proj,0.01329488,0.01000,1.123
1,self_attn.o_proj,0.02369094,0.01000,1.134
1,mlp.up_proj,5.06094027,0.01000,1.068
1,mlp.gate_proj,12.48626137,0.01000,0.973
1,mlp.down_proj,0.21249261,0.01000,3.772
2,self_attn.k_proj,0.00920746,0.01000,1.026
2,self_attn.v_proj,0.00892699,0.01000,0.995
2,self_attn.q_proj,0.03115090,0.01000,0.972
2,self_attn.o_proj,0.01967876,0.01000,1.049
2,mlp.up_proj,18.21238136,0.01000,1.142
2,mlp.gate_proj,23.30099678,0.01000,1.107
2,mlp.down_proj,0.15935239,0.01000,3.670
3,self_attn.k_proj,0.01730567,0.01000,1.145
3,self_attn.v_proj,0.01813262,0.01000,1.010
3,self_attn.q_proj,0.06220551,0.01000,1.113
3,self_attn.o_proj,0.03520732,0.01000,1.112
3,mlp.up_proj,11.37148094,0.01000,1.075
3,mlp.gate_proj,24.17206383,0.01000,1.038
3,mlp.down_proj,0.37454456,0.01000,3.873
4,self_attn.k_proj,0.03873355,0.01000,1.127
4,self_attn.v_proj,0.04026245,0.01000,1.068
4,self_attn.q_proj,0.13652131,0.01000,1.121
4,self_attn.o_proj,0.05750610,0.01000,1.179
4,mlp.up_proj,11.50895309,0.01000,1.067
4,mlp.gate_proj,29.62431717,0.01000,1.020
4,mlp.down_proj,0.79113972,0.01000,3.775
5,self_attn.k_proj,0.03782712,0.01000,1.035
5,self_attn.v_proj,0.04062828,0.01000,1.005
5,self_attn.q_proj,0.13939869,0.01000,0.988
5,self_attn.o_proj,0.08601132,0.01000,1.120
5,mlp.up_proj,7.35449219,0.01000,1.113
5,mlp.gate_proj,15.71476841,0.01000,0.987
5,mlp.down_proj,1.26612008,0.01000,3.658
6,self_attn.k_proj,0.07410677,0.01000,1.083
6,self_attn.v_proj,0.08444937,0.01000,1.035
6,self_attn.q_proj,0.29530990,0.01000,1.046
6,self_attn.o_proj,0.24855541,0.01000,1.035
6,mlp.up_proj,12.12503052,0.01000,1.186
6,mlp.gate_proj,24.27440262,0.01000,1.014
6,mlp.down_proj,59.69503403,0.01000,3.886
7,self_attn.k_proj,0.18620780,0.01000,1.172
7,self_attn.v_proj,0.19225197,0.01000,1.037
7,self_attn.q_proj,0.66303122,0.01000,0.981
7,self_attn.o_proj,0.22942577,0.01000,1.053
7,mlp.up_proj,12.31387806,0.01000,1.202
7,mlp.gate_proj,21.64307404,0.01000,1.131
7,mlp.down_proj,2.05965924,0.01000,3.897
8,self_attn.k_proj,0.31598431,0.01000,1.144
8,self_attn.v_proj,0.34093946,0.01000,1.188
8,self_attn.q_proj,1.14995360,0.01000,1.148
8,self_attn.o_proj,0.35936299,0.01000,1.137
8,mlp.up_proj,12.45734978,0.01000,1.095
8,mlp.gate_proj,14.27222443,0.01000,1.059
8,mlp.down_proj,3.87224698,0.01000,3.592
9,self_attn.k_proj,0.42755005,0.01000,1.060
9,self_attn.v_proj,0.43955854,0.01000,0.980
9,self_attn.q_proj,1.51034832,0.01000,0.993
9,self_attn.o_proj,0.53357273,0.01000,1.063
9,mlp.up_proj,17.22698212,0.01000,1.102
9,mlp.gate_proj,23.49119186,0.01000,1.075
9,mlp.down_proj,5.00397158,0.01000,3.603
10,self_attn.k_proj,0.90024441,0.01000,1.063
10,self_attn.v_proj,1.01532078,0.01000,0.989
10,self_attn.q_proj,3.25746417,0.01000,0.973
10,self_attn.o_proj,0.74504685,0.01000,1.033
10,mlp.up_proj,18.57254982,0.01000,1.187
10,mlp.gate_proj,23.94193268,0.01000,1.042
10,mlp.down_proj,5.72752857,0.01000,3.799
11,self_attn.k_proj,0.46532309,0.01000,1.186
11,self_attn.v_proj,0.49314433,0.01000,1.097
11,self_attn.q_proj,1.61019170,0.01000,1.068
11,self_attn.o_proj,0.63873482,0.01000,1.066
11,mlp.up_proj,19.01406097,0.01000,1.049
11,mlp.gate_proj,22.41117859,0.01000,1.093
11,mlp.down_proj,5.03123236,0.01000,3.816
12,self_attn.k_proj,0.53598475,0.01000,1.056
12,self_attn.v_proj,0.58172190,0.01000,0.974
12,self_attn.q_proj,1.87110019,0.01000,1.103
12,self_attn.o_proj,0.86515743,0.01000,1.163
12,mlp.up_proj,19.76538849,0.01000,1.060
12,mlp.gate_proj,21.69308472,0.01000,0.996
12,mlp.down_proj,4.94389725,0.01000,3.518
13,self_attn.k_proj,0.41922653,0.01000,1.072
13,self_attn.v_proj,0.41501531,0.01000,0.966
13,self_attn.q_proj,1.54299450,0.01000,1.014
13,self_attn.o_proj,0.64388251,0.01000,1.041
13,mlp.up_proj,19.62747574,0.01000,1.152
13,mlp.gate_proj,19.93264961,0.01000,1.026
13,mlp.down_proj,5.23524094,0.01000,3.653
14,self_attn.k_proj,0.69069356,0.01000,1.158
14,self_attn.v_proj,0.72211957,0.01000,1.076
14,self_attn.q_proj,2.52726769,0.01000,0.986
14,self_attn.o_proj,1.15350628,0.01000,1.025
14,mlp.up_proj,19.14536667,0.01000,1.055
14,mlp.gate_proj,19.30226707,0.01000,1.131
14,mlp.down_proj,4.67902088,0.01000,3.912
15,self_attn.k_proj,0.73228085,0.01000,1.084
15,self_attn.v_proj,0.70357966,0.01000,1.095
15,self_attn.q_proj,2.62229300,0.01000,1.147
15,self_attn.o_proj,1.01154995,0.01000,1.058
15,mlp.up_proj,18.30879593,0.01000,1.072
15,mlp.gate_proj,17.72216034,0.01000,0.982
15,mlp.down_proj,5.20527649,0.01000,3.729
16,self_attn.k_proj,1.26578164,0.01000,1.050
16,self_attn.v_proj,1.44486320,0.01000,0.955
16,self_attn.q_proj,4.88816977,0.01000,1.048
16,self_attn.o_proj,1.40934920,0.01000,1.159
16,mlp.up_proj,20.92573166,0.01000,1.061
16,mlp.gate_proj,21.00225067,0.01000,0.998
16,mlp.down_proj,12.26511765,0.01000,3.586
17,self_attn.k_proj,1.20173907,0.01000,1.172
17,self_attn.v_proj,1.35401189,0.01000,1.089
17,self_attn.q_proj,4.90240002,0.01000,1.130
17,self_attn.o_proj,1.96535897,0.01000,1.158
17,mlp.up_proj,20.21404648,0.01000,1.085
17,mlp.gate_proj,19.69080925,0.01000,0.977
17,mlp.down_proj,8.91361427,0.01000,3.612
18,self_attn.k_proj,1.35796165,0.01000,1.066
18,self_attn.v_proj,1.48053002,0.01000,0.970
18,self_attn.q_proj,5.17301416,0.01000,1.029
18,self_attn.o_proj,1.48301518,0.01000,1.033
18,mlp.up_proj,22.05006790,0.01000,1.070
18,mlp.gate_proj,21.51061440,0.01000,1.045
18,mlp.down_proj,7.47183609,0.01000,3.574
19,self_attn.k_proj,2.67927146,0.01000,1.050
19,self_attn.v_proj,2.84377718,0.01000,0.990
19,self_attn.q_proj,10.55477047,0.01000,1.005
19,self_attn.o_proj,2.78883767,0.01000,1.057
19,mlp.up_proj,25.99320602,0.01000,1.182
19,mlp.gate_proj,25.00505829,0.01000,1.060
19,mlp.down_proj,9.58252621,0.01000,3.734
20,self_attn.k_proj,2.25592470,0.01000,1.186
20,self_attn.v_proj,2.64512777,0.01000,1.087
20,self_attn.q_proj,9.77148819,0.01000,0.975
20,self_attn.o_proj,2.61370730,0.01000,1.056
20,mlp.up_proj,28.45001221,0.01000,1.048
20,mlp.gate_proj,26.85064888,0.01000,1.100
20,mlp.down_proj,10.31070518,0.01000,3.764
21,self_attn.k_proj,3.03140640,0.01000,1.053
21,self_attn.v_proj,3.70216203,0.01000,1.002
21,self_attn.q_proj,12.58547688,0.01000,0.986
21,self_attn.o_proj,2.81117725,0.01000,1.165
21,mlp.up_proj,32.83880615,0.01000,1.052
21,mlp.gate_proj,30.72813225,0.01000,0.987
21,mlp.down_proj,14.17037201,0.01000,3.583
22,self_attn.k_proj,6.70605469,0.01000,1.070
22,self_attn.v_proj,7.37399912,0.01000,0.973
22,self_attn.q_proj,26.31335831,0.01000,1.006
22,self_attn.o_proj,5.94558525,0.01000,1.058
22,mlp.up_proj,38.05461502,0.01000,1.204
22,mlp.gate_proj,35.98967361,0.01000,1.021
22,mlp.down_proj,23.43338966,0.01000,3.696
23,self_attn.k_proj,6.65718555,0.01000,1.167
23,self_attn.v_proj,8.32367611,0.01000,1.091
23,self_attn.q_proj,27.57974243,0.01000,0.993
23,self_attn.o_proj,9.29317760,0.01000,1.056
23,mlp.up_proj,43.67939758,0.01000,1.085
23,mlp.gate_proj,42.31611633,0.01000,1.128
23,mlp.down_proj,31.69913673,0.01000,3.802
24,self_attn.k_proj,11.80602646,0.01000,1.067
24,self_attn.v_proj,15.26894760,0.01000,1.076
24,self_attn.q_proj,48.94207001,0.01000,1.119
24,self_attn.o_proj,14.16162300,0.01000,1.110
24,mlp.up_proj,47.95410156,0.01000,1.113
24,mlp.gate_proj,46.95746231,0.01000,0.999
24,mlp.down_proj,37.59236908,0.01000,3.698
25,self_attn.k_proj,9.39568329,0.01000,1.065
25,self_attn.v_proj,11.52959633,0.01000,0.981
25,self_attn.q_proj,37.55451965,0.01000,1.061
25,self_attn.o_proj,6.60415459,0.01000,1.156
25,mlp.up_proj,53.72169495,0.01000,1.061
25,mlp.gate_proj,53.26170349,0.01000,1.014
25,mlp.down_proj,49.13291931,0.01000,3.564
26,self_attn.k_proj,15.07968521,0.01000,1.042
26,self_attn.v_proj,18.87903214,0.01000,1.023
26,self_attn.q_proj,61.75351334,0.01000,0.987
26,self_attn.o_proj,8.19011021,0.01000,1.035
26,mlp.up_proj,63.40507126,0.01000,1.162
26,mlp.gate_proj,61.87738037,0.01000,0.968
26,mlp.down_proj,55.10468674,0.01000,3.617
27,self_attn.k_proj,16.51064682,0.01000,1.152
27,self_attn.v_proj,22.46823502,0.01000,0.951
27,self_attn.q_proj,69.66435242,0.01000,1.014
27,self_attn.o_proj,9.08815002,0.01000,1.053
27,mlp.up_proj,70.57014465,0.01000,1.231
27,mlp.gate_proj,67.74318695,0.01000,1.085
27,mlp.down_proj,74.30647278,0.01000,3.742
28,self_attn.k_proj,19.06116486,0.01000,1.185
28,self_attn.v_proj,22.31396866,0.01000,1.009
28,self_attn.q_proj,73.59075928,0.01000,1.058
28,self_attn.o_proj,15.23631573,0.01000,1.049
28,mlp.up_proj,81.82687378,0.01000,1.201
28,mlp.gate_proj,76.54244995,0.01000,1.133
28,mlp.down_proj,100.95344543,0.01000,3.875
29,self_attn.k_proj,42.74740601,0.01000,1.176
29,self_attn.v_proj,62.09001541,0.01000,1.087
29,self_attn.q_proj,169.90083313,0.01000,1.098
29,self_attn.o_proj,19.69995117,0.01000,1.015
29,mlp.up_proj,94.24476624,0.01000,1.089
29,mlp.gate_proj,85.47050476,0.01000,0.995
29,mlp.down_proj,111.90260315,0.01000,3.936
30,self_attn.k_proj,48.42563629,0.01000,1.164
30,self_attn.v_proj,63.64318848,0.01000,1.086
30,self_attn.q_proj,186.39895630,0.01000,1.069
30,self_attn.o_proj,28.51611710,0.01000,1.014
30,mlp.up_proj,99.81655884,0.01000,1.058
30,mlp.gate_proj,88.40076447,0.01000,0.987
30,mlp.down_proj,144.04133606,0.01000,3.710
31,self_attn.k_proj,67.51919556,0.01000,1.048
31,self_attn.v_proj,93.95922852,0.01000,0.948
31,self_attn.q_proj,243.45693970,0.01000,1.109
31,self_attn.o_proj,38.91883850,0.01000,1.155
31,mlp.up_proj,105.36692047,0.01000,1.053
31,mlp.gate_proj,90.30496979,0.01000,1.033
31,mlp.down_proj,174.71215820,0.01000,3.657
32,self_attn.k_proj,90.68847656,0.01000,1.075
32,self_attn.v_proj,136.25199890,0.01000,0.984
32,self_attn.q_proj,349.72949219,0.01000,1.022
32,self_attn.o_proj,42.40522003,0.01000,1.082
32,mlp.up_proj,112.39004517,0.01000,1.057
32,mlp.gate_proj,94.23210907,0.01000,1.021
32,mlp.down_proj,209.10299683,0.01000,3.541
33,self_attn.k_proj,160.63726807,0.01000,1.170
33,self_attn.v_proj,312.46691895,0.01000,1.057
33,self_attn.q_proj,723.88800049,0.01000,1.030
33,self_attn.o_proj,101.37340546,0.01000,1.064
33,mlp.up_proj,123.91452026,0.01000,1.132
33,mlp.gate_proj,102.19406128,0.01000,1.138
33,mlp.down_proj,272.35577393,0.01000,3.912
34,self_attn.k_proj,137.95373535,0.01000,1.092
34,self_attn.v_proj,218.98117065,0.01000,1.085
34,self_attn.q_proj,585.34942627,0.01000,1.113
34,self_attn.o_proj,121.98693085,0.01000,1.006
34,mlp.up_proj,144.67446899,0.01000,1.042
34,mlp.gate_proj,125.80036163,0.01000,1.068
34,mlp.down_proj,392.88323975,0.01000,3.726
35,self_attn.k_proj,63.21575165,0.01000,1.095
35,self_attn.v_proj,82.64318848,0.01000,0.952
35,self_attn.q_proj,236.55862427,0.01000,1.097
35,self_attn.o_proj,66.26197815,0.01000,1.150
35,mlp.up_proj,196.64938354,0.01000,1.047
35,mlp.gate_proj,170.04873657,0.01000,1.024
35,mlp.down_proj,2814.77734375,0.01000,3.573
|