File size: 8,233 Bytes
e91eb74 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 |
layer,module,loss,damp,time
0,self_attn.q_proj,0.00143004,0.01000,1.666
0,self_attn.k_proj,0.00152641,0.01000,1.244
0,self_attn.v_proj,0.00055014,0.01000,1.224
0,self_attn.dense,0.00040645,0.01000,1.199
0,mlp.fc1,0.00156395,0.01000,1.471
0,mlp.fc2,45.18684896,0.01250,8.215
1,self_attn.q_proj,0.00098901,0.01000,1.230
1,self_attn.k_proj,0.00098037,0.01000,1.193
1,self_attn.v_proj,0.00025730,0.01000,1.200
1,self_attn.dense,0.00010639,0.01000,1.247
1,mlp.fc1,0.00321254,0.01000,1.491
1,mlp.fc2,47.71025594,0.01250,8.363
2,self_attn.q_proj,0.00124894,0.01000,1.345
2,self_attn.k_proj,0.00125460,0.01000,1.299
2,self_attn.v_proj,0.00052309,0.01000,1.253
2,self_attn.dense,0.00011987,0.01000,1.390
2,mlp.fc1,0.00455974,0.01000,1.709
2,mlp.fc2,51.62885539,0.01250,8.104
3,self_attn.q_proj,0.00130572,0.01000,1.189
3,self_attn.k_proj,0.00125844,0.01000,1.239
3,self_attn.v_proj,0.00100104,0.01000,1.399
3,self_attn.dense,0.00010456,0.01000,1.400
3,mlp.fc1,0.00656331,0.01000,1.650
3,mlp.fc2,52.00990804,0.01250,8.130
4,self_attn.q_proj,0.00165055,0.01000,1.275
4,self_attn.k_proj,0.00151279,0.01000,1.267
4,self_attn.v_proj,0.00109894,0.01000,1.210
4,self_attn.dense,0.00008104,0.01000,1.164
4,mlp.fc1,0.00635077,0.01000,1.470
4,mlp.fc2,45.79121908,0.01250,7.909
5,self_attn.q_proj,0.00146975,0.01000,1.218
5,self_attn.k_proj,0.00134510,0.01000,1.212
5,self_attn.v_proj,0.00096357,0.01000,1.230
5,self_attn.dense,0.00009522,0.01000,1.167
5,mlp.fc1,0.00543682,0.01000,1.510
5,mlp.fc2,39.91021474,0.01250,8.151
6,self_attn.q_proj,0.00179219,0.01000,1.304
6,self_attn.k_proj,0.00164673,0.01000,1.153
6,self_attn.v_proj,0.00118458,0.01000,1.130
6,self_attn.dense,0.00008672,0.01000,1.179
6,mlp.fc1,0.00587255,0.01000,1.484
6,mlp.fc2,44.64824422,0.01250,8.148
7,self_attn.q_proj,0.00186776,0.01000,1.171
7,self_attn.k_proj,0.00177774,0.01000,1.137
7,self_attn.v_proj,0.00120310,0.01000,1.267
7,self_attn.dense,0.00006188,0.01000,1.291
7,mlp.fc1,0.00593133,0.01000,1.634
7,mlp.fc2,39.13363139,0.01250,8.085
8,self_attn.q_proj,0.00189651,0.01000,1.240
8,self_attn.k_proj,0.00176293,0.01000,1.228
8,self_attn.v_proj,0.00140262,0.01000,1.245
8,self_attn.dense,0.00006599,0.01000,1.192
8,mlp.fc1,0.00588503,0.01000,1.698
8,mlp.fc2,40.45288086,0.01250,8.500
9,self_attn.q_proj,0.00191524,0.01000,1.303
9,self_attn.k_proj,0.00177061,0.01000,1.146
9,self_attn.v_proj,0.00140069,0.01000,1.155
9,self_attn.dense,0.00008725,0.01000,1.173
9,mlp.fc1,0.00577327,0.01000,1.504
9,mlp.fc2,41.11215210,0.01250,8.315
10,self_attn.q_proj,0.00192486,0.01000,1.232
10,self_attn.k_proj,0.00184659,0.01000,1.287
10,self_attn.v_proj,0.00122425,0.01000,1.217
10,self_attn.dense,0.00008808,0.01000,1.212
10,mlp.fc1,0.00560408,0.01000,1.617
10,mlp.fc2,38.80376689,0.01250,8.274
11,self_attn.q_proj,0.00201942,0.01000,1.267
11,self_attn.k_proj,0.00193283,0.01000,1.240
11,self_attn.v_proj,0.00134693,0.01000,1.196
11,self_attn.dense,0.00010903,0.01000,1.279
11,mlp.fc1,0.00545754,0.01000,1.536
11,mlp.fc2,38.56307475,0.01250,7.950
12,self_attn.q_proj,0.00209887,0.01000,1.200
12,self_attn.k_proj,0.00200503,0.01000,1.235
12,self_attn.v_proj,0.00137541,0.01000,1.226
12,self_attn.dense,0.00008138,0.01000,1.221
12,mlp.fc1,0.00540713,0.01000,1.525
12,mlp.fc2,40.88318888,0.01250,8.217
13,self_attn.q_proj,0.00200631,0.01000,1.251
13,self_attn.k_proj,0.00194197,0.01000,1.219
13,self_attn.v_proj,0.00134296,0.01000,1.149
13,self_attn.dense,0.00007691,0.01000,1.237
13,mlp.fc1,0.00549893,0.01000,1.499
13,mlp.fc2,41.56899770,0.01250,8.045
14,self_attn.q_proj,0.00210726,0.01000,1.282
14,self_attn.k_proj,0.00314308,0.01000,1.203
14,self_attn.v_proj,0.00133068,0.01000,1.242
14,self_attn.dense,0.00009206,0.01000,1.209
14,mlp.fc1,0.00539970,0.01000,1.479
14,mlp.fc2,41.86838531,0.01250,8.351
15,self_attn.q_proj,0.00199632,0.01000,1.302
15,self_attn.k_proj,0.00192289,0.01000,1.252
15,self_attn.v_proj,0.00126881,0.01000,1.190
15,self_attn.dense,0.00010529,0.01000,1.233
15,mlp.fc1,0.00512260,0.01000,1.654
15,mlp.fc2,40.16023763,0.01250,8.171
16,self_attn.q_proj,0.00206465,0.01000,1.269
16,self_attn.k_proj,0.00198583,0.01000,1.272
16,self_attn.v_proj,0.00134773,0.01000,1.218
16,self_attn.dense,0.00011100,0.01000,1.248
16,mlp.fc1,0.00523687,0.01000,1.613
16,mlp.fc2,44.88688151,0.01250,8.167
17,self_attn.q_proj,0.00197861,0.01000,1.327
17,self_attn.k_proj,0.00189119,0.01000,1.293
17,self_attn.v_proj,0.00124682,0.01000,1.285
17,self_attn.dense,0.00008207,0.01000,1.278
17,mlp.fc1,0.00489658,0.01000,1.480
17,mlp.fc2,41.40846761,0.01250,8.204
18,self_attn.q_proj,0.00228992,0.01000,1.315
18,self_attn.k_proj,0.00217069,0.01000,1.268
18,self_attn.v_proj,0.00131716,0.01000,1.255
18,self_attn.dense,0.00008202,0.01000,1.252
18,mlp.fc1,0.00499909,0.01000,1.578
18,mlp.fc2,41.80710856,0.01250,8.319
19,self_attn.q_proj,0.00216272,0.01000,1.389
19,self_attn.k_proj,0.00209569,0.01000,1.459
19,self_attn.v_proj,0.00134877,0.01000,1.276
19,self_attn.dense,0.00010894,0.01000,1.240
19,mlp.fc1,0.00535385,0.01000,1.577
19,mlp.fc2,50.55662028,0.01250,8.463
20,self_attn.q_proj,0.00229107,0.01000,1.262
20,self_attn.k_proj,0.03851147,0.01000,1.216
20,self_attn.v_proj,0.00130100,0.01000,1.126
20,self_attn.dense,0.00012769,0.01000,1.188
20,mlp.fc1,0.00545297,0.01000,1.534
20,mlp.fc2,49.51214600,0.01250,8.264
21,self_attn.q_proj,0.00218866,0.01000,1.271
21,self_attn.k_proj,0.00204123,0.01000,1.301
21,self_attn.v_proj,0.00156515,0.01000,1.246
21,self_attn.dense,0.00012658,0.01000,1.226
21,mlp.fc1,0.00584921,0.01000,1.567
21,mlp.fc2,52.78467306,0.01250,8.395
22,self_attn.q_proj,0.00225957,0.01000,1.327
22,self_attn.k_proj,0.00357083,0.01000,1.294
22,self_attn.v_proj,0.00164564,0.01000,1.182
22,self_attn.dense,0.00010589,0.01000,1.298
22,mlp.fc1,0.00612155,0.01000,1.662
22,mlp.fc2,52.80789185,0.01250,8.462
23,self_attn.q_proj,0.00243160,0.01000,1.332
23,self_attn.k_proj,0.00276039,0.01000,1.332
23,self_attn.v_proj,0.00159178,0.01000,1.117
23,self_attn.dense,0.00016935,0.01000,1.254
23,mlp.fc1,0.00641046,0.01000,1.594
23,mlp.fc2,52.62599691,0.01250,8.410
24,self_attn.q_proj,0.00232852,0.01000,1.257
24,self_attn.k_proj,0.00215273,0.01000,1.328
24,self_attn.v_proj,0.00190273,0.01000,1.293
24,self_attn.dense,0.00019747,0.01000,1.250
24,mlp.fc1,0.00686966,0.01000,1.517
24,mlp.fc2,55.26352437,0.01250,8.156
25,self_attn.q_proj,0.00253579,0.01000,1.216
25,self_attn.k_proj,0.01635120,0.01000,1.195
25,self_attn.v_proj,0.00198928,0.01000,1.303
25,self_attn.dense,0.00024381,0.01000,1.295
25,mlp.fc1,0.00749265,0.01000,1.487
25,mlp.fc2,52.59010824,0.01250,8.389
26,self_attn.q_proj,0.00319071,0.01000,1.357
26,self_attn.k_proj,0.00231659,0.01000,1.326
26,self_attn.v_proj,0.00232149,0.01000,1.287
26,self_attn.dense,0.00024788,0.01000,1.330
26,mlp.fc1,0.00773018,0.01000,1.644
26,mlp.fc2,50.22942098,0.01250,8.381
27,self_attn.q_proj,0.00275840,0.01000,1.284
27,self_attn.k_proj,0.00304915,0.01000,1.255
27,self_attn.v_proj,0.00238565,0.01000,1.236
27,self_attn.dense,0.00028637,0.01000,1.232
27,mlp.fc1,0.00808649,0.01000,1.501
27,mlp.fc2,48.66911825,0.01250,8.210
28,self_attn.q_proj,0.00248579,0.01000,1.194
28,self_attn.k_proj,0.00226670,0.01000,1.181
28,self_attn.v_proj,0.00246282,0.01000,1.183
28,self_attn.dense,0.00041967,0.01000,1.281
28,mlp.fc1,0.00824952,0.01000,1.527
28,mlp.fc2,43.05557760,0.01250,8.224
29,self_attn.q_proj,0.11153113,0.01000,1.266
29,self_attn.k_proj,0.64342054,0.01000,1.226
29,self_attn.v_proj,0.00479308,0.01000,1.228
29,self_attn.dense,0.00025549,0.01000,1.224
29,mlp.fc1,0.03276892,0.01000,1.495
29,mlp.fc2,36.04873657,0.01250,8.129
30,self_attn.q_proj,0.06741060,0.01000,1.441
30,self_attn.k_proj,0.70108302,0.01000,1.260
30,self_attn.v_proj,0.00279436,0.01000,1.327
30,self_attn.dense,0.00033670,0.01000,1.297
30,mlp.fc1,0.02931402,0.01000,1.595
30,mlp.fc2,32.39466349,0.01250,8.556
31,self_attn.q_proj,0.03431750,0.01000,1.214
31,self_attn.k_proj,5.91425705,0.01000,1.192
31,self_attn.v_proj,0.00139703,0.01000,1.202
31,self_attn.dense,0.00031197,0.01000,1.166
31,mlp.fc1,0.01573335,0.01000,1.476
31,mlp.fc2,58.13183085,0.01250,8.144
|