File size: 12,973 Bytes
b9f5d0d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 |
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.0000000000,0.05000,1.608
0,self_attn.v_proj,0.0000000000,0.05000,1.271
0,self_attn.q_proj,0.0000000001,0.05000,1.268
0,self_attn.o_proj,0.0000000003,0.05000,1.243
0,mlp.gate_proj,0.0000000149,0.05000,1.288
0,mlp.up_proj,0.0000000041,0.05000,1.275
0,mlp.down_proj,0.0000000021,0.05000,5.248
1,self_attn.k_proj,0.0000000000,0.05000,1.212
1,self_attn.v_proj,0.0000000000,0.05000,1.233
1,self_attn.q_proj,0.0000000002,0.05000,1.236
1,self_attn.o_proj,0.0000000002,0.05000,1.271
1,mlp.gate_proj,0.0000002356,0.05000,1.311
1,mlp.up_proj,0.0000000629,0.05000,1.349
1,mlp.down_proj,0.0000000041,0.05000,5.250
2,self_attn.k_proj,0.0000000001,0.05000,1.243
2,self_attn.v_proj,0.0000000001,0.05000,1.248
2,self_attn.q_proj,0.0000000004,0.05000,1.293
2,self_attn.o_proj,0.0000000005,0.05000,1.230
2,mlp.gate_proj,0.0000003456,0.05000,1.310
2,mlp.up_proj,0.0000001293,0.05000,1.350
2,mlp.down_proj,0.0000000034,0.05000,5.178
3,self_attn.k_proj,0.0000000002,0.05000,1.385
3,self_attn.v_proj,0.0000000002,0.05000,1.366
3,self_attn.q_proj,0.0000000007,0.05000,1.383
3,self_attn.o_proj,0.0000000006,0.05000,1.285
3,mlp.gate_proj,0.0000004641,0.05000,1.489
3,mlp.up_proj,0.0000001930,0.05000,1.492
3,mlp.down_proj,0.0000000064,0.05000,5.132
4,self_attn.k_proj,0.0000000003,0.05000,1.237
4,self_attn.v_proj,0.0000000003,0.05000,1.247
4,self_attn.q_proj,0.0000000012,0.05000,1.250
4,self_attn.o_proj,0.0000000008,0.05000,1.287
4,mlp.gate_proj,0.0000006685,0.05000,1.799
4,mlp.up_proj,0.0000003718,0.05000,1.796
4,mlp.down_proj,0.0000000080,0.05000,5.095
5,self_attn.k_proj,0.0000000003,0.05000,1.245
5,self_attn.v_proj,0.0000000004,0.05000,1.220
5,self_attn.q_proj,0.0000000014,0.05000,1.239
5,self_attn.o_proj,0.0000000010,0.05000,1.237
5,mlp.gate_proj,0.0000007204,0.05000,2.094
5,mlp.up_proj,0.0000002762,0.05000,2.086
5,mlp.down_proj,0.0000000159,0.05000,5.226
6,self_attn.k_proj,0.0000000005,0.05000,1.272
6,self_attn.v_proj,0.0000000006,0.05000,1.216
6,self_attn.q_proj,0.0000000023,0.05000,1.229
6,self_attn.o_proj,0.0000000014,0.05000,1.272
6,mlp.gate_proj,0.0000010165,0.05000,2.343
6,mlp.up_proj,0.0000005455,0.05000,2.312
6,mlp.down_proj,0.0000030633,0.05000,5.788
7,self_attn.k_proj,0.0000000022,0.05000,1.278
7,self_attn.v_proj,0.0000000024,0.05000,1.246
7,self_attn.q_proj,0.0000000095,0.05000,1.363
7,self_attn.o_proj,0.0000000033,0.05000,1.337
7,mlp.gate_proj,0.0000009015,0.05000,2.519
7,mlp.up_proj,0.0000004249,0.05000,2.498
7,mlp.down_proj,0.0000000286,0.05000,5.549
8,self_attn.k_proj,0.0000000025,0.05000,1.270
8,self_attn.v_proj,0.0000000029,0.05000,1.227
8,self_attn.q_proj,0.0000000109,0.05000,1.263
8,self_attn.o_proj,0.0000000039,0.05000,1.279
8,mlp.gate_proj,0.0000002529,0.05000,2.641
8,mlp.up_proj,0.0000001376,0.05000,2.604
8,mlp.down_proj,0.0000000270,0.05000,5.703
9,self_attn.k_proj,0.0000000020,0.05000,1.250
9,self_attn.v_proj,0.0000000021,0.05000,1.201
9,self_attn.q_proj,0.0000000083,0.05000,1.245
9,self_attn.o_proj,0.0000000031,0.05000,1.271
9,mlp.gate_proj,0.0000001374,0.05000,2.712
9,mlp.up_proj,0.0000001229,0.05000,2.666
9,mlp.down_proj,0.0000000360,0.05000,5.699
10,self_attn.k_proj,0.0000000032,0.05000,1.237
10,self_attn.v_proj,0.0000000037,0.05000,1.202
10,self_attn.q_proj,0.0000000146,0.05000,1.222
10,self_attn.o_proj,0.0000000055,0.05000,1.265
10,mlp.gate_proj,0.0000001438,0.05000,2.729
10,mlp.up_proj,0.0000001321,0.05000,2.691
10,mlp.down_proj,0.0000000309,0.05000,5.662
11,self_attn.k_proj,0.0000000047,0.05000,1.236
11,self_attn.v_proj,0.0000000054,0.05000,1.206
11,self_attn.q_proj,0.0000000213,0.05000,1.242
11,self_attn.o_proj,0.0000000080,0.05000,1.279
11,mlp.gate_proj,0.0000001702,0.05000,2.725
11,mlp.up_proj,0.0000001570,0.05000,2.679
11,mlp.down_proj,0.0000000382,0.05000,5.663
12,self_attn.k_proj,0.0000000038,0.05000,1.270
12,self_attn.v_proj,0.0000000043,0.05000,1.221
12,self_attn.q_proj,0.0000000168,0.05000,1.246
12,self_attn.o_proj,0.0000000083,0.05000,1.287
12,mlp.gate_proj,0.0000001990,0.05000,2.718
12,mlp.up_proj,0.0000001818,0.05000,2.679
12,mlp.down_proj,0.0000000475,0.05000,5.667
13,self_attn.k_proj,0.0000000083,0.05000,1.218
13,self_attn.v_proj,0.0000000095,0.05000,1.204
13,self_attn.q_proj,0.0000000373,0.05000,1.239
13,self_attn.o_proj,0.0000000132,0.05000,1.437
13,mlp.gate_proj,0.0000002398,0.05000,2.726
13,mlp.up_proj,0.0000002055,0.05000,2.682
13,mlp.down_proj,0.0000000539,0.05000,5.732
14,self_attn.k_proj,0.0000000060,0.05000,1.249
14,self_attn.v_proj,0.0000000070,0.05000,1.207
14,self_attn.q_proj,0.0000000262,0.05000,1.231
14,self_attn.o_proj,0.0000000124,0.05000,1.283
14,mlp.gate_proj,0.0000002277,0.05000,2.766
14,mlp.up_proj,0.0000002028,0.05000,2.716
14,mlp.down_proj,0.0000000555,0.05000,5.775
15,self_attn.k_proj,0.0000000054,0.05000,1.234
15,self_attn.v_proj,0.0000000057,0.05000,1.239
15,self_attn.q_proj,0.0000000232,0.05000,1.236
15,self_attn.o_proj,0.0000000120,0.05000,1.333
15,mlp.gate_proj,0.0000002143,0.05000,2.781
15,mlp.up_proj,0.0000002041,0.05000,2.748
15,mlp.down_proj,0.0000000569,0.05000,5.749
16,self_attn.k_proj,0.0000000069,0.05000,1.247
16,self_attn.v_proj,0.0000000078,0.05000,1.218
16,self_attn.q_proj,0.0000000293,0.05000,1.238
16,self_attn.o_proj,0.0000000160,0.05000,1.282
16,mlp.gate_proj,0.0000001931,0.05000,2.763
16,mlp.up_proj,0.0000001971,0.05000,2.714
16,mlp.down_proj,0.0000000595,0.05000,5.776
17,self_attn.k_proj,0.0000000070,0.05000,1.259
17,self_attn.v_proj,0.0000000076,0.05000,1.244
17,self_attn.q_proj,0.0000000310,0.05000,1.272
17,self_attn.o_proj,0.0000000174,0.05000,1.294
17,mlp.gate_proj,0.0000002041,0.05000,2.790
17,mlp.up_proj,0.0000002107,0.05000,2.739
17,mlp.down_proj,0.0000000591,0.05000,5.725
18,self_attn.k_proj,0.0000000099,0.05000,1.236
18,self_attn.v_proj,0.0000000110,0.05000,1.231
18,self_attn.q_proj,0.0000000449,0.05000,1.244
18,self_attn.o_proj,0.0000000171,0.05000,1.300
18,mlp.gate_proj,0.0000002128,0.05000,2.755
18,mlp.up_proj,0.0000002273,0.05000,2.717
18,mlp.down_proj,0.0000000713,0.05000,5.824
19,self_attn.k_proj,0.0000000133,0.05000,1.419
19,self_attn.v_proj,0.0000000144,0.05000,1.370
19,self_attn.q_proj,0.0000000573,0.05000,1.400
19,self_attn.o_proj,0.0000000215,0.05000,3.100
19,mlp.gate_proj,0.0000002382,0.05000,2.840
19,mlp.up_proj,0.0000002524,0.05000,2.880
19,mlp.down_proj,0.0000001835,0.05000,11.147
20,self_attn.k_proj,0.0000000244,0.05000,2.686
20,self_attn.v_proj,0.0000000304,0.05000,2.694
20,self_attn.q_proj,0.0000001156,0.05000,2.743
20,self_attn.o_proj,0.0000000301,0.05000,2.666
20,mlp.gate_proj,0.0000002484,0.05000,3.245
20,mlp.up_proj,0.0000002656,0.05000,3.233
20,mlp.down_proj,0.0000001017,0.05000,12.341
21,self_attn.k_proj,0.0000000251,0.05000,2.986
21,self_attn.v_proj,0.0000000264,0.05000,2.962
21,self_attn.q_proj,0.0000001019,0.05000,3.059
21,self_attn.o_proj,0.0000000396,0.05000,2.976
21,mlp.gate_proj,0.0000002622,0.05000,3.496
21,mlp.up_proj,0.0000002757,0.05000,3.500
21,mlp.down_proj,0.0000001119,0.05000,11.943
22,self_attn.k_proj,0.0000000238,0.05000,2.946
22,self_attn.v_proj,0.0000000296,0.05000,2.853
22,self_attn.q_proj,0.0000001088,0.05000,2.927
22,self_attn.o_proj,0.0000000381,0.05000,2.933
22,mlp.gate_proj,0.0000002831,0.05000,3.603
22,mlp.up_proj,0.0000003007,0.05000,3.516
22,mlp.down_proj,0.0000001143,0.05000,12.494
23,self_attn.k_proj,0.0000000342,0.05000,2.872
23,self_attn.v_proj,0.0000000455,0.05000,2.833
23,self_attn.q_proj,0.0000001655,0.05000,2.872
23,self_attn.o_proj,0.0000000303,0.05000,3.006
23,mlp.gate_proj,0.0000002891,0.05000,3.699
23,mlp.up_proj,0.0000003093,0.05000,3.486
23,mlp.down_proj,0.0000001386,0.05000,12.495
24,self_attn.k_proj,0.0000000418,0.05000,2.969
24,self_attn.v_proj,0.0000000572,0.05000,3.049
24,self_attn.q_proj,0.0000002142,0.05000,3.041
24,self_attn.o_proj,0.0000000520,0.05000,3.151
24,mlp.gate_proj,0.0000003189,0.05000,3.735
24,mlp.up_proj,0.0000003336,0.05000,3.711
24,mlp.down_proj,0.0000001439,0.05000,12.620
25,self_attn.k_proj,0.0000000434,0.05000,1.259
25,self_attn.v_proj,0.0000000548,0.05000,1.228
25,self_attn.q_proj,0.0000002045,0.05000,1.253
25,self_attn.o_proj,0.0000000486,0.05000,1.285
25,mlp.gate_proj,0.0000003654,0.05000,3.381
25,mlp.up_proj,0.0000003748,0.05000,3.274
25,mlp.down_proj,0.0000001957,0.05000,6.119
26,self_attn.k_proj,0.0000000447,0.05000,1.252
26,self_attn.v_proj,0.0000000600,0.05000,1.214
26,self_attn.q_proj,0.0000002259,0.05000,1.230
26,self_attn.o_proj,0.0000000501,0.05000,1.267
26,mlp.gate_proj,0.0000004381,0.05000,2.894
26,mlp.up_proj,0.0000004364,0.05000,2.844
26,mlp.down_proj,0.0000003177,0.05000,5.673
27,self_attn.k_proj,0.0000000808,0.05000,1.259
27,self_attn.v_proj,0.0000001062,0.05000,1.214
27,self_attn.q_proj,0.0000003821,0.05000,1.235
27,self_attn.o_proj,0.0000000942,0.05000,1.285
27,mlp.gate_proj,0.0000005449,0.05000,2.707
27,mlp.up_proj,0.0000005444,0.05000,2.679
27,mlp.down_proj,0.0000004879,0.05000,5.670
28,self_attn.k_proj,0.0000001069,0.05000,1.244
28,self_attn.v_proj,0.0000001591,0.05000,1.218
28,self_attn.q_proj,0.0000005816,0.05000,1.240
28,self_attn.o_proj,0.0000001124,0.05000,1.282
28,mlp.gate_proj,0.0000006669,0.05000,2.688
28,mlp.up_proj,0.0000006805,0.05000,2.661
28,mlp.down_proj,0.0000006141,0.05000,5.578
29,self_attn.k_proj,0.0000001652,0.05000,1.224
29,self_attn.v_proj,0.0000002137,0.05000,1.218
29,self_attn.q_proj,0.0000007917,0.05000,1.223
29,self_attn.o_proj,0.0000000944,0.05000,1.286
29,mlp.gate_proj,0.0000007430,0.05000,2.691
29,mlp.up_proj,0.0000007675,0.05000,2.657
29,mlp.down_proj,0.0000009056,0.05000,5.653
30,self_attn.k_proj,0.0000002540,0.05000,1.300
30,self_attn.v_proj,0.0000003661,0.05000,1.221
30,self_attn.q_proj,0.0000012225,0.05000,1.254
30,self_attn.o_proj,0.0000002047,0.05000,1.293
30,mlp.gate_proj,0.0000009594,0.05000,2.721
30,mlp.up_proj,0.0000009889,0.05000,2.666
30,mlp.down_proj,0.0000011860,0.05000,5.710
31,self_attn.k_proj,0.0000002662,0.05000,1.266
31,self_attn.v_proj,0.0000003309,0.05000,1.229
31,self_attn.q_proj,0.0000012580,0.05000,1.253
31,self_attn.o_proj,0.0000001825,0.05000,1.279
31,mlp.gate_proj,0.0000010435,0.05000,2.735
31,mlp.up_proj,0.0000010983,0.05000,2.693
31,mlp.down_proj,0.0000014923,0.05000,5.708
32,self_attn.k_proj,0.0000004588,0.05000,1.257
32,self_attn.v_proj,0.0000006749,0.05000,1.223
32,self_attn.q_proj,0.0000022000,0.05000,1.256
32,self_attn.o_proj,0.0000001838,0.05000,1.291
32,mlp.gate_proj,0.0000011835,0.05000,2.746
32,mlp.up_proj,0.0000012659,0.05000,2.906
32,mlp.down_proj,0.0000019001,0.05000,5.747
33,self_attn.k_proj,0.0000005869,0.05000,1.227
33,self_attn.v_proj,0.0000008845,0.05000,1.226
33,self_attn.q_proj,0.0000029721,0.05000,1.245
33,self_attn.o_proj,0.0000002444,0.05000,1.273
33,mlp.gate_proj,0.0000012551,0.05000,2.778
33,mlp.up_proj,0.0000013810,0.05000,2.740
33,mlp.down_proj,0.0000024191,0.05000,5.714
34,self_attn.k_proj,0.0000009436,0.05000,1.226
34,self_attn.v_proj,0.0000014251,0.05000,1.244
34,self_attn.q_proj,0.0000047080,0.05000,1.284
34,self_attn.o_proj,0.0000002777,0.05000,1.266
34,mlp.gate_proj,0.0000014021,0.05000,2.765
34,mlp.up_proj,0.0000015736,0.05000,2.723
34,mlp.down_proj,0.0000030276,0.05000,5.794
35,self_attn.k_proj,0.0000012035,0.05000,1.236
35,self_attn.v_proj,0.0000019715,0.05000,1.209
35,self_attn.q_proj,0.0000061430,0.05000,1.227
35,self_attn.o_proj,0.0000002815,0.05000,1.280
35,mlp.gate_proj,0.0000015192,0.05000,2.764
35,mlp.up_proj,0.0000017237,0.05000,2.725
35,mlp.down_proj,0.0000044798,0.05000,6.006
36,self_attn.k_proj,0.0000012551,0.05000,1.238
36,self_attn.v_proj,0.0000019508,0.05000,1.226
36,self_attn.q_proj,0.0000057919,0.05000,1.238
36,self_attn.o_proj,0.0000007864,0.05000,1.282
36,mlp.gate_proj,0.0000016147,0.05000,2.746
36,mlp.up_proj,0.0000018898,0.05000,2.715
36,mlp.down_proj,0.0000064629,0.05000,5.655
37,self_attn.k_proj,0.0000016820,0.05000,1.387
37,self_attn.v_proj,0.0000029921,0.05000,1.228
37,self_attn.q_proj,0.0000083882,0.05000,1.269
37,self_attn.o_proj,0.0000008105,0.05000,1.375
37,mlp.gate_proj,0.0000017379,0.05000,2.764
37,mlp.up_proj,0.0000020626,0.05000,2.722
37,mlp.down_proj,0.0000090136,0.05000,5.689
38,self_attn.k_proj,0.0000017496,0.05000,1.223
38,self_attn.v_proj,0.0000032497,0.05000,1.208
38,self_attn.q_proj,0.0000083224,0.05000,1.225
38,self_attn.o_proj,0.0000017614,0.05000,1.280
38,mlp.gate_proj,0.0000022542,0.05000,2.758
38,mlp.up_proj,0.0000025480,0.05000,2.713
38,mlp.down_proj,0.0000141993,0.05000,5.750
39,self_attn.k_proj,0.0000008697,0.05000,1.233
39,self_attn.v_proj,0.0000013233,0.05000,1.214
39,self_attn.q_proj,0.0000040708,0.05000,1.232
39,self_attn.o_proj,0.0000014657,0.05000,1.255
39,mlp.gate_proj,0.0000032426,0.05000,2.746
39,mlp.up_proj,0.0000035667,0.05000,2.682
39,mlp.down_proj,0.0000380214,0.05000,5.708
|