File size: 9,297 Bytes
00b2f1e | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00022096,0.01000,1.099
0,self_attn.v_proj,0.00000229,0.01000,2.435
0,self_attn.q_proj,0.00036210,0.01000,2.448
0,self_attn.o_proj,0.00000175,0.01000,2.415
0,mlp.up_proj,0.00150737,0.01000,1.416
0,mlp.gate_proj,0.00142441,0.01000,0.274
0,mlp.down_proj,0.00595958,0.01000,0.739
1,self_attn.k_proj,0.00078274,0.01000,0.286
1,self_attn.v_proj,0.00015115,0.01000,0.272
1,self_attn.q_proj,0.00174118,0.01000,0.162
1,self_attn.o_proj,0.00103411,0.01000,0.769
1,mlp.up_proj,0.00179594,0.01000,1.660
1,mlp.gate_proj,0.00228291,0.01000,0.973
1,mlp.down_proj,0.00224895,0.01000,0.746
2,self_attn.k_proj,0.00125878,0.01000,0.437
2,self_attn.v_proj,0.00020735,0.01000,0.269
2,self_attn.q_proj,0.00295782,0.01000,0.638
2,self_attn.o_proj,0.00098028,0.01000,0.810
2,mlp.up_proj,0.00240148,0.01000,0.318
2,mlp.gate_proj,0.00286920,0.01000,0.260
2,mlp.down_proj,0.00500130,0.01000,6.505
3,self_attn.k_proj,0.00188067,0.01000,1.197
3,self_attn.v_proj,0.00074529,0.01000,0.289
3,self_attn.q_proj,0.00454102,0.01000,0.292
3,self_attn.o_proj,0.00114469,0.01000,0.283
3,mlp.up_proj,0.00272536,0.01000,0.309
3,mlp.gate_proj,0.00309045,0.01000,0.279
3,mlp.down_proj,0.00337280,0.01000,0.736
4,self_attn.k_proj,0.00178011,0.01000,0.471
4,self_attn.v_proj,0.00069859,0.01000,0.149
4,self_attn.q_proj,0.00427734,0.01000,0.145
4,self_attn.o_proj,0.00194755,0.01000,1.499
4,mlp.up_proj,0.00357304,0.01000,0.308
4,mlp.gate_proj,0.00408032,0.01000,0.289
4,mlp.down_proj,0.00474062,0.01000,0.744
5,self_attn.k_proj,0.00194141,0.01000,0.269
5,self_attn.v_proj,0.00072606,0.01000,0.919
5,self_attn.q_proj,0.00453751,0.01000,1.476
5,self_attn.o_proj,0.00234540,0.01000,0.281
5,mlp.up_proj,0.00409303,0.01000,0.266
5,mlp.gate_proj,0.00449629,0.01000,0.596
5,mlp.down_proj,0.00556781,0.01000,6.516
6,self_attn.k_proj,0.00163071,0.01000,0.275
6,self_attn.v_proj,0.00068974,0.01000,0.287
6,self_attn.q_proj,0.00406556,0.01000,0.276
6,self_attn.o_proj,0.00182722,0.01000,0.284
6,mlp.up_proj,0.00438432,0.01000,0.273
6,mlp.gate_proj,0.00448065,0.01000,0.271
6,mlp.down_proj,0.00687783,0.01000,0.819
7,self_attn.k_proj,0.00229149,0.01000,0.366
7,self_attn.v_proj,0.00139370,0.01000,0.148
7,self_attn.q_proj,0.00637256,0.01000,0.142
7,self_attn.o_proj,0.00216803,0.01000,1.421
7,mlp.up_proj,0.00479016,0.01000,0.280
7,mlp.gate_proj,0.00473948,0.01000,0.287
7,mlp.down_proj,0.00823352,0.01000,0.831
8,self_attn.k_proj,0.00214538,0.01000,1.666
8,self_attn.v_proj,0.00103131,0.01000,1.952
8,self_attn.q_proj,0.00540090,0.01000,1.636
8,self_attn.o_proj,0.00283757,0.01000,0.303
8,mlp.up_proj,0.00546549,0.01000,0.274
8,mlp.gate_proj,0.00495393,0.01000,0.275
8,mlp.down_proj,0.01154038,0.01000,6.464
9,self_attn.k_proj,0.00147208,0.01000,1.818
9,self_attn.v_proj,0.00058141,0.01000,1.731
9,self_attn.q_proj,0.00394661,0.01000,1.675
9,self_attn.o_proj,0.00251221,0.01000,0.324
9,mlp.up_proj,0.00595842,0.01000,0.347
9,mlp.gate_proj,0.00489875,0.01000,0.343
9,mlp.down_proj,0.01428184,0.01000,0.904
10,self_attn.k_proj,0.00132155,0.01000,2.685
10,self_attn.v_proj,0.00068617,0.01000,2.503
10,self_attn.q_proj,0.00363028,0.01000,1.752
10,self_attn.o_proj,0.00545926,0.01000,0.408
10,mlp.up_proj,0.00611763,0.01000,1.632
10,mlp.gate_proj,0.00474317,0.01000,1.328
10,mlp.down_proj,0.01347071,0.01000,2.937
11,self_attn.k_proj,0.00115821,0.01000,3.339
11,self_attn.v_proj,0.00065106,0.01000,2.422
11,self_attn.q_proj,0.00344706,0.01000,2.382
11,self_attn.o_proj,0.00740811,0.01000,2.400
11,mlp.up_proj,0.00620620,0.01000,2.718
11,mlp.gate_proj,0.00449832,0.01000,2.710
11,mlp.down_proj,0.27257532,0.01000,5.754
12,self_attn.k_proj,0.00163961,0.01000,0.344
12,self_attn.v_proj,0.00094356,0.01000,0.337
12,self_attn.q_proj,0.00456318,0.01000,0.338
12,self_attn.o_proj,0.00419531,0.01000,1.311
12,mlp.up_proj,0.00565002,0.01000,0.279
12,mlp.gate_proj,0.00445975,0.01000,1.091
12,mlp.down_proj,0.01192240,0.01000,4.327
13,self_attn.k_proj,0.00174242,0.01000,0.339
13,self_attn.v_proj,0.00083272,0.01000,0.344
13,self_attn.q_proj,0.00502530,0.01000,0.395
13,self_attn.o_proj,0.00500150,0.01000,0.343
13,mlp.up_proj,0.00570113,0.01000,1.926
13,mlp.gate_proj,0.00524486,0.01000,1.750
13,mlp.down_proj,0.01178209,0.01000,2.821
14,self_attn.k_proj,0.00200629,0.01000,0.361
14,self_attn.v_proj,0.00157519,0.01000,0.359
14,self_attn.q_proj,0.00566488,0.01000,0.366
14,self_attn.o_proj,0.00620107,0.01000,2.248
14,mlp.up_proj,0.00577955,0.01000,4.655
14,mlp.gate_proj,0.00547774,0.01000,5.042
14,mlp.down_proj,0.01469438,0.01000,8.832
15,self_attn.k_proj,0.00194205,0.01000,0.349
15,self_attn.v_proj,0.00151308,0.01000,0.345
15,self_attn.q_proj,0.00563300,0.01000,0.342
15,self_attn.o_proj,0.00601548,0.01000,0.344
15,mlp.up_proj,0.00601284,0.01000,0.342
15,mlp.gate_proj,0.00594717,0.01000,0.336
15,mlp.down_proj,0.01753610,0.01000,5.689
16,self_attn.k_proj,0.00155090,0.01000,1.763
16,self_attn.v_proj,0.00110804,0.01000,0.365
16,self_attn.q_proj,0.00422240,0.01000,0.357
16,self_attn.o_proj,0.00903260,0.01000,0.345
16,mlp.up_proj,0.00553630,0.01000,1.181
16,mlp.gate_proj,0.00532908,0.01000,1.499
16,mlp.down_proj,0.01532181,0.01000,5.315
17,self_attn.k_proj,0.00241632,0.01000,0.830
17,self_attn.v_proj,0.00194845,0.01000,2.641
17,self_attn.q_proj,0.00834111,0.01000,4.413
17,self_attn.o_proj,0.01061929,0.01000,2.746
17,mlp.up_proj,0.00562216,0.01000,2.742
17,mlp.gate_proj,0.00506327,0.01000,1.101
17,mlp.down_proj,0.01818097,0.01000,4.789
18,self_attn.k_proj,0.00273163,0.01000,2.613
18,self_attn.v_proj,0.00311299,0.01000,1.891
18,self_attn.q_proj,0.00828936,0.01000,0.344
18,self_attn.o_proj,0.00938506,0.01000,0.345
18,mlp.up_proj,0.00625932,0.01000,0.344
18,mlp.gate_proj,0.00583430,0.01000,0.339
18,mlp.down_proj,0.03318551,0.01000,2.234
19,self_attn.k_proj,0.00133622,0.01000,0.326
19,self_attn.v_proj,0.00225405,0.01000,0.800
19,self_attn.q_proj,0.00550781,0.01000,1.800
19,self_attn.o_proj,0.01567704,0.01000,0.449
19,mlp.up_proj,0.00725614,0.01000,2.903
19,mlp.gate_proj,0.00687203,0.01000,2.471
19,mlp.down_proj,0.03395692,0.01000,2.946
20,self_attn.k_proj,0.00182818,0.01000,0.388
20,self_attn.v_proj,0.00369986,0.01000,1.045
20,self_attn.q_proj,0.00668970,0.01000,3.772
20,self_attn.o_proj,0.01447436,0.01000,3.580
20,mlp.up_proj,0.00868652,0.01000,2.710
20,mlp.gate_proj,0.00763109,0.01000,1.037
20,mlp.down_proj,0.06614500,0.01000,3.153
21,self_attn.k_proj,0.00169165,0.01000,0.353
21,self_attn.v_proj,0.00278996,0.01000,1.556
21,self_attn.q_proj,0.00603606,0.01000,2.608
21,self_attn.o_proj,0.01160419,0.01000,2.633
21,mlp.up_proj,0.00941546,0.01000,2.761
21,mlp.gate_proj,0.00857336,0.01000,1.637
21,mlp.down_proj,0.05236044,0.01000,3.023
22,self_attn.k_proj,0.00173458,0.01000,0.340
22,self_attn.v_proj,0.00304587,0.01000,0.335
22,self_attn.q_proj,0.00609978,0.01000,1.500
22,self_attn.o_proj,0.01699413,0.01000,0.329
22,mlp.up_proj,0.01043702,0.01000,3.157
22,mlp.gate_proj,0.00901166,0.01000,2.403
22,mlp.down_proj,0.08635419,0.01000,2.277
23,self_attn.k_proj,0.00235798,0.01000,2.724
23,self_attn.v_proj,0.00853371,0.01000,2.700
23,self_attn.q_proj,0.00731025,0.01000,2.679
23,self_attn.o_proj,0.04595792,0.01000,0.347
23,mlp.up_proj,0.01267573,0.01000,1.922
23,mlp.gate_proj,0.00977481,0.01000,1.572
23,mlp.down_proj,0.09878369,0.01000,1.992
24,self_attn.k_proj,0.00193833,0.01000,0.352
24,self_attn.v_proj,0.00926276,0.01000,0.343
24,self_attn.q_proj,0.00732911,0.01000,0.354
24,self_attn.o_proj,0.02490180,0.01000,0.294
24,mlp.up_proj,0.01275103,0.01000,3.643
24,mlp.gate_proj,0.00968059,0.01000,4.339
24,mlp.down_proj,0.13135986,0.01000,6.748
25,self_attn.k_proj,0.00188807,0.01000,1.592
25,self_attn.v_proj,0.00410724,0.01000,1.087
25,self_attn.q_proj,0.00648702,0.01000,0.338
25,self_attn.o_proj,0.01829978,0.01000,1.828
25,mlp.up_proj,0.01323432,0.01000,0.353
25,mlp.gate_proj,0.01043347,0.01000,0.343
25,mlp.down_proj,0.10982227,0.01000,6.597
26,self_attn.k_proj,0.00186195,0.01000,3.885
26,self_attn.v_proj,0.00593649,0.01000,2.686
26,self_attn.q_proj,0.00663982,0.01000,0.818
26,self_attn.o_proj,0.02385299,0.01000,0.346
26,mlp.up_proj,0.01519259,0.01000,0.357
26,mlp.gate_proj,0.01179895,0.01000,0.383
26,mlp.down_proj,0.16240232,0.01000,2.805
27,self_attn.k_proj,0.00188216,0.01000,0.753
27,self_attn.v_proj,0.00480582,0.01000,2.568
27,self_attn.q_proj,0.00687713,0.01000,3.243
27,self_attn.o_proj,0.03130198,0.01000,1.944
27,mlp.up_proj,0.01527163,0.01000,0.361
27,mlp.gate_proj,0.01144433,0.01000,0.350
27,mlp.down_proj,0.20937583,0.01000,6.981
28,self_attn.k_proj,0.00163398,0.01000,2.274
28,self_attn.v_proj,0.00619308,0.01000,0.347
28,self_attn.q_proj,0.00561940,0.01000,1.200
28,self_attn.o_proj,0.02704479,0.01000,0.391
28,mlp.up_proj,0.01647252,0.01000,0.362
28,mlp.gate_proj,0.01167521,0.01000,0.348
28,mlp.down_proj,3.19434714,0.01000,7.166
29,self_attn.k_proj,0.00153822,0.01000,1.574
29,self_attn.v_proj,0.00717453,0.01000,0.978
29,self_attn.q_proj,0.00649254,0.01000,1.795
29,self_attn.o_proj,0.06275121,0.01000,0.949
29,mlp.up_proj,0.02440672,0.01000,2.122
29,mlp.gate_proj,0.01807862,0.01000,0.632
29,mlp.down_proj,0.86159390,0.01000,0.909
|