File size: 11,667 Bytes
c72312f | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.0000000529,0.05000,5.639
0,self_attn.v_proj,0.0000000459,0.05000,5.749
0,self_attn.q_proj,0.0000001946,0.05000,5.781
0,self_attn.o_proj,0.0000001205,0.05000,1.680
0,mlp.gate_proj,0.0000119312,0.05000,2.209
0,mlp.up_proj,0.0000104520,0.05000,2.237
0,mlp.down_proj,0.0000016241,0.05000,3.944
1,self_attn.q_proj,0.0000003163,0.05000,5.104
1,self_attn.v_proj,0.0000000882,0.05000,5.167
1,self_attn.k_proj,0.0000000853,0.05000,5.201
1,self_attn.o_proj,0.0000001642,0.05000,1.658
1,mlp.up_proj,0.0001817668,0.05000,2.850
1,mlp.gate_proj,0.0004014041,0.05000,2.881
1,mlp.down_proj,0.0000017688,0.05000,4.370
2,self_attn.q_proj,0.0000008970,0.05000,5.286
2,self_attn.k_proj,0.0000002566,0.05000,5.321
2,self_attn.v_proj,0.0000002510,0.05000,5.343
2,self_attn.o_proj,0.0000002251,0.05000,1.713
2,mlp.gate_proj,0.0006498467,0.05000,2.413
2,mlp.up_proj,0.0005177948,0.05000,2.438
2,mlp.down_proj,0.0000012732,0.05000,4.137
3,self_attn.q_proj,0.0000017194,0.05000,4.685
3,self_attn.k_proj,0.0000004413,0.05000,4.758
3,self_attn.v_proj,0.0000004548,0.05000,4.772
3,self_attn.o_proj,0.0000003429,0.05000,1.565
3,mlp.gate_proj,0.0006881107,0.05000,2.288
3,mlp.up_proj,0.0003561646,0.05000,2.318
3,mlp.down_proj,0.0000036292,0.05000,4.141
4,self_attn.v_proj,0.0000008922,0.05000,4.747
4,self_attn.q_proj,0.0000032643,0.05000,4.819
4,self_attn.k_proj,0.0000008853,0.05000,4.835
4,self_attn.o_proj,0.0000005458,0.05000,1.590
4,mlp.gate_proj,0.0005724557,0.05000,2.200
4,mlp.up_proj,0.0002293439,0.05000,2.225
4,mlp.down_proj,0.0000055330,0.05000,4.094
5,self_attn.q_proj,0.0000035649,0.05000,4.698
5,self_attn.v_proj,0.0000009740,0.05000,4.701
5,self_attn.k_proj,0.0000009058,0.05000,4.750
5,self_attn.o_proj,0.0000009772,0.05000,1.573
5,mlp.gate_proj,0.0002079280,0.05000,2.225
5,mlp.up_proj,0.0001013186,0.05000,2.242
5,mlp.down_proj,0.0000081773,0.05000,4.052
6,self_attn.v_proj,0.0000020665,0.05000,4.633
6,self_attn.k_proj,0.0000018139,0.05000,4.651
6,self_attn.q_proj,0.0000076765,0.05000,4.707
6,self_attn.o_proj,0.0000023579,0.05000,1.543
6,mlp.gate_proj,0.0002195186,0.05000,2.175
6,mlp.up_proj,0.0001256842,0.05000,2.209
6,mlp.down_proj,0.0001805787,0.05000,4.051
7,self_attn.k_proj,0.0000041912,0.05000,4.737
7,self_attn.q_proj,0.0000155375,0.05000,4.792
7,self_attn.v_proj,0.0000043051,0.05000,4.791
7,self_attn.o_proj,0.0000028798,0.05000,1.601
7,mlp.up_proj,0.0001527545,0.05000,2.254
7,mlp.gate_proj,0.0002531733,0.05000,2.284
7,mlp.down_proj,0.0000135267,0.05000,4.097
8,self_attn.k_proj,0.0000061028,0.05000,4.791
8,self_attn.v_proj,0.0000066735,0.05000,4.804
8,self_attn.q_proj,0.0000235807,0.05000,4.855
8,self_attn.o_proj,0.0000041072,0.05000,1.567
8,mlp.up_proj,0.0001451299,0.05000,2.221
8,mlp.gate_proj,0.0001770070,0.05000,2.239
8,mlp.down_proj,0.0000203039,0.05000,4.053
9,self_attn.q_proj,0.0000290558,0.05000,4.707
9,self_attn.v_proj,0.0000080488,0.05000,4.772
9,self_attn.k_proj,0.0000081565,0.05000,4.789
9,self_attn.o_proj,0.0000045795,0.05000,1.552
9,mlp.up_proj,0.0001810021,0.05000,2.156
9,mlp.gate_proj,0.0002832804,0.05000,2.183
9,mlp.down_proj,0.0000204025,0.05000,4.116
10,self_attn.q_proj,0.0000428730,0.05000,4.681
10,self_attn.k_proj,0.0000110682,0.05000,4.728
10,self_attn.v_proj,0.0000127939,0.05000,4.753
10,self_attn.o_proj,0.0000070710,0.05000,1.515
10,mlp.gate_proj,0.0002172222,0.05000,2.220
10,mlp.up_proj,0.0001513125,0.05000,2.218
10,mlp.down_proj,0.0000166309,0.05000,4.037
11,self_attn.k_proj,0.0000055936,0.05000,4.616
11,self_attn.q_proj,0.0000206081,0.05000,4.677
11,self_attn.v_proj,0.0000057883,0.05000,4.701
11,self_attn.o_proj,0.0000043435,0.05000,1.481
11,mlp.up_proj,0.0001400455,0.05000,2.178
11,mlp.gate_proj,0.0001772193,0.05000,2.182
11,mlp.down_proj,0.0000154659,0.05000,4.043
12,self_attn.k_proj,0.0000063814,0.05000,4.536
12,self_attn.q_proj,0.0000242027,0.05000,4.576
12,self_attn.v_proj,0.0000068583,0.05000,4.605
12,self_attn.o_proj,0.0000050332,0.05000,1.562
12,mlp.up_proj,0.0001370627,0.05000,2.161
12,mlp.gate_proj,0.0001573160,0.05000,2.180
12,mlp.down_proj,0.0000155309,0.05000,3.970
13,self_attn.v_proj,0.0000047044,0.05000,4.507
13,self_attn.q_proj,0.0000184363,0.05000,4.572
13,self_attn.k_proj,0.0000048823,0.05000,4.595
13,self_attn.o_proj,0.0000040465,0.05000,1.519
13,mlp.up_proj,0.0001393028,0.05000,2.214
13,mlp.gate_proj,0.0001458737,0.05000,2.229
13,mlp.down_proj,0.0000165562,0.05000,3.984
14,self_attn.k_proj,0.0000078433,0.05000,4.434
14,self_attn.v_proj,0.0000083064,0.05000,4.512
14,self_attn.q_proj,0.0000305769,0.05000,4.529
14,self_attn.o_proj,0.0000068696,0.05000,1.534
14,mlp.gate_proj,0.0001425182,0.05000,2.143
14,mlp.up_proj,0.0001369667,0.05000,2.165
14,mlp.down_proj,0.0000144339,0.05000,3.994
15,self_attn.k_proj,0.0000078901,0.05000,4.457
15,self_attn.q_proj,0.0000304238,0.05000,4.517
15,self_attn.v_proj,0.0000075067,0.05000,4.547
15,self_attn.o_proj,0.0000057910,0.05000,1.549
15,mlp.gate_proj,0.0001314416,0.05000,2.075
15,mlp.up_proj,0.0001308323,0.05000,2.096
15,mlp.down_proj,0.0000141322,0.05000,4.025
16,self_attn.q_proj,0.0000527059,0.05000,4.588
16,self_attn.k_proj,0.0000129936,0.05000,4.645
16,self_attn.v_proj,0.0000147963,0.05000,4.672
16,self_attn.o_proj,0.0000062181,0.05000,1.554
16,mlp.up_proj,0.0001370881,0.05000,2.170
16,mlp.gate_proj,0.0001460451,0.05000,2.173
16,mlp.down_proj,0.0001291258,0.05000,4.031
17,self_attn.k_proj,0.0000099961,0.05000,4.611
17,self_attn.v_proj,0.0000111945,0.05000,4.684
17,self_attn.q_proj,0.0000450757,0.05000,4.705
17,self_attn.o_proj,0.0000065814,0.05000,1.551
17,mlp.up_proj,0.0001229390,0.05000,2.229
17,mlp.gate_proj,0.0001291509,0.05000,2.260
17,mlp.down_proj,0.0000138228,0.05000,4.005
18,self_attn.q_proj,0.0000491217,0.05000,4.514
18,self_attn.k_proj,0.0000119304,0.05000,4.544
18,self_attn.v_proj,0.0000134876,0.05000,4.585
18,self_attn.o_proj,0.0000080063,0.05000,1.528
18,mlp.up_proj,0.0001347442,0.05000,2.151
18,mlp.gate_proj,0.0001388276,0.05000,2.173
18,mlp.down_proj,0.0000170619,0.05000,4.005
19,self_attn.k_proj,0.0000229575,0.05000,4.624
19,self_attn.q_proj,0.0000984122,0.05000,4.668
19,self_attn.v_proj,0.0000236798,0.05000,4.691
19,self_attn.o_proj,0.0000106329,0.05000,1.582
19,mlp.up_proj,0.0001514618,0.05000,2.286
19,mlp.gate_proj,0.0001546628,0.05000,2.302
19,mlp.down_proj,0.0000227354,0.05000,4.005
20,self_attn.q_proj,0.0000933378,0.05000,4.620
20,self_attn.v_proj,0.0000220575,0.05000,4.667
20,self_attn.k_proj,0.0000202215,0.05000,4.695
20,self_attn.o_proj,0.0000106457,0.05000,1.588
20,mlp.up_proj,0.0001666797,0.05000,2.134
20,mlp.gate_proj,0.0001662707,0.05000,2.132
20,mlp.down_proj,0.0000256278,0.05000,3.855
21,self_attn.q_proj,0.0001202196,0.05000,4.409
21,self_attn.k_proj,0.0000271532,0.05000,4.460
21,self_attn.v_proj,0.0000298576,0.05000,4.463
21,self_attn.o_proj,0.0000127776,0.05000,1.502
21,mlp.gate_proj,0.0002019959,0.05000,2.158
21,mlp.up_proj,0.0002010829,0.05000,2.176
21,mlp.down_proj,0.0000345897,0.05000,3.940
22,self_attn.k_proj,0.0000543410,0.05000,4.310
22,self_attn.v_proj,0.0000614177,0.05000,4.389
22,self_attn.q_proj,0.0002431058,0.05000,4.428
22,self_attn.o_proj,0.0000251777,0.05000,1.475
22,mlp.gate_proj,0.0002430665,0.05000,2.006
22,mlp.up_proj,0.0002305638,0.05000,2.024
22,mlp.down_proj,0.0000551142,0.05000,4.117
23,self_attn.k_proj,0.0000548529,0.05000,4.693
23,self_attn.q_proj,0.0002422710,0.05000,4.733
23,self_attn.v_proj,0.0000634447,0.05000,4.766
23,self_attn.o_proj,0.0000301494,0.05000,1.571
23,mlp.up_proj,0.0002738696,0.05000,2.283
23,mlp.gate_proj,0.0003045300,0.05000,2.310
23,mlp.down_proj,0.0000784298,0.05000,4.072
24,self_attn.v_proj,0.0001179669,0.05000,4.527
24,self_attn.k_proj,0.0000914282,0.05000,4.581
24,self_attn.q_proj,0.0003977864,0.05000,4.606
24,self_attn.o_proj,0.0000348926,0.05000,1.539
24,mlp.up_proj,0.0003071852,0.05000,2.174
24,mlp.gate_proj,0.0003468198,0.05000,2.199
24,mlp.down_proj,0.0000987934,0.05000,4.011
25,self_attn.k_proj,0.0000689053,0.05000,4.630
25,self_attn.q_proj,0.0002806590,0.05000,4.681
25,self_attn.v_proj,0.0000781839,0.05000,4.700
25,self_attn.o_proj,0.0000216056,0.05000,1.567
25,mlp.gate_proj,0.0004061265,0.05000,2.350
25,mlp.up_proj,0.0003546657,0.05000,2.372
25,mlp.down_proj,0.0001193259,0.05000,4.131
26,self_attn.q_proj,0.0004597529,0.05000,4.504
26,self_attn.v_proj,0.0001259534,0.05000,4.592
26,self_attn.k_proj,0.0001063583,0.05000,4.603
26,self_attn.o_proj,0.0000202876,0.05000,1.588
26,mlp.up_proj,0.0004417255,0.05000,2.244
26,mlp.gate_proj,0.0004897194,0.05000,2.276
26,mlp.down_proj,0.0001446874,0.05000,4.001
27,self_attn.v_proj,0.0001698991,0.05000,4.541
27,self_attn.q_proj,0.0005717810,0.05000,4.596
27,self_attn.k_proj,0.0001285193,0.05000,4.611
27,self_attn.o_proj,0.0000299984,0.05000,1.533
27,mlp.up_proj,0.0005171644,0.05000,2.243
27,mlp.gate_proj,0.0005543040,0.05000,2.272
27,mlp.down_proj,0.0002140129,0.05000,4.063
28,self_attn.q_proj,0.0006321518,0.05000,4.605
28,self_attn.v_proj,0.0001818466,0.05000,4.617
28,self_attn.k_proj,0.0001574352,0.05000,4.603
28,self_attn.o_proj,0.0000483718,0.05000,1.539
28,mlp.gate_proj,0.0006389360,0.05000,2.202
28,mlp.up_proj,0.0006213975,0.05000,2.220
28,mlp.down_proj,0.0003262202,0.05000,4.026
29,self_attn.k_proj,0.0003507194,0.05000,4.563
29,self_attn.v_proj,0.0004741120,0.05000,4.606
29,self_attn.q_proj,0.0015347515,0.05000,4.631
29,self_attn.o_proj,0.0000478133,0.05000,1.528
29,mlp.gate_proj,0.0007606724,0.05000,2.246
29,mlp.up_proj,0.0007786636,0.05000,2.274
29,mlp.down_proj,0.0003562392,0.05000,4.091
30,self_attn.k_proj,0.0004426675,0.05000,4.557
30,self_attn.q_proj,0.0017618013,0.05000,4.629
30,self_attn.v_proj,0.0005607962,0.05000,4.643
30,self_attn.o_proj,0.0000970244,0.05000,1.504
30,mlp.up_proj,0.0008522944,0.05000,2.130
30,mlp.gate_proj,0.0008062162,0.05000,2.169
30,mlp.down_proj,0.0004936067,0.05000,4.025
31,self_attn.v_proj,0.0008217572,0.05000,4.589
31,self_attn.k_proj,0.0005931148,0.05000,4.626
31,self_attn.q_proj,0.0022387475,0.05000,4.661
31,self_attn.o_proj,0.0000931515,0.05000,1.562
31,mlp.up_proj,0.0009072860,0.05000,2.213
31,mlp.gate_proj,0.0008159017,0.05000,2.236
31,mlp.down_proj,0.0006296246,0.05000,4.061
32,self_attn.v_proj,0.0012069424,0.05000,4.608
32,self_attn.k_proj,0.0007966917,0.05000,4.655
32,self_attn.q_proj,0.0032704534,0.05000,4.695
32,self_attn.o_proj,0.0001177748,0.05000,1.529
32,mlp.up_proj,0.0009638389,0.05000,2.166
32,mlp.gate_proj,0.0008459933,0.05000,2.195
32,mlp.down_proj,0.0007726722,0.05000,3.959
33,self_attn.q_proj,0.0068431394,0.05000,4.501
33,self_attn.v_proj,0.0026603756,0.05000,4.515
33,self_attn.k_proj,0.0013990668,0.05000,4.569
33,self_attn.o_proj,0.0001440813,0.05000,1.581
33,mlp.up_proj,0.0010475062,0.05000,2.215
33,mlp.gate_proj,0.0009084458,0.05000,2.241
33,mlp.down_proj,0.0009851406,0.05000,3.856
34,self_attn.k_proj,0.0012023171,0.05000,4.691
34,self_attn.q_proj,0.0053871334,0.05000,4.754
34,self_attn.v_proj,0.0020066263,0.05000,4.756
34,self_attn.o_proj,0.0002732787,0.05000,1.535
34,mlp.gate_proj,0.0010677983,0.05000,2.184
34,mlp.up_proj,0.0011509700,0.05000,2.210
34,mlp.down_proj,0.0011212979,0.05000,4.006
35,self_attn.v_proj,0.0008843137,0.05000,4.681
35,self_attn.q_proj,0.0025782813,0.05000,4.733
35,self_attn.k_proj,0.0006658983,0.05000,4.775
35,self_attn.o_proj,0.0003583769,0.05000,1.576
35,mlp.gate_proj,0.0016682997,0.05000,2.171
35,mlp.up_proj,0.0017624593,0.05000,2.190
35,mlp.down_proj,0.0016827106,0.05000,4.071
|