File size: 9,067 Bytes
6611689 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.0000833145,0.05000,5.504
0,self_attn.v_proj,0.0000048262,0.05000,5.610
0,self_attn.q_proj,0.0001627265,0.05000,5.606
0,self_attn.o_proj,0.0000002214,0.05000,1.191
0,mlp.gate_proj,0.0000997544,0.05000,3.078
0,mlp.up_proj,0.0000880482,0.05000,3.099
0,mlp.down_proj,0.0000010819,0.05000,3.332
1,self_attn.q_proj,0.0002339984,0.05000,5.468
1,self_attn.k_proj,0.0001366074,0.05000,5.615
1,self_attn.v_proj,0.0000161811,0.05000,5.641
1,self_attn.o_proj,0.0000006392,0.05000,1.165
1,mlp.gate_proj,0.0001622974,0.05000,2.888
1,mlp.up_proj,0.0001428511,0.05000,2.918
1,mlp.down_proj,0.0003240824,0.05000,3.307
2,self_attn.q_proj,0.0009462966,0.05000,5.619
2,self_attn.k_proj,0.0005598217,0.05000,5.643
2,self_attn.v_proj,0.0000587609,0.05000,5.671
2,self_attn.o_proj,0.0000006137,0.05000,1.139
2,mlp.up_proj,0.0002262556,0.05000,2.879
2,mlp.gate_proj,0.0002659620,0.05000,2.937
2,mlp.down_proj,0.0000028477,0.05000,2.979
3,self_attn.q_proj,0.0006456479,0.05000,5.110
3,self_attn.v_proj,0.0000623240,0.05000,5.181
3,self_attn.k_proj,0.0003549168,0.05000,5.208
3,self_attn.o_proj,0.0000012870,0.05000,1.070
3,mlp.up_proj,0.0002929948,0.05000,2.290
3,mlp.gate_proj,0.0003876079,0.05000,2.322
3,mlp.down_proj,0.0000042261,0.05000,3.058
4,self_attn.v_proj,0.0000641730,0.05000,5.203
4,self_attn.q_proj,0.0006326817,0.05000,5.248
4,self_attn.k_proj,0.0003315510,0.05000,5.274
4,self_attn.o_proj,0.0000023387,0.05000,1.078
4,mlp.gate_proj,0.0005043794,0.05000,2.391
4,mlp.up_proj,0.0003418379,0.05000,2.413
4,mlp.down_proj,0.0000061632,0.05000,3.072
5,self_attn.k_proj,0.0005265745,0.05000,5.141
5,self_attn.v_proj,0.0000638105,0.05000,5.204
5,self_attn.q_proj,0.0008782418,0.05000,5.240
5,self_attn.o_proj,0.0000025126,0.05000,1.060
5,mlp.up_proj,0.0003865409,0.05000,2.458
5,mlp.gate_proj,0.0005401021,0.05000,2.486
5,mlp.down_proj,0.0000082887,0.05000,3.048
6,self_attn.v_proj,0.0000612041,0.05000,5.136
6,self_attn.k_proj,0.0003914881,0.05000,5.177
6,self_attn.q_proj,0.0007378610,0.05000,5.211
6,self_attn.o_proj,0.0000043394,0.05000,1.034
6,mlp.gate_proj,0.0005627311,0.05000,2.457
6,mlp.up_proj,0.0004075962,0.05000,2.475
6,mlp.down_proj,0.0000099089,0.05000,2.958
7,self_attn.k_proj,0.0003767969,0.05000,5.226
7,self_attn.v_proj,0.0000546954,0.05000,5.279
7,self_attn.q_proj,0.0006362990,0.05000,5.295
7,self_attn.o_proj,0.0000061320,0.05000,1.056
7,mlp.up_proj,0.0004317052,0.05000,2.434
7,mlp.gate_proj,0.0005475797,0.05000,2.443
7,mlp.down_proj,0.0000111637,0.05000,3.088
8,self_attn.k_proj,0.0004685118,0.05000,5.168
8,self_attn.v_proj,0.0000670339,0.05000,5.199
8,self_attn.q_proj,0.0007847853,0.05000,5.229
8,self_attn.o_proj,0.0000080611,0.05000,1.108
8,mlp.up_proj,0.0004457112,0.05000,2.385
8,mlp.gate_proj,0.0005756153,0.05000,2.414
8,mlp.down_proj,0.0000119709,0.05000,3.063
9,self_attn.q_proj,0.0007281643,0.05000,5.169
9,self_attn.v_proj,0.0000788263,0.05000,5.243
9,self_attn.k_proj,0.0004247850,0.05000,5.248
9,self_attn.o_proj,0.0000077604,0.05000,1.016
9,mlp.gate_proj,0.0005563830,0.05000,2.452
9,mlp.up_proj,0.0004468315,0.05000,2.474
9,mlp.down_proj,0.0000119611,0.05000,2.982
10,self_attn.v_proj,0.0000621950,0.05000,5.226
10,self_attn.k_proj,0.0004504600,0.05000,5.274
10,self_attn.q_proj,0.0007390235,0.05000,5.337
10,self_attn.o_proj,0.0000074142,0.05000,1.079
10,mlp.gate_proj,0.0005601441,0.05000,2.303
10,mlp.up_proj,0.0004797459,0.05000,2.322
10,mlp.down_proj,0.0000133788,0.05000,3.071
11,self_attn.v_proj,0.0000770151,0.05000,5.048
11,self_attn.k_proj,0.0003612847,0.05000,5.134
11,self_attn.q_proj,0.0006474613,0.05000,5.161
11,self_attn.o_proj,0.0000095606,0.05000,1.116
11,mlp.up_proj,0.0005172904,0.05000,2.391
11,mlp.gate_proj,0.0005825480,0.05000,2.425
11,mlp.down_proj,0.0000147894,0.05000,3.155
12,self_attn.k_proj,0.0005030657,0.05000,5.040
12,self_attn.q_proj,0.0008600825,0.05000,5.172
12,self_attn.v_proj,0.0000796377,0.05000,5.186
12,self_attn.o_proj,0.0000104103,0.05000,1.071
12,mlp.up_proj,0.0005417673,0.05000,2.423
12,mlp.gate_proj,0.0006048538,0.05000,2.449
12,mlp.down_proj,0.0000159788,0.05000,3.090
13,self_attn.k_proj,0.0005679255,0.05000,5.098
13,self_attn.q_proj,0.0009026564,0.05000,5.188
13,self_attn.v_proj,0.0000920754,0.05000,5.205
13,self_attn.o_proj,0.0000111667,0.05000,1.057
13,mlp.up_proj,0.0005947397,0.05000,2.364
13,mlp.gate_proj,0.0007042694,0.05000,2.385
13,mlp.down_proj,0.0000207118,0.05000,3.023
14,self_attn.v_proj,0.0001053973,0.05000,5.222
14,self_attn.k_proj,0.0004498990,0.05000,5.278
14,self_attn.q_proj,0.0009584807,0.05000,5.306
14,self_attn.o_proj,0.0000123116,0.05000,1.090
14,mlp.up_proj,0.0006279950,0.05000,2.357
14,mlp.gate_proj,0.0007503058,0.05000,2.383
14,mlp.down_proj,0.0000250014,0.05000,3.074
15,self_attn.k_proj,0.0004797868,0.05000,4.990
15,self_attn.v_proj,0.0001005991,0.05000,5.166
15,self_attn.q_proj,0.0009365002,0.05000,5.185
15,self_attn.o_proj,0.0000076168,0.05000,1.067
15,mlp.up_proj,0.0006121564,0.05000,2.409
15,mlp.gate_proj,0.0007879107,0.05000,2.440
15,mlp.down_proj,0.0000245487,0.05000,3.107
16,self_attn.v_proj,0.0001098983,0.05000,5.208
16,self_attn.q_proj,0.0009610252,0.05000,5.322
16,self_attn.k_proj,0.0005322082,0.05000,5.361
16,self_attn.o_proj,0.0000051471,0.05000,1.175
16,mlp.up_proj,0.0005994866,0.05000,2.891
16,mlp.gate_proj,0.0007955586,0.05000,2.940
16,mlp.down_proj,0.0000232563,0.05000,3.234
17,self_attn.v_proj,0.0001056392,0.05000,5.383
17,self_attn.k_proj,0.0004881229,0.05000,5.419
17,self_attn.q_proj,0.0009143897,0.05000,5.493
17,self_attn.o_proj,0.0000044561,0.05000,1.173
17,mlp.gate_proj,0.0008321888,0.05000,2.826
17,mlp.up_proj,0.0006171612,0.05000,2.839
17,mlp.down_proj,0.0000246102,0.05000,3.241
18,self_attn.v_proj,0.0001294144,0.05000,5.402
18,self_attn.q_proj,0.0010036130,0.05000,5.491
18,self_attn.k_proj,0.0005490085,0.05000,5.539
18,self_attn.o_proj,0.0000047686,0.05000,1.202
18,mlp.up_proj,0.0006625156,0.05000,2.816
18,mlp.gate_proj,0.0008736592,0.05000,2.858
18,mlp.down_proj,0.0000259963,0.05000,3.274
19,self_attn.q_proj,0.0009206464,0.05000,5.306
19,self_attn.v_proj,0.0001300041,0.05000,5.346
19,self_attn.k_proj,0.0005263201,0.05000,5.421
19,self_attn.o_proj,0.0000081053,0.05000,1.206
19,mlp.up_proj,0.0007115615,0.05000,2.476
19,mlp.gate_proj,0.0009267995,0.05000,2.501
19,mlp.down_proj,0.0000313765,0.05000,3.005
20,self_attn.k_proj,0.0005501762,0.05000,5.269
20,self_attn.q_proj,0.0009316968,0.05000,5.310
20,self_attn.v_proj,0.0001533229,0.05000,5.339
20,self_attn.o_proj,0.0000053971,0.05000,1.074
20,mlp.gate_proj,0.0008958201,0.05000,2.386
20,mlp.up_proj,0.0007214489,0.05000,2.403
20,mlp.down_proj,0.0000298560,0.05000,3.048
21,self_attn.k_proj,0.0005322746,0.05000,5.115
21,self_attn.v_proj,0.0001965262,0.05000,5.151
21,self_attn.q_proj,0.0009163225,0.05000,5.171
21,self_attn.o_proj,0.0000058034,0.05000,1.071
21,mlp.up_proj,0.0007544485,0.05000,2.394
21,mlp.gate_proj,0.0009466076,0.05000,2.413
21,mlp.down_proj,0.0000325444,0.05000,2.984
22,self_attn.v_proj,0.0001977625,0.05000,5.113
22,self_attn.q_proj,0.0009122455,0.05000,5.193
22,self_attn.k_proj,0.0005100145,0.05000,5.229
22,self_attn.o_proj,0.0000058460,0.05000,1.057
22,mlp.gate_proj,0.0010337803,0.05000,2.355
22,mlp.up_proj,0.0008206790,0.05000,2.376
22,mlp.down_proj,0.0000370742,0.05000,2.997
23,self_attn.v_proj,0.0001945850,0.05000,5.120
23,self_attn.k_proj,0.0005421275,0.05000,5.187
23,self_attn.q_proj,0.0009014102,0.05000,5.207
23,self_attn.o_proj,0.0000118679,0.05000,1.071
23,mlp.gate_proj,0.0011874684,0.05000,2.391
23,mlp.up_proj,0.0009013988,0.05000,2.412
23,mlp.down_proj,0.0000456437,0.05000,3.112
24,self_attn.k_proj,0.0006013965,0.05000,5.117
24,self_attn.q_proj,0.0009966169,0.05000,5.178
24,self_attn.v_proj,0.0002814000,0.05000,5.192
24,self_attn.o_proj,0.0000167604,0.05000,1.067
24,mlp.up_proj,0.0009939129,0.05000,2.419
24,mlp.gate_proj,0.0013279702,0.05000,2.446
24,mlp.down_proj,0.0000607813,0.05000,3.056
25,self_attn.k_proj,0.0004979556,0.05000,5.164
25,self_attn.q_proj,0.0009840556,0.05000,5.252
25,self_attn.v_proj,0.0002535410,0.05000,5.264
25,self_attn.o_proj,0.0000184899,0.05000,1.043
25,mlp.gate_proj,0.0014792334,0.05000,2.438
25,mlp.up_proj,0.0011075135,0.05000,2.447
25,mlp.down_proj,0.0000877130,0.05000,3.067
26,self_attn.v_proj,0.0003436589,0.05000,5.014
26,self_attn.q_proj,0.0008804976,0.05000,5.161
26,self_attn.k_proj,0.0005433848,0.05000,5.189
26,self_attn.o_proj,0.0000359726,0.05000,1.044
26,mlp.up_proj,0.0011477621,0.05000,2.349
26,mlp.gate_proj,0.0015504545,0.05000,2.368
26,mlp.down_proj,0.0001262205,0.05000,3.025
27,self_attn.v_proj,0.0002239405,0.05000,5.051
27,self_attn.k_proj,0.0003883892,0.05000,5.105
27,self_attn.q_proj,0.0007127493,0.05000,5.130
27,self_attn.o_proj,0.0000817960,0.05000,1.054
27,mlp.up_proj,0.0012877010,0.05000,2.463
27,mlp.gate_proj,0.0015451877,0.05000,2.483
27,mlp.down_proj,0.0004653256,0.05000,3.056
|