File size: 11,667 Bytes
c72312f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
layer,module,loss,damp,time
0,self_attn.k_proj,0.0000000529,0.05000,5.639
0,self_attn.v_proj,0.0000000459,0.05000,5.749
0,self_attn.q_proj,0.0000001946,0.05000,5.781
0,self_attn.o_proj,0.0000001205,0.05000,1.680
0,mlp.gate_proj,0.0000119312,0.05000,2.209
0,mlp.up_proj,0.0000104520,0.05000,2.237
0,mlp.down_proj,0.0000016241,0.05000,3.944
1,self_attn.q_proj,0.0000003163,0.05000,5.104
1,self_attn.v_proj,0.0000000882,0.05000,5.167
1,self_attn.k_proj,0.0000000853,0.05000,5.201
1,self_attn.o_proj,0.0000001642,0.05000,1.658
1,mlp.up_proj,0.0001817668,0.05000,2.850
1,mlp.gate_proj,0.0004014041,0.05000,2.881
1,mlp.down_proj,0.0000017688,0.05000,4.370
2,self_attn.q_proj,0.0000008970,0.05000,5.286
2,self_attn.k_proj,0.0000002566,0.05000,5.321
2,self_attn.v_proj,0.0000002510,0.05000,5.343
2,self_attn.o_proj,0.0000002251,0.05000,1.713
2,mlp.gate_proj,0.0006498467,0.05000,2.413
2,mlp.up_proj,0.0005177948,0.05000,2.438
2,mlp.down_proj,0.0000012732,0.05000,4.137
3,self_attn.q_proj,0.0000017194,0.05000,4.685
3,self_attn.k_proj,0.0000004413,0.05000,4.758
3,self_attn.v_proj,0.0000004548,0.05000,4.772
3,self_attn.o_proj,0.0000003429,0.05000,1.565
3,mlp.gate_proj,0.0006881107,0.05000,2.288
3,mlp.up_proj,0.0003561646,0.05000,2.318
3,mlp.down_proj,0.0000036292,0.05000,4.141
4,self_attn.v_proj,0.0000008922,0.05000,4.747
4,self_attn.q_proj,0.0000032643,0.05000,4.819
4,self_attn.k_proj,0.0000008853,0.05000,4.835
4,self_attn.o_proj,0.0000005458,0.05000,1.590
4,mlp.gate_proj,0.0005724557,0.05000,2.200
4,mlp.up_proj,0.0002293439,0.05000,2.225
4,mlp.down_proj,0.0000055330,0.05000,4.094
5,self_attn.q_proj,0.0000035649,0.05000,4.698
5,self_attn.v_proj,0.0000009740,0.05000,4.701
5,self_attn.k_proj,0.0000009058,0.05000,4.750
5,self_attn.o_proj,0.0000009772,0.05000,1.573
5,mlp.gate_proj,0.0002079280,0.05000,2.225
5,mlp.up_proj,0.0001013186,0.05000,2.242
5,mlp.down_proj,0.0000081773,0.05000,4.052
6,self_attn.v_proj,0.0000020665,0.05000,4.633
6,self_attn.k_proj,0.0000018139,0.05000,4.651
6,self_attn.q_proj,0.0000076765,0.05000,4.707
6,self_attn.o_proj,0.0000023579,0.05000,1.543
6,mlp.gate_proj,0.0002195186,0.05000,2.175
6,mlp.up_proj,0.0001256842,0.05000,2.209
6,mlp.down_proj,0.0001805787,0.05000,4.051
7,self_attn.k_proj,0.0000041912,0.05000,4.737
7,self_attn.q_proj,0.0000155375,0.05000,4.792
7,self_attn.v_proj,0.0000043051,0.05000,4.791
7,self_attn.o_proj,0.0000028798,0.05000,1.601
7,mlp.up_proj,0.0001527545,0.05000,2.254
7,mlp.gate_proj,0.0002531733,0.05000,2.284
7,mlp.down_proj,0.0000135267,0.05000,4.097
8,self_attn.k_proj,0.0000061028,0.05000,4.791
8,self_attn.v_proj,0.0000066735,0.05000,4.804
8,self_attn.q_proj,0.0000235807,0.05000,4.855
8,self_attn.o_proj,0.0000041072,0.05000,1.567
8,mlp.up_proj,0.0001451299,0.05000,2.221
8,mlp.gate_proj,0.0001770070,0.05000,2.239
8,mlp.down_proj,0.0000203039,0.05000,4.053
9,self_attn.q_proj,0.0000290558,0.05000,4.707
9,self_attn.v_proj,0.0000080488,0.05000,4.772
9,self_attn.k_proj,0.0000081565,0.05000,4.789
9,self_attn.o_proj,0.0000045795,0.05000,1.552
9,mlp.up_proj,0.0001810021,0.05000,2.156
9,mlp.gate_proj,0.0002832804,0.05000,2.183
9,mlp.down_proj,0.0000204025,0.05000,4.116
10,self_attn.q_proj,0.0000428730,0.05000,4.681
10,self_attn.k_proj,0.0000110682,0.05000,4.728
10,self_attn.v_proj,0.0000127939,0.05000,4.753
10,self_attn.o_proj,0.0000070710,0.05000,1.515
10,mlp.gate_proj,0.0002172222,0.05000,2.220
10,mlp.up_proj,0.0001513125,0.05000,2.218
10,mlp.down_proj,0.0000166309,0.05000,4.037
11,self_attn.k_proj,0.0000055936,0.05000,4.616
11,self_attn.q_proj,0.0000206081,0.05000,4.677
11,self_attn.v_proj,0.0000057883,0.05000,4.701
11,self_attn.o_proj,0.0000043435,0.05000,1.481
11,mlp.up_proj,0.0001400455,0.05000,2.178
11,mlp.gate_proj,0.0001772193,0.05000,2.182
11,mlp.down_proj,0.0000154659,0.05000,4.043
12,self_attn.k_proj,0.0000063814,0.05000,4.536
12,self_attn.q_proj,0.0000242027,0.05000,4.576
12,self_attn.v_proj,0.0000068583,0.05000,4.605
12,self_attn.o_proj,0.0000050332,0.05000,1.562
12,mlp.up_proj,0.0001370627,0.05000,2.161
12,mlp.gate_proj,0.0001573160,0.05000,2.180
12,mlp.down_proj,0.0000155309,0.05000,3.970
13,self_attn.v_proj,0.0000047044,0.05000,4.507
13,self_attn.q_proj,0.0000184363,0.05000,4.572
13,self_attn.k_proj,0.0000048823,0.05000,4.595
13,self_attn.o_proj,0.0000040465,0.05000,1.519
13,mlp.up_proj,0.0001393028,0.05000,2.214
13,mlp.gate_proj,0.0001458737,0.05000,2.229
13,mlp.down_proj,0.0000165562,0.05000,3.984
14,self_attn.k_proj,0.0000078433,0.05000,4.434
14,self_attn.v_proj,0.0000083064,0.05000,4.512
14,self_attn.q_proj,0.0000305769,0.05000,4.529
14,self_attn.o_proj,0.0000068696,0.05000,1.534
14,mlp.gate_proj,0.0001425182,0.05000,2.143
14,mlp.up_proj,0.0001369667,0.05000,2.165
14,mlp.down_proj,0.0000144339,0.05000,3.994
15,self_attn.k_proj,0.0000078901,0.05000,4.457
15,self_attn.q_proj,0.0000304238,0.05000,4.517
15,self_attn.v_proj,0.0000075067,0.05000,4.547
15,self_attn.o_proj,0.0000057910,0.05000,1.549
15,mlp.gate_proj,0.0001314416,0.05000,2.075
15,mlp.up_proj,0.0001308323,0.05000,2.096
15,mlp.down_proj,0.0000141322,0.05000,4.025
16,self_attn.q_proj,0.0000527059,0.05000,4.588
16,self_attn.k_proj,0.0000129936,0.05000,4.645
16,self_attn.v_proj,0.0000147963,0.05000,4.672
16,self_attn.o_proj,0.0000062181,0.05000,1.554
16,mlp.up_proj,0.0001370881,0.05000,2.170
16,mlp.gate_proj,0.0001460451,0.05000,2.173
16,mlp.down_proj,0.0001291258,0.05000,4.031
17,self_attn.k_proj,0.0000099961,0.05000,4.611
17,self_attn.v_proj,0.0000111945,0.05000,4.684
17,self_attn.q_proj,0.0000450757,0.05000,4.705
17,self_attn.o_proj,0.0000065814,0.05000,1.551
17,mlp.up_proj,0.0001229390,0.05000,2.229
17,mlp.gate_proj,0.0001291509,0.05000,2.260
17,mlp.down_proj,0.0000138228,0.05000,4.005
18,self_attn.q_proj,0.0000491217,0.05000,4.514
18,self_attn.k_proj,0.0000119304,0.05000,4.544
18,self_attn.v_proj,0.0000134876,0.05000,4.585
18,self_attn.o_proj,0.0000080063,0.05000,1.528
18,mlp.up_proj,0.0001347442,0.05000,2.151
18,mlp.gate_proj,0.0001388276,0.05000,2.173
18,mlp.down_proj,0.0000170619,0.05000,4.005
19,self_attn.k_proj,0.0000229575,0.05000,4.624
19,self_attn.q_proj,0.0000984122,0.05000,4.668
19,self_attn.v_proj,0.0000236798,0.05000,4.691
19,self_attn.o_proj,0.0000106329,0.05000,1.582
19,mlp.up_proj,0.0001514618,0.05000,2.286
19,mlp.gate_proj,0.0001546628,0.05000,2.302
19,mlp.down_proj,0.0000227354,0.05000,4.005
20,self_attn.q_proj,0.0000933378,0.05000,4.620
20,self_attn.v_proj,0.0000220575,0.05000,4.667
20,self_attn.k_proj,0.0000202215,0.05000,4.695
20,self_attn.o_proj,0.0000106457,0.05000,1.588
20,mlp.up_proj,0.0001666797,0.05000,2.134
20,mlp.gate_proj,0.0001662707,0.05000,2.132
20,mlp.down_proj,0.0000256278,0.05000,3.855
21,self_attn.q_proj,0.0001202196,0.05000,4.409
21,self_attn.k_proj,0.0000271532,0.05000,4.460
21,self_attn.v_proj,0.0000298576,0.05000,4.463
21,self_attn.o_proj,0.0000127776,0.05000,1.502
21,mlp.gate_proj,0.0002019959,0.05000,2.158
21,mlp.up_proj,0.0002010829,0.05000,2.176
21,mlp.down_proj,0.0000345897,0.05000,3.940
22,self_attn.k_proj,0.0000543410,0.05000,4.310
22,self_attn.v_proj,0.0000614177,0.05000,4.389
22,self_attn.q_proj,0.0002431058,0.05000,4.428
22,self_attn.o_proj,0.0000251777,0.05000,1.475
22,mlp.gate_proj,0.0002430665,0.05000,2.006
22,mlp.up_proj,0.0002305638,0.05000,2.024
22,mlp.down_proj,0.0000551142,0.05000,4.117
23,self_attn.k_proj,0.0000548529,0.05000,4.693
23,self_attn.q_proj,0.0002422710,0.05000,4.733
23,self_attn.v_proj,0.0000634447,0.05000,4.766
23,self_attn.o_proj,0.0000301494,0.05000,1.571
23,mlp.up_proj,0.0002738696,0.05000,2.283
23,mlp.gate_proj,0.0003045300,0.05000,2.310
23,mlp.down_proj,0.0000784298,0.05000,4.072
24,self_attn.v_proj,0.0001179669,0.05000,4.527
24,self_attn.k_proj,0.0000914282,0.05000,4.581
24,self_attn.q_proj,0.0003977864,0.05000,4.606
24,self_attn.o_proj,0.0000348926,0.05000,1.539
24,mlp.up_proj,0.0003071852,0.05000,2.174
24,mlp.gate_proj,0.0003468198,0.05000,2.199
24,mlp.down_proj,0.0000987934,0.05000,4.011
25,self_attn.k_proj,0.0000689053,0.05000,4.630
25,self_attn.q_proj,0.0002806590,0.05000,4.681
25,self_attn.v_proj,0.0000781839,0.05000,4.700
25,self_attn.o_proj,0.0000216056,0.05000,1.567
25,mlp.gate_proj,0.0004061265,0.05000,2.350
25,mlp.up_proj,0.0003546657,0.05000,2.372
25,mlp.down_proj,0.0001193259,0.05000,4.131
26,self_attn.q_proj,0.0004597529,0.05000,4.504
26,self_attn.v_proj,0.0001259534,0.05000,4.592
26,self_attn.k_proj,0.0001063583,0.05000,4.603
26,self_attn.o_proj,0.0000202876,0.05000,1.588
26,mlp.up_proj,0.0004417255,0.05000,2.244
26,mlp.gate_proj,0.0004897194,0.05000,2.276
26,mlp.down_proj,0.0001446874,0.05000,4.001
27,self_attn.v_proj,0.0001698991,0.05000,4.541
27,self_attn.q_proj,0.0005717810,0.05000,4.596
27,self_attn.k_proj,0.0001285193,0.05000,4.611
27,self_attn.o_proj,0.0000299984,0.05000,1.533
27,mlp.up_proj,0.0005171644,0.05000,2.243
27,mlp.gate_proj,0.0005543040,0.05000,2.272
27,mlp.down_proj,0.0002140129,0.05000,4.063
28,self_attn.q_proj,0.0006321518,0.05000,4.605
28,self_attn.v_proj,0.0001818466,0.05000,4.617
28,self_attn.k_proj,0.0001574352,0.05000,4.603
28,self_attn.o_proj,0.0000483718,0.05000,1.539
28,mlp.gate_proj,0.0006389360,0.05000,2.202
28,mlp.up_proj,0.0006213975,0.05000,2.220
28,mlp.down_proj,0.0003262202,0.05000,4.026
29,self_attn.k_proj,0.0003507194,0.05000,4.563
29,self_attn.v_proj,0.0004741120,0.05000,4.606
29,self_attn.q_proj,0.0015347515,0.05000,4.631
29,self_attn.o_proj,0.0000478133,0.05000,1.528
29,mlp.gate_proj,0.0007606724,0.05000,2.246
29,mlp.up_proj,0.0007786636,0.05000,2.274
29,mlp.down_proj,0.0003562392,0.05000,4.091
30,self_attn.k_proj,0.0004426675,0.05000,4.557
30,self_attn.q_proj,0.0017618013,0.05000,4.629
30,self_attn.v_proj,0.0005607962,0.05000,4.643
30,self_attn.o_proj,0.0000970244,0.05000,1.504
30,mlp.up_proj,0.0008522944,0.05000,2.130
30,mlp.gate_proj,0.0008062162,0.05000,2.169
30,mlp.down_proj,0.0004936067,0.05000,4.025
31,self_attn.v_proj,0.0008217572,0.05000,4.589
31,self_attn.k_proj,0.0005931148,0.05000,4.626
31,self_attn.q_proj,0.0022387475,0.05000,4.661
31,self_attn.o_proj,0.0000931515,0.05000,1.562
31,mlp.up_proj,0.0009072860,0.05000,2.213
31,mlp.gate_proj,0.0008159017,0.05000,2.236
31,mlp.down_proj,0.0006296246,0.05000,4.061
32,self_attn.v_proj,0.0012069424,0.05000,4.608
32,self_attn.k_proj,0.0007966917,0.05000,4.655
32,self_attn.q_proj,0.0032704534,0.05000,4.695
32,self_attn.o_proj,0.0001177748,0.05000,1.529
32,mlp.up_proj,0.0009638389,0.05000,2.166
32,mlp.gate_proj,0.0008459933,0.05000,2.195
32,mlp.down_proj,0.0007726722,0.05000,3.959
33,self_attn.q_proj,0.0068431394,0.05000,4.501
33,self_attn.v_proj,0.0026603756,0.05000,4.515
33,self_attn.k_proj,0.0013990668,0.05000,4.569
33,self_attn.o_proj,0.0001440813,0.05000,1.581
33,mlp.up_proj,0.0010475062,0.05000,2.215
33,mlp.gate_proj,0.0009084458,0.05000,2.241
33,mlp.down_proj,0.0009851406,0.05000,3.856
34,self_attn.k_proj,0.0012023171,0.05000,4.691
34,self_attn.q_proj,0.0053871334,0.05000,4.754
34,self_attn.v_proj,0.0020066263,0.05000,4.756
34,self_attn.o_proj,0.0002732787,0.05000,1.535
34,mlp.gate_proj,0.0010677983,0.05000,2.184
34,mlp.up_proj,0.0011509700,0.05000,2.210
34,mlp.down_proj,0.0011212979,0.05000,4.006
35,self_attn.v_proj,0.0008843137,0.05000,4.681
35,self_attn.q_proj,0.0025782813,0.05000,4.733
35,self_attn.k_proj,0.0006658983,0.05000,4.775
35,self_attn.o_proj,0.0003583769,0.05000,1.576
35,mlp.gate_proj,0.0016682997,0.05000,2.171
35,mlp.up_proj,0.0017624593,0.05000,2.190
35,mlp.down_proj,0.0016827106,0.05000,4.071