File size: 11,667 Bytes
995e802
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
layer,module,loss,samples,damp,time
0,self_attn.q_proj,0.0000001497,0.05000,4.382
0,self_attn.k_proj,0.0000000404,0.05000,4.441
0,self_attn.v_proj,0.0000000348,0.05000,4.350
0,self_attn.o_proj,0.0000000850,0.05000,1.280
0,mlp.gate_proj,0.0000102160,0.05000,1.724
0,mlp.up_proj,0.0000089166,0.05000,1.743
0,mlp.down_proj,0.0000010669,0.05000,3.375
1,self_attn.q_proj,0.0000002582,0.05000,4.558
1,self_attn.k_proj,0.0000000700,0.05000,4.591
1,self_attn.v_proj,0.0000000709,0.05000,4.631
1,self_attn.o_proj,0.0000001153,0.05000,1.476
1,mlp.gate_proj,0.0003654537,0.05000,2.372
1,mlp.up_proj,0.0001678912,0.05000,2.411
1,mlp.down_proj,0.0000015869,0.05000,3.571
2,self_attn.k_proj,0.0000002100,0.05000,4.218
2,self_attn.v_proj,0.0000001973,0.05000,4.249
2,self_attn.q_proj,0.0000007267,0.05000,4.284
2,self_attn.o_proj,0.0000001442,0.05000,1.321
2,mlp.gate_proj,0.0006378509,0.05000,1.795
2,mlp.up_proj,0.0005036621,0.05000,1.815
2,mlp.down_proj,0.0000010006,0.05000,3.541
3,self_attn.v_proj,0.0000003527,0.05000,3.926
3,self_attn.q_proj,0.0000013755,0.05000,4.000
3,self_attn.k_proj,0.0000003573,0.05000,4.022
3,self_attn.o_proj,0.0000002609,0.05000,1.337
3,mlp.gate_proj,0.0005461829,0.05000,1.862
3,mlp.up_proj,0.0002773691,0.05000,1.880
3,mlp.down_proj,0.0000025155,0.05000,3.506
4,self_attn.v_proj,0.0000006756,0.05000,3.921
4,self_attn.k_proj,0.0000006994,0.05000,3.970
4,self_attn.q_proj,0.0000025318,0.05000,4.003
4,self_attn.o_proj,0.0000003630,0.05000,1.330
4,mlp.up_proj,0.0001704913,0.05000,1.772
4,mlp.gate_proj,0.0004582719,0.05000,1.796
4,mlp.down_proj,0.0000030722,0.05000,3.513
5,self_attn.q_proj,0.0000027408,0.05000,3.876
5,self_attn.v_proj,0.0000007342,0.05000,3.951
5,self_attn.k_proj,0.0000007074,0.05000,3.970
5,self_attn.o_proj,0.0000006741,0.05000,1.321
5,mlp.gate_proj,0.0001597727,0.05000,1.780
5,mlp.up_proj,0.0000717189,0.05000,1.806
5,mlp.down_proj,0.0000043840,0.05000,3.511
6,self_attn.k_proj,0.0000014229,0.05000,3.949
6,self_attn.q_proj,0.0000059482,0.05000,4.004
6,self_attn.v_proj,0.0000015715,0.05000,4.024
6,self_attn.o_proj,0.0000014801,0.05000,1.334
6,mlp.up_proj,0.0000913276,0.05000,1.890
6,mlp.gate_proj,0.0001743651,0.05000,1.909
6,mlp.down_proj,0.0000798332,0.05000,3.506
7,self_attn.k_proj,0.0000034002,0.05000,3.909
7,self_attn.q_proj,0.0000122388,0.05000,3.980
7,self_attn.v_proj,0.0000031944,0.05000,4.008
7,self_attn.o_proj,0.0000018697,0.05000,1.365
7,mlp.gate_proj,0.0001922215,0.05000,1.803
7,mlp.up_proj,0.0001066429,0.05000,1.820
7,mlp.down_proj,0.0000077401,0.05000,3.487
8,self_attn.k_proj,0.0000046752,0.05000,3.969
8,self_attn.v_proj,0.0000047731,0.05000,4.012
8,self_attn.q_proj,0.0000178354,0.05000,4.034
8,self_attn.o_proj,0.0000024056,0.05000,1.357
8,mlp.gate_proj,0.0001238246,0.05000,1.818
8,mlp.up_proj,0.0000997321,0.05000,1.841
8,mlp.down_proj,0.0000107304,0.05000,3.535
9,self_attn.k_proj,0.0000066289,0.05000,3.922
9,self_attn.v_proj,0.0000057406,0.05000,3.985
9,self_attn.q_proj,0.0000228142,0.05000,3.999
9,self_attn.o_proj,0.0000030817,0.05000,1.339
9,mlp.gate_proj,0.0001988376,0.05000,1.867
9,mlp.up_proj,0.0001221854,0.05000,1.890
9,mlp.down_proj,0.0000100834,0.05000,3.498
10,self_attn.v_proj,0.0000088171,0.05000,3.950
10,self_attn.q_proj,0.0000320740,0.05000,3.982
10,self_attn.k_proj,0.0000083633,0.05000,3.991
10,self_attn.o_proj,0.0000037997,0.05000,1.328
10,mlp.gate_proj,0.0001482455,0.05000,1.833
10,mlp.up_proj,0.0001002380,0.05000,1.847
10,mlp.down_proj,0.0000081155,0.05000,3.547
11,self_attn.q_proj,0.0000157204,0.05000,3.920
11,self_attn.k_proj,0.0000043992,0.05000,3.961
11,self_attn.v_proj,0.0000040354,0.05000,3.979
11,self_attn.o_proj,0.0000023009,0.05000,1.361
11,mlp.gate_proj,0.0001224862,0.05000,1.821
11,mlp.up_proj,0.0000944792,0.05000,1.843
11,mlp.down_proj,0.0000084048,0.05000,3.499
12,self_attn.k_proj,0.0000053237,0.05000,3.876
12,self_attn.q_proj,0.0000195351,0.05000,3.972
12,self_attn.v_proj,0.0000052086,0.05000,4.002
12,self_attn.o_proj,0.0000033271,0.05000,1.326
12,mlp.up_proj,0.0000952316,0.05000,1.945
12,mlp.gate_proj,0.0001117326,0.05000,1.964
12,mlp.down_proj,0.0000084220,0.05000,3.492
13,self_attn.k_proj,0.0000040553,0.05000,3.982
13,self_attn.v_proj,0.0000035740,0.05000,4.028
13,self_attn.q_proj,0.0000149411,0.05000,4.051
13,self_attn.o_proj,0.0000025440,0.05000,1.361
13,mlp.up_proj,0.0000980827,0.05000,1.869
13,mlp.gate_proj,0.0001053022,0.05000,1.887
13,mlp.down_proj,0.0000091428,0.05000,3.461
14,self_attn.v_proj,0.0000062012,0.05000,3.923
14,self_attn.q_proj,0.0000241531,0.05000,4.003
14,self_attn.k_proj,0.0000063827,0.05000,4.028
14,self_attn.o_proj,0.0000039574,0.05000,1.324
14,mlp.gate_proj,0.0001051134,0.05000,1.836
14,mlp.up_proj,0.0000985452,0.05000,1.853
14,mlp.down_proj,0.0000083144,0.05000,3.479
15,self_attn.k_proj,0.0000065399,0.05000,3.894
15,self_attn.q_proj,0.0000246789,0.05000,3.961
15,self_attn.v_proj,0.0000057165,0.05000,4.000
15,self_attn.o_proj,0.0000033902,0.05000,1.349
15,mlp.gate_proj,0.0000980051,0.05000,1.929
15,mlp.up_proj,0.0000952363,0.05000,1.953
15,mlp.down_proj,0.0000081789,0.05000,3.566
16,self_attn.v_proj,0.0000111526,0.05000,3.887
16,self_attn.k_proj,0.0000106205,0.05000,3.942
16,self_attn.q_proj,0.0000424247,0.05000,3.978
16,self_attn.o_proj,0.0000038802,0.05000,1.318
16,mlp.up_proj,0.0000966814,0.05000,1.790
16,mlp.gate_proj,0.0001058810,0.05000,1.820
16,mlp.down_proj,0.0000451322,0.05000,3.495
17,self_attn.q_proj,0.0000358253,0.05000,3.836
17,self_attn.k_proj,0.0000080998,0.05000,3.941
17,self_attn.v_proj,0.0000082012,0.05000,3.967
17,self_attn.o_proj,0.0000036289,0.05000,1.328
17,mlp.gate_proj,0.0000921126,0.05000,1.786
17,mlp.up_proj,0.0000849465,0.05000,1.782
17,mlp.down_proj,0.0000071025,0.05000,3.466
18,self_attn.v_proj,0.0000099717,0.05000,3.973
18,self_attn.k_proj,0.0000098200,0.05000,3.997
18,self_attn.q_proj,0.0000393778,0.05000,4.048
18,self_attn.o_proj,0.0000046202,0.05000,1.349
18,mlp.up_proj,0.0000947463,0.05000,1.908
18,mlp.gate_proj,0.0001002435,0.05000,1.925
18,mlp.down_proj,0.0000094912,0.05000,3.519
19,self_attn.v_proj,0.0000176808,0.05000,3.878
19,self_attn.q_proj,0.0000786607,0.05000,3.975
19,self_attn.k_proj,0.0000189547,0.05000,3.977
19,self_attn.o_proj,0.0000072878,0.05000,1.341
19,mlp.gate_proj,0.0001130672,0.05000,1.850
19,mlp.up_proj,0.0001079505,0.05000,1.874
19,mlp.down_proj,0.0000130190,0.05000,3.474
20,self_attn.v_proj,0.0000165799,0.05000,3.919
20,self_attn.k_proj,0.0000168190,0.05000,3.972
20,self_attn.q_proj,0.0000756451,0.05000,3.986
20,self_attn.o_proj,0.0000069506,0.05000,1.357
20,mlp.gate_proj,0.0001250732,0.05000,1.799
20,mlp.up_proj,0.0001220248,0.05000,1.819
20,mlp.down_proj,0.0000152876,0.05000,3.501
21,self_attn.v_proj,0.0000228874,0.05000,3.940
21,self_attn.q_proj,0.0000968350,0.05000,3.979
21,self_attn.k_proj,0.0000223913,0.05000,4.006
21,self_attn.o_proj,0.0000090330,0.05000,1.340
21,mlp.gate_proj,0.0001505156,0.05000,1.844
21,mlp.up_proj,0.0001460762,0.05000,1.855
21,mlp.down_proj,0.0000205126,0.05000,3.539
22,self_attn.v_proj,0.0000470790,0.05000,3.991
22,self_attn.q_proj,0.0002022357,0.05000,4.041
22,self_attn.k_proj,0.0000466329,0.05000,4.060
22,self_attn.o_proj,0.0000183918,0.05000,1.325
22,mlp.gate_proj,0.0001807079,0.05000,1.864
22,mlp.up_proj,0.0001656352,0.05000,1.887
22,mlp.down_proj,0.0000324256,0.05000,3.467
23,self_attn.k_proj,0.0000448676,0.05000,3.970
23,self_attn.v_proj,0.0000475164,0.05000,4.023
23,self_attn.q_proj,0.0001911028,0.05000,4.047
23,self_attn.o_proj,0.0000203201,0.05000,1.321
23,mlp.up_proj,0.0001968862,0.05000,1.826
23,mlp.gate_proj,0.0002260412,0.05000,1.850
23,mlp.down_proj,0.0000465797,0.05000,3.430
24,self_attn.v_proj,0.0000918311,0.05000,3.915
24,self_attn.q_proj,0.0003130213,0.05000,3.980
24,self_attn.k_proj,0.0000751774,0.05000,4.005
24,self_attn.o_proj,0.0000240284,0.05000,1.329
24,mlp.up_proj,0.0002207510,0.05000,1.803
24,mlp.gate_proj,0.0002575789,0.05000,1.812
24,mlp.down_proj,0.0000600394,0.05000,3.719
25,self_attn.q_proj,0.0002166719,0.05000,3.930
25,self_attn.v_proj,0.0000578186,0.05000,3.994
25,self_attn.k_proj,0.0000542144,0.05000,4.005
25,self_attn.o_proj,0.0000134359,0.05000,1.332
25,mlp.up_proj,0.0002558766,0.05000,1.811
25,mlp.gate_proj,0.0003033456,0.05000,1.834
25,mlp.down_proj,0.0000730246,0.05000,3.487
26,self_attn.q_proj,0.0003547980,0.05000,3.916
26,self_attn.k_proj,0.0000841941,0.05000,3.954
26,self_attn.v_proj,0.0000925788,0.05000,3.989
26,self_attn.o_proj,0.0000134945,0.05000,1.351
26,mlp.gate_proj,0.0003733178,0.05000,1.903
26,mlp.up_proj,0.0003256705,0.05000,1.927
26,mlp.down_proj,0.0000952209,0.05000,3.523
27,self_attn.q_proj,0.0004478611,0.05000,3.904
27,self_attn.v_proj,0.0001275532,0.05000,3.981
27,self_attn.k_proj,0.0001037366,0.05000,4.014
27,self_attn.o_proj,0.0000206886,0.05000,1.319
27,mlp.gate_proj,0.0004283897,0.05000,1.854
27,mlp.up_proj,0.0003877850,0.05000,1.870
27,mlp.down_proj,0.0001451184,0.05000,3.689
28,self_attn.k_proj,0.0001290215,0.05000,3.955
28,self_attn.v_proj,0.0001380381,0.05000,4.015
28,self_attn.q_proj,0.0005028249,0.05000,4.041
28,self_attn.o_proj,0.0000354018,0.05000,1.331
28,mlp.gate_proj,0.0004989572,0.05000,1.777
28,mlp.up_proj,0.0004736893,0.05000,1.800
28,mlp.down_proj,0.0002259568,0.05000,3.485
29,self_attn.q_proj,0.0012338733,0.05000,3.883
29,self_attn.k_proj,0.0002937443,0.05000,3.952
29,self_attn.v_proj,0.0003944995,0.05000,3.980
29,self_attn.o_proj,0.0000378399,0.05000,1.396
29,mlp.up_proj,0.0005982406,0.05000,1.797
29,mlp.gate_proj,0.0005981093,0.05000,1.801
29,mlp.down_proj,0.0002386291,0.05000,3.496
30,self_attn.v_proj,0.0004350560,0.05000,3.897
30,self_attn.q_proj,0.0014054731,0.05000,3.941
30,self_attn.k_proj,0.0003603588,0.05000,3.986
30,self_attn.o_proj,0.0000687038,0.05000,1.319
30,mlp.gate_proj,0.0006366458,0.05000,1.815
30,mlp.up_proj,0.0006604899,0.05000,1.813
30,mlp.down_proj,0.0003442335,0.05000,3.540
31,self_attn.k_proj,0.0005021534,0.05000,4.020
31,self_attn.q_proj,0.0018248984,0.05000,4.098
31,self_attn.v_proj,0.0006612717,0.05000,4.119
31,self_attn.o_proj,0.0000640828,0.05000,1.338
31,mlp.up_proj,0.0007156640,0.05000,1.771
31,mlp.gate_proj,0.0006541759,0.05000,1.792
31,mlp.down_proj,0.0004586547,0.05000,3.540
32,self_attn.q_proj,0.0027697828,0.05000,3.898
32,self_attn.k_proj,0.0006917736,0.05000,3.967
32,self_attn.v_proj,0.0010175645,0.05000,4.006
32,self_attn.o_proj,0.0001164538,0.05000,1.352
32,mlp.up_proj,0.0007774354,0.05000,1.754
32,mlp.gate_proj,0.0006933136,0.05000,1.779
32,mlp.down_proj,0.0005796508,0.05000,3.510
33,self_attn.q_proj,0.0060845944,0.05000,3.802
33,self_attn.k_proj,0.0012694908,0.05000,3.924
33,self_attn.v_proj,0.0023390502,0.05000,3.946
33,self_attn.o_proj,0.0001119355,0.05000,1.334
33,mlp.gate_proj,0.0007650941,0.05000,1.843
33,mlp.up_proj,0.0008669923,0.05000,1.857
33,mlp.down_proj,0.0007560028,0.05000,3.585
34,self_attn.v_proj,0.0016800856,0.05000,3.933
34,self_attn.q_proj,0.0047758973,0.05000,3.971
34,self_attn.k_proj,0.0010792233,0.05000,4.010
34,self_attn.o_proj,0.0002744614,0.05000,1.330
34,mlp.gate_proj,0.0009299143,0.05000,1.851
34,mlp.up_proj,0.0009779911,0.05000,1.870
34,mlp.down_proj,0.0009601268,0.05000,3.484
35,self_attn.q_proj,0.0022361877,0.05000,3.879
35,self_attn.k_proj,0.0005822161,0.05000,3.916
35,self_attn.v_proj,0.0007247474,0.05000,3.974
35,self_attn.o_proj,0.0003144698,0.05000,1.357
35,mlp.gate_proj,0.0015252715,0.05000,1.929
35,mlp.up_proj,0.0015549625,0.05000,1.927
35,mlp.down_proj,0.0016945056,0.05000,3.497