File size: 11,328 Bytes
3ed573b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00093500,0.01000,1.534
0,self_attn.v_proj,0.00075287,0.01000,1.058
0,self_attn.q_proj,0.00301158,0.01000,0.966
0,self_attn.o_proj,0.01636044,0.01000,1.097
0,mlp.up_proj,0.55349815,0.01000,1.074
0,mlp.gate_proj,0.63002926,0.01000,0.989
0,mlp.down_proj,0.18759912,0.01000,3.718
1,self_attn.k_proj,0.00388462,0.01000,1.037
1,self_attn.v_proj,0.00418270,0.01000,1.124
1,self_attn.q_proj,0.01329488,0.01000,1.123
1,self_attn.o_proj,0.02369094,0.01000,1.134
1,mlp.up_proj,5.06094027,0.01000,1.068
1,mlp.gate_proj,12.48626137,0.01000,0.973
1,mlp.down_proj,0.21249261,0.01000,3.772
2,self_attn.k_proj,0.00920746,0.01000,1.026
2,self_attn.v_proj,0.00892699,0.01000,0.995
2,self_attn.q_proj,0.03115090,0.01000,0.972
2,self_attn.o_proj,0.01967876,0.01000,1.049
2,mlp.up_proj,18.21238136,0.01000,1.142
2,mlp.gate_proj,23.30099678,0.01000,1.107
2,mlp.down_proj,0.15935239,0.01000,3.670
3,self_attn.k_proj,0.01730567,0.01000,1.145
3,self_attn.v_proj,0.01813262,0.01000,1.010
3,self_attn.q_proj,0.06220551,0.01000,1.113
3,self_attn.o_proj,0.03520732,0.01000,1.112
3,mlp.up_proj,11.37148094,0.01000,1.075
3,mlp.gate_proj,24.17206383,0.01000,1.038
3,mlp.down_proj,0.37454456,0.01000,3.873
4,self_attn.k_proj,0.03873355,0.01000,1.127
4,self_attn.v_proj,0.04026245,0.01000,1.068
4,self_attn.q_proj,0.13652131,0.01000,1.121
4,self_attn.o_proj,0.05750610,0.01000,1.179
4,mlp.up_proj,11.50895309,0.01000,1.067
4,mlp.gate_proj,29.62431717,0.01000,1.020
4,mlp.down_proj,0.79113972,0.01000,3.775
5,self_attn.k_proj,0.03782712,0.01000,1.035
5,self_attn.v_proj,0.04062828,0.01000,1.005
5,self_attn.q_proj,0.13939869,0.01000,0.988
5,self_attn.o_proj,0.08601132,0.01000,1.120
5,mlp.up_proj,7.35449219,0.01000,1.113
5,mlp.gate_proj,15.71476841,0.01000,0.987
5,mlp.down_proj,1.26612008,0.01000,3.658
6,self_attn.k_proj,0.07410677,0.01000,1.083
6,self_attn.v_proj,0.08444937,0.01000,1.035
6,self_attn.q_proj,0.29530990,0.01000,1.046
6,self_attn.o_proj,0.24855541,0.01000,1.035
6,mlp.up_proj,12.12503052,0.01000,1.186
6,mlp.gate_proj,24.27440262,0.01000,1.014
6,mlp.down_proj,59.69503403,0.01000,3.886
7,self_attn.k_proj,0.18620780,0.01000,1.172
7,self_attn.v_proj,0.19225197,0.01000,1.037
7,self_attn.q_proj,0.66303122,0.01000,0.981
7,self_attn.o_proj,0.22942577,0.01000,1.053
7,mlp.up_proj,12.31387806,0.01000,1.202
7,mlp.gate_proj,21.64307404,0.01000,1.131
7,mlp.down_proj,2.05965924,0.01000,3.897
8,self_attn.k_proj,0.31598431,0.01000,1.144
8,self_attn.v_proj,0.34093946,0.01000,1.188
8,self_attn.q_proj,1.14995360,0.01000,1.148
8,self_attn.o_proj,0.35936299,0.01000,1.137
8,mlp.up_proj,12.45734978,0.01000,1.095
8,mlp.gate_proj,14.27222443,0.01000,1.059
8,mlp.down_proj,3.87224698,0.01000,3.592
9,self_attn.k_proj,0.42755005,0.01000,1.060
9,self_attn.v_proj,0.43955854,0.01000,0.980
9,self_attn.q_proj,1.51034832,0.01000,0.993
9,self_attn.o_proj,0.53357273,0.01000,1.063
9,mlp.up_proj,17.22698212,0.01000,1.102
9,mlp.gate_proj,23.49119186,0.01000,1.075
9,mlp.down_proj,5.00397158,0.01000,3.603
10,self_attn.k_proj,0.90024441,0.01000,1.063
10,self_attn.v_proj,1.01532078,0.01000,0.989
10,self_attn.q_proj,3.25746417,0.01000,0.973
10,self_attn.o_proj,0.74504685,0.01000,1.033
10,mlp.up_proj,18.57254982,0.01000,1.187
10,mlp.gate_proj,23.94193268,0.01000,1.042
10,mlp.down_proj,5.72752857,0.01000,3.799
11,self_attn.k_proj,0.46532309,0.01000,1.186
11,self_attn.v_proj,0.49314433,0.01000,1.097
11,self_attn.q_proj,1.61019170,0.01000,1.068
11,self_attn.o_proj,0.63873482,0.01000,1.066
11,mlp.up_proj,19.01406097,0.01000,1.049
11,mlp.gate_proj,22.41117859,0.01000,1.093
11,mlp.down_proj,5.03123236,0.01000,3.816
12,self_attn.k_proj,0.53598475,0.01000,1.056
12,self_attn.v_proj,0.58172190,0.01000,0.974
12,self_attn.q_proj,1.87110019,0.01000,1.103
12,self_attn.o_proj,0.86515743,0.01000,1.163
12,mlp.up_proj,19.76538849,0.01000,1.060
12,mlp.gate_proj,21.69308472,0.01000,0.996
12,mlp.down_proj,4.94389725,0.01000,3.518
13,self_attn.k_proj,0.41922653,0.01000,1.072
13,self_attn.v_proj,0.41501531,0.01000,0.966
13,self_attn.q_proj,1.54299450,0.01000,1.014
13,self_attn.o_proj,0.64388251,0.01000,1.041
13,mlp.up_proj,19.62747574,0.01000,1.152
13,mlp.gate_proj,19.93264961,0.01000,1.026
13,mlp.down_proj,5.23524094,0.01000,3.653
14,self_attn.k_proj,0.69069356,0.01000,1.158
14,self_attn.v_proj,0.72211957,0.01000,1.076
14,self_attn.q_proj,2.52726769,0.01000,0.986
14,self_attn.o_proj,1.15350628,0.01000,1.025
14,mlp.up_proj,19.14536667,0.01000,1.055
14,mlp.gate_proj,19.30226707,0.01000,1.131
14,mlp.down_proj,4.67902088,0.01000,3.912
15,self_attn.k_proj,0.73228085,0.01000,1.084
15,self_attn.v_proj,0.70357966,0.01000,1.095
15,self_attn.q_proj,2.62229300,0.01000,1.147
15,self_attn.o_proj,1.01154995,0.01000,1.058
15,mlp.up_proj,18.30879593,0.01000,1.072
15,mlp.gate_proj,17.72216034,0.01000,0.982
15,mlp.down_proj,5.20527649,0.01000,3.729
16,self_attn.k_proj,1.26578164,0.01000,1.050
16,self_attn.v_proj,1.44486320,0.01000,0.955
16,self_attn.q_proj,4.88816977,0.01000,1.048
16,self_attn.o_proj,1.40934920,0.01000,1.159
16,mlp.up_proj,20.92573166,0.01000,1.061
16,mlp.gate_proj,21.00225067,0.01000,0.998
16,mlp.down_proj,12.26511765,0.01000,3.586
17,self_attn.k_proj,1.20173907,0.01000,1.172
17,self_attn.v_proj,1.35401189,0.01000,1.089
17,self_attn.q_proj,4.90240002,0.01000,1.130
17,self_attn.o_proj,1.96535897,0.01000,1.158
17,mlp.up_proj,20.21404648,0.01000,1.085
17,mlp.gate_proj,19.69080925,0.01000,0.977
17,mlp.down_proj,8.91361427,0.01000,3.612
18,self_attn.k_proj,1.35796165,0.01000,1.066
18,self_attn.v_proj,1.48053002,0.01000,0.970
18,self_attn.q_proj,5.17301416,0.01000,1.029
18,self_attn.o_proj,1.48301518,0.01000,1.033
18,mlp.up_proj,22.05006790,0.01000,1.070
18,mlp.gate_proj,21.51061440,0.01000,1.045
18,mlp.down_proj,7.47183609,0.01000,3.574
19,self_attn.k_proj,2.67927146,0.01000,1.050
19,self_attn.v_proj,2.84377718,0.01000,0.990
19,self_attn.q_proj,10.55477047,0.01000,1.005
19,self_attn.o_proj,2.78883767,0.01000,1.057
19,mlp.up_proj,25.99320602,0.01000,1.182
19,mlp.gate_proj,25.00505829,0.01000,1.060
19,mlp.down_proj,9.58252621,0.01000,3.734
20,self_attn.k_proj,2.25592470,0.01000,1.186
20,self_attn.v_proj,2.64512777,0.01000,1.087
20,self_attn.q_proj,9.77148819,0.01000,0.975
20,self_attn.o_proj,2.61370730,0.01000,1.056
20,mlp.up_proj,28.45001221,0.01000,1.048
20,mlp.gate_proj,26.85064888,0.01000,1.100
20,mlp.down_proj,10.31070518,0.01000,3.764
21,self_attn.k_proj,3.03140640,0.01000,1.053
21,self_attn.v_proj,3.70216203,0.01000,1.002
21,self_attn.q_proj,12.58547688,0.01000,0.986
21,self_attn.o_proj,2.81117725,0.01000,1.165
21,mlp.up_proj,32.83880615,0.01000,1.052
21,mlp.gate_proj,30.72813225,0.01000,0.987
21,mlp.down_proj,14.17037201,0.01000,3.583
22,self_attn.k_proj,6.70605469,0.01000,1.070
22,self_attn.v_proj,7.37399912,0.01000,0.973
22,self_attn.q_proj,26.31335831,0.01000,1.006
22,self_attn.o_proj,5.94558525,0.01000,1.058
22,mlp.up_proj,38.05461502,0.01000,1.204
22,mlp.gate_proj,35.98967361,0.01000,1.021
22,mlp.down_proj,23.43338966,0.01000,3.696
23,self_attn.k_proj,6.65718555,0.01000,1.167
23,self_attn.v_proj,8.32367611,0.01000,1.091
23,self_attn.q_proj,27.57974243,0.01000,0.993
23,self_attn.o_proj,9.29317760,0.01000,1.056
23,mlp.up_proj,43.67939758,0.01000,1.085
23,mlp.gate_proj,42.31611633,0.01000,1.128
23,mlp.down_proj,31.69913673,0.01000,3.802
24,self_attn.k_proj,11.80602646,0.01000,1.067
24,self_attn.v_proj,15.26894760,0.01000,1.076
24,self_attn.q_proj,48.94207001,0.01000,1.119
24,self_attn.o_proj,14.16162300,0.01000,1.110
24,mlp.up_proj,47.95410156,0.01000,1.113
24,mlp.gate_proj,46.95746231,0.01000,0.999
24,mlp.down_proj,37.59236908,0.01000,3.698
25,self_attn.k_proj,9.39568329,0.01000,1.065
25,self_attn.v_proj,11.52959633,0.01000,0.981
25,self_attn.q_proj,37.55451965,0.01000,1.061
25,self_attn.o_proj,6.60415459,0.01000,1.156
25,mlp.up_proj,53.72169495,0.01000,1.061
25,mlp.gate_proj,53.26170349,0.01000,1.014
25,mlp.down_proj,49.13291931,0.01000,3.564
26,self_attn.k_proj,15.07968521,0.01000,1.042
26,self_attn.v_proj,18.87903214,0.01000,1.023
26,self_attn.q_proj,61.75351334,0.01000,0.987
26,self_attn.o_proj,8.19011021,0.01000,1.035
26,mlp.up_proj,63.40507126,0.01000,1.162
26,mlp.gate_proj,61.87738037,0.01000,0.968
26,mlp.down_proj,55.10468674,0.01000,3.617
27,self_attn.k_proj,16.51064682,0.01000,1.152
27,self_attn.v_proj,22.46823502,0.01000,0.951
27,self_attn.q_proj,69.66435242,0.01000,1.014
27,self_attn.o_proj,9.08815002,0.01000,1.053
27,mlp.up_proj,70.57014465,0.01000,1.231
27,mlp.gate_proj,67.74318695,0.01000,1.085
27,mlp.down_proj,74.30647278,0.01000,3.742
28,self_attn.k_proj,19.06116486,0.01000,1.185
28,self_attn.v_proj,22.31396866,0.01000,1.009
28,self_attn.q_proj,73.59075928,0.01000,1.058
28,self_attn.o_proj,15.23631573,0.01000,1.049
28,mlp.up_proj,81.82687378,0.01000,1.201
28,mlp.gate_proj,76.54244995,0.01000,1.133
28,mlp.down_proj,100.95344543,0.01000,3.875
29,self_attn.k_proj,42.74740601,0.01000,1.176
29,self_attn.v_proj,62.09001541,0.01000,1.087
29,self_attn.q_proj,169.90083313,0.01000,1.098
29,self_attn.o_proj,19.69995117,0.01000,1.015
29,mlp.up_proj,94.24476624,0.01000,1.089
29,mlp.gate_proj,85.47050476,0.01000,0.995
29,mlp.down_proj,111.90260315,0.01000,3.936
30,self_attn.k_proj,48.42563629,0.01000,1.164
30,self_attn.v_proj,63.64318848,0.01000,1.086
30,self_attn.q_proj,186.39895630,0.01000,1.069
30,self_attn.o_proj,28.51611710,0.01000,1.014
30,mlp.up_proj,99.81655884,0.01000,1.058
30,mlp.gate_proj,88.40076447,0.01000,0.987
30,mlp.down_proj,144.04133606,0.01000,3.710
31,self_attn.k_proj,67.51919556,0.01000,1.048
31,self_attn.v_proj,93.95922852,0.01000,0.948
31,self_attn.q_proj,243.45693970,0.01000,1.109
31,self_attn.o_proj,38.91883850,0.01000,1.155
31,mlp.up_proj,105.36692047,0.01000,1.053
31,mlp.gate_proj,90.30496979,0.01000,1.033
31,mlp.down_proj,174.71215820,0.01000,3.657
32,self_attn.k_proj,90.68847656,0.01000,1.075
32,self_attn.v_proj,136.25199890,0.01000,0.984
32,self_attn.q_proj,349.72949219,0.01000,1.022
32,self_attn.o_proj,42.40522003,0.01000,1.082
32,mlp.up_proj,112.39004517,0.01000,1.057
32,mlp.gate_proj,94.23210907,0.01000,1.021
32,mlp.down_proj,209.10299683,0.01000,3.541
33,self_attn.k_proj,160.63726807,0.01000,1.170
33,self_attn.v_proj,312.46691895,0.01000,1.057
33,self_attn.q_proj,723.88800049,0.01000,1.030
33,self_attn.o_proj,101.37340546,0.01000,1.064
33,mlp.up_proj,123.91452026,0.01000,1.132
33,mlp.gate_proj,102.19406128,0.01000,1.138
33,mlp.down_proj,272.35577393,0.01000,3.912
34,self_attn.k_proj,137.95373535,0.01000,1.092
34,self_attn.v_proj,218.98117065,0.01000,1.085
34,self_attn.q_proj,585.34942627,0.01000,1.113
34,self_attn.o_proj,121.98693085,0.01000,1.006
34,mlp.up_proj,144.67446899,0.01000,1.042
34,mlp.gate_proj,125.80036163,0.01000,1.068
34,mlp.down_proj,392.88323975,0.01000,3.726
35,self_attn.k_proj,63.21575165,0.01000,1.095
35,self_attn.v_proj,82.64318848,0.01000,0.952
35,self_attn.q_proj,236.55862427,0.01000,1.097
35,self_attn.o_proj,66.26197815,0.01000,1.150
35,mlp.up_proj,196.64938354,0.01000,1.047
35,mlp.gate_proj,170.04873657,0.01000,1.024
35,mlp.down_proj,2814.77734375,0.01000,3.573