File size: 9,925 Bytes
e33a532
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
layer,module,loss,damp,time
0,self_attn.k_proj,0.36111963,0.01000,1.132
0,self_attn.v_proj,0.00330429,0.01000,0.942
0,self_attn.q_proj,0.52731681,0.01000,0.963
0,self_attn.o_proj,0.00026867,0.01000,0.983
0,mlp.up_proj,0.23463088,0.01000,0.968
0,mlp.gate_proj,0.28276342,0.01000,0.967
0,mlp.down_proj,0.00119561,0.01000,4.012
1,self_attn.k_proj,0.24816991,0.01000,0.951
1,self_attn.v_proj,0.00948147,0.01000,0.942
1,self_attn.q_proj,0.44486734,0.01000,0.962
1,self_attn.o_proj,0.00069429,0.01000,0.968
1,mlp.up_proj,0.44346130,0.01000,0.977
1,mlp.gate_proj,0.52371848,0.01000,0.978
1,mlp.down_proj,0.16304456,0.01000,4.006
2,self_attn.k_proj,1.27576137,0.01000,0.947
2,self_attn.v_proj,0.05388402,0.01000,0.972
2,self_attn.q_proj,1.91546702,0.01000,0.963
2,self_attn.o_proj,0.00095444,0.01000,0.962
2,mlp.up_proj,0.75267899,0.01000,0.978
2,mlp.gate_proj,0.93858600,0.01000,0.971
2,mlp.down_proj,0.00534942,0.01000,4.054
3,self_attn.k_proj,1.07618117,0.01000,0.951
3,self_attn.v_proj,0.09808896,0.01000,0.966
3,self_attn.q_proj,1.91644359,0.01000,0.963
3,self_attn.o_proj,0.00214759,0.01000,0.961
3,mlp.up_proj,1.06110489,0.01000,0.982
3,mlp.gate_proj,1.51582575,0.01000,0.989
3,mlp.down_proj,0.01012792,0.01000,3.993
4,self_attn.k_proj,1.03121889,0.01000,0.952
4,self_attn.v_proj,0.09737435,0.01000,0.943
4,self_attn.q_proj,1.78057146,0.01000,0.967
4,self_attn.o_proj,0.00524764,0.01000,0.964
4,mlp.up_proj,1.38912082,0.01000,0.981
4,mlp.gate_proj,2.25040221,0.01000,0.976
4,mlp.down_proj,0.01820908,0.01000,4.032
5,self_attn.k_proj,1.77245164,0.01000,0.949
5,self_attn.v_proj,0.10094162,0.01000,0.958
5,self_attn.q_proj,2.76073647,0.01000,0.963
5,self_attn.o_proj,0.00572381,0.01000,0.962
5,mlp.up_proj,1.76203442,0.01000,0.984
5,mlp.gate_proj,2.82282686,0.01000,0.978
5,mlp.down_proj,0.02650169,0.01000,4.003
6,self_attn.k_proj,1.46186721,0.01000,0.951
6,self_attn.v_proj,0.11557909,0.01000,0.950
6,self_attn.q_proj,2.57779884,0.01000,0.960
6,self_attn.o_proj,0.01030868,0.01000,0.965
6,mlp.up_proj,1.95960164,0.01000,0.987
6,mlp.gate_proj,3.18044949,0.01000,0.982
6,mlp.down_proj,0.03279492,0.01000,4.409
7,self_attn.k_proj,1.48253345,0.01000,0.948
7,self_attn.v_proj,0.12368202,0.01000,0.944
7,self_attn.q_proj,2.45336533,0.01000,0.955
7,self_attn.o_proj,0.01420613,0.01000,0.970
7,mlp.up_proj,2.13492918,0.01000,0.988
7,mlp.gate_proj,3.24488592,0.01000,0.983
7,mlp.down_proj,0.03850950,0.01000,4.023
8,self_attn.k_proj,1.93849897,0.01000,0.954
8,self_attn.v_proj,0.16590264,0.01000,0.950
8,self_attn.q_proj,3.13656378,0.01000,0.970
8,self_attn.o_proj,0.01967191,0.01000,0.958
8,mlp.up_proj,2.29845905,0.01000,0.982
8,mlp.gate_proj,3.54030752,0.01000,0.982
8,mlp.down_proj,0.04251836,0.01000,4.048
9,self_attn.k_proj,1.89687407,0.01000,0.955
9,self_attn.v_proj,0.23918010,0.01000,0.973
9,self_attn.q_proj,3.16648197,0.01000,0.965
9,self_attn.o_proj,0.02422045,0.01000,0.962
9,mlp.up_proj,2.43423367,0.01000,1.343
9,mlp.gate_proj,3.77251744,0.01000,0.981
9,mlp.down_proj,0.04667648,0.01000,4.252
10,self_attn.k_proj,2.30144119,0.01000,0.954
10,self_attn.v_proj,0.18498819,0.01000,0.965
10,self_attn.q_proj,3.73618531,0.01000,0.973
10,self_attn.o_proj,0.02161483,0.01000,0.963
10,mlp.up_proj,2.54761338,0.01000,0.989
10,mlp.gate_proj,3.68303084,0.01000,0.980
10,mlp.down_proj,0.04879866,0.01000,4.002
11,self_attn.k_proj,2.10925364,0.01000,0.953
11,self_attn.v_proj,0.19330561,0.01000,0.947
11,self_attn.q_proj,3.28746176,0.01000,0.961
11,self_attn.o_proj,0.02294213,0.01000,0.965
11,mlp.up_proj,2.67688942,0.01000,0.983
11,mlp.gate_proj,3.74871111,0.01000,0.980
11,mlp.down_proj,0.05176591,0.01000,4.099
12,self_attn.k_proj,1.64494085,0.01000,0.949
12,self_attn.v_proj,0.22913060,0.01000,0.956
12,self_attn.q_proj,2.86509371,0.01000,0.969
12,self_attn.o_proj,0.02996064,0.01000,0.961
12,mlp.up_proj,2.74297428,0.01000,0.989
12,mlp.gate_proj,3.63758588,0.01000,0.985
12,mlp.down_proj,0.05879739,0.01000,4.043
13,self_attn.k_proj,2.44561863,0.01000,0.956
13,self_attn.v_proj,0.25090086,0.01000,0.978
13,self_attn.q_proj,3.72013021,0.01000,0.972
13,self_attn.o_proj,0.03329192,0.01000,0.967
13,mlp.up_proj,2.89052248,0.01000,0.989
13,mlp.gate_proj,3.83109856,0.01000,1.001
13,mlp.down_proj,0.06681926,0.01000,4.075
14,self_attn.k_proj,2.59889841,0.01000,0.956
14,self_attn.v_proj,0.25943100,0.01000,0.980
14,self_attn.q_proj,3.71864319,0.01000,0.979
14,self_attn.o_proj,0.03607188,0.01000,0.963
14,mlp.up_proj,3.16311407,0.01000,0.986
14,mlp.gate_proj,4.43673038,0.01000,0.983
14,mlp.down_proj,0.08331311,0.01000,4.020
15,self_attn.k_proj,2.41041493,0.01000,0.961
15,self_attn.v_proj,0.32465303,0.01000,0.970
15,self_attn.q_proj,4.43637896,0.01000,0.982
15,self_attn.o_proj,0.04316147,0.01000,0.970
15,mlp.up_proj,3.33997822,0.01000,0.988
15,mlp.gate_proj,4.94344902,0.01000,1.021
15,mlp.down_proj,0.10118946,0.01000,4.714
16,self_attn.k_proj,2.50961113,0.01000,0.965
16,self_attn.v_proj,0.29429543,0.01000,0.957
16,self_attn.q_proj,4.07947636,0.01000,0.968
16,self_attn.o_proj,0.03333106,0.01000,0.975
16,mlp.up_proj,3.60199404,0.01000,0.984
16,mlp.gate_proj,5.63074589,0.01000,0.976
16,mlp.down_proj,0.11140943,0.01000,4.086
17,self_attn.k_proj,2.74082637,0.01000,0.961
17,self_attn.v_proj,0.32146555,0.01000,0.955
17,self_attn.q_proj,4.31714869,0.01000,0.977
17,self_attn.o_proj,0.03052786,0.01000,0.967
17,mlp.up_proj,3.74027133,0.01000,0.986
17,mlp.gate_proj,5.97789478,0.01000,0.992
17,mlp.down_proj,0.12818229,0.01000,4.005
18,self_attn.k_proj,3.02894711,0.01000,0.957
18,self_attn.v_proj,0.33139157,0.01000,0.962
18,self_attn.q_proj,4.38174438,0.01000,1.187
18,self_attn.o_proj,0.02073601,0.01000,0.973
18,mlp.up_proj,3.95718646,0.01000,1.081
18,mlp.gate_proj,6.38988972,0.01000,1.134
18,mlp.down_proj,0.12699364,0.01000,4.431
19,self_attn.k_proj,2.72588944,0.01000,1.079
19,self_attn.v_proj,0.36277997,0.01000,1.053
19,self_attn.q_proj,4.48861694,0.01000,1.078
19,self_attn.o_proj,0.01849649,0.01000,1.106
19,mlp.up_proj,4.11148834,0.01000,1.104
19,mlp.gate_proj,6.76255035,0.01000,1.077
19,mlp.down_proj,0.13344963,0.01000,4.397
20,self_attn.k_proj,2.99772930,0.01000,1.048
20,self_attn.v_proj,0.39009190,0.01000,1.045
20,self_attn.q_proj,4.62490082,0.01000,1.075
20,self_attn.o_proj,0.02120636,0.01000,1.091
20,mlp.up_proj,4.43619490,0.01000,1.133
20,mlp.gate_proj,7.22839403,0.01000,1.113
20,mlp.down_proj,0.14441478,0.01000,4.425
21,self_attn.k_proj,2.94480252,0.01000,1.066
21,self_attn.v_proj,0.42260897,0.01000,1.056
21,self_attn.q_proj,4.43837166,0.01000,1.074
21,self_attn.o_proj,0.02850885,0.01000,1.062
21,mlp.up_proj,4.73225355,0.01000,1.021
21,mlp.gate_proj,7.77117300,0.01000,1.070
21,mlp.down_proj,0.16843449,0.01000,5.555
22,self_attn.k_proj,3.09630203,0.01000,0.971
22,self_attn.v_proj,0.49371791,0.01000,1.004
22,self_attn.q_proj,4.48650932,0.01000,0.987
22,self_attn.o_proj,0.02654779,0.01000,0.978
22,mlp.up_proj,4.93645144,0.01000,1.015
22,mlp.gate_proj,8.03310680,0.01000,1.009
22,mlp.down_proj,0.17289530,0.01000,4.040
23,self_attn.k_proj,2.98398399,0.01000,0.954
23,self_attn.v_proj,0.53825200,0.01000,0.972
23,self_attn.q_proj,4.67381859,0.01000,0.961
23,self_attn.o_proj,0.02713704,0.01000,0.963
23,mlp.up_proj,5.21848965,0.01000,0.993
23,mlp.gate_proj,8.43232536,0.01000,0.997
23,mlp.down_proj,0.18386570,0.01000,4.056
24,self_attn.k_proj,2.98328638,0.01000,0.953
24,self_attn.v_proj,0.67641538,0.01000,0.944
24,self_attn.q_proj,4.71260357,0.01000,0.964
24,self_attn.o_proj,0.02995079,0.01000,0.968
24,mlp.up_proj,5.57473373,0.01000,0.982
24,mlp.gate_proj,9.01408386,0.01000,0.981
24,mlp.down_proj,0.19735718,0.01000,4.019
25,self_attn.k_proj,2.80995131,0.01000,0.971
25,self_attn.v_proj,0.70912492,0.01000,0.987
25,self_attn.q_proj,4.73544788,0.01000,0.968
25,self_attn.o_proj,0.03377030,0.01000,0.962
25,mlp.up_proj,5.95643902,0.01000,0.983
25,mlp.gate_proj,9.63203812,0.01000,0.981
25,mlp.down_proj,0.21878015,0.01000,4.016
26,self_attn.k_proj,2.99053884,0.01000,0.956
26,self_attn.v_proj,0.65835601,0.01000,0.969
26,self_attn.q_proj,4.58326244,0.01000,0.982
26,self_attn.o_proj,0.04630172,0.01000,0.966
26,mlp.up_proj,6.38272285,0.01000,0.983
26,mlp.gate_proj,10.33224392,0.01000,0.979
26,mlp.down_proj,0.24722236,0.01000,4.049
27,self_attn.k_proj,3.26289296,0.01000,0.950
27,self_attn.v_proj,0.95175558,0.01000,0.966
27,self_attn.q_proj,4.78752518,0.01000,0.960
27,self_attn.o_proj,0.06208333,0.01000,0.982
27,mlp.up_proj,7.02820301,0.01000,0.990
27,mlp.gate_proj,11.29987144,0.01000,0.986
27,mlp.down_proj,0.29721794,0.01000,4.009
28,self_attn.k_proj,2.59787798,0.01000,0.953
28,self_attn.v_proj,0.84426367,0.01000,0.946
28,self_attn.q_proj,4.46915436,0.01000,0.964
28,self_attn.o_proj,0.09729099,0.01000,0.970
28,mlp.up_proj,7.81499147,0.01000,0.996
28,mlp.gate_proj,11.99997711,0.01000,0.981
28,mlp.down_proj,0.38746351,0.01000,4.051
29,self_attn.k_proj,2.69152451,0.01000,0.954
29,self_attn.v_proj,1.02270174,0.01000,0.950
29,self_attn.q_proj,4.71809244,0.01000,0.973
29,self_attn.o_proj,0.08194697,0.01000,0.969
29,mlp.up_proj,8.35252285,0.01000,0.995
29,mlp.gate_proj,12.24577141,0.01000,1.003
29,mlp.down_proj,0.53259313,0.01000,4.059
30,self_attn.k_proj,2.70090246,0.01000,0.956
30,self_attn.v_proj,1.38668847,0.01000,1.731
30,self_attn.q_proj,4.37570143,0.01000,1.174
30,self_attn.o_proj,0.16421506,0.01000,0.969
30,mlp.up_proj,8.91942406,0.01000,0.990
30,mlp.gate_proj,13.37013245,0.01000,0.986
30,mlp.down_proj,0.85872936,0.01000,4.022
31,self_attn.k_proj,1.97329688,0.01000,0.959
31,self_attn.v_proj,0.84535497,0.01000,0.967
31,self_attn.q_proj,3.81004381,0.01000,1.001
31,self_attn.o_proj,0.26083553,0.01000,0.969
31,mlp.up_proj,8.20458317,0.01000,0.988
31,mlp.gate_proj,11.96145439,0.01000,0.987
31,mlp.down_proj,2.20310783,0.01000,4.006