File size: 9,297 Bytes
00b2f1e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
layer,module,loss,damp,time
0,self_attn.k_proj,0.00022096,0.01000,1.099
0,self_attn.v_proj,0.00000229,0.01000,2.435
0,self_attn.q_proj,0.00036210,0.01000,2.448
0,self_attn.o_proj,0.00000175,0.01000,2.415
0,mlp.up_proj,0.00150737,0.01000,1.416
0,mlp.gate_proj,0.00142441,0.01000,0.274
0,mlp.down_proj,0.00595958,0.01000,0.739
1,self_attn.k_proj,0.00078274,0.01000,0.286
1,self_attn.v_proj,0.00015115,0.01000,0.272
1,self_attn.q_proj,0.00174118,0.01000,0.162
1,self_attn.o_proj,0.00103411,0.01000,0.769
1,mlp.up_proj,0.00179594,0.01000,1.660
1,mlp.gate_proj,0.00228291,0.01000,0.973
1,mlp.down_proj,0.00224895,0.01000,0.746
2,self_attn.k_proj,0.00125878,0.01000,0.437
2,self_attn.v_proj,0.00020735,0.01000,0.269
2,self_attn.q_proj,0.00295782,0.01000,0.638
2,self_attn.o_proj,0.00098028,0.01000,0.810
2,mlp.up_proj,0.00240148,0.01000,0.318
2,mlp.gate_proj,0.00286920,0.01000,0.260
2,mlp.down_proj,0.00500130,0.01000,6.505
3,self_attn.k_proj,0.00188067,0.01000,1.197
3,self_attn.v_proj,0.00074529,0.01000,0.289
3,self_attn.q_proj,0.00454102,0.01000,0.292
3,self_attn.o_proj,0.00114469,0.01000,0.283
3,mlp.up_proj,0.00272536,0.01000,0.309
3,mlp.gate_proj,0.00309045,0.01000,0.279
3,mlp.down_proj,0.00337280,0.01000,0.736
4,self_attn.k_proj,0.00178011,0.01000,0.471
4,self_attn.v_proj,0.00069859,0.01000,0.149
4,self_attn.q_proj,0.00427734,0.01000,0.145
4,self_attn.o_proj,0.00194755,0.01000,1.499
4,mlp.up_proj,0.00357304,0.01000,0.308
4,mlp.gate_proj,0.00408032,0.01000,0.289
4,mlp.down_proj,0.00474062,0.01000,0.744
5,self_attn.k_proj,0.00194141,0.01000,0.269
5,self_attn.v_proj,0.00072606,0.01000,0.919
5,self_attn.q_proj,0.00453751,0.01000,1.476
5,self_attn.o_proj,0.00234540,0.01000,0.281
5,mlp.up_proj,0.00409303,0.01000,0.266
5,mlp.gate_proj,0.00449629,0.01000,0.596
5,mlp.down_proj,0.00556781,0.01000,6.516
6,self_attn.k_proj,0.00163071,0.01000,0.275
6,self_attn.v_proj,0.00068974,0.01000,0.287
6,self_attn.q_proj,0.00406556,0.01000,0.276
6,self_attn.o_proj,0.00182722,0.01000,0.284
6,mlp.up_proj,0.00438432,0.01000,0.273
6,mlp.gate_proj,0.00448065,0.01000,0.271
6,mlp.down_proj,0.00687783,0.01000,0.819
7,self_attn.k_proj,0.00229149,0.01000,0.366
7,self_attn.v_proj,0.00139370,0.01000,0.148
7,self_attn.q_proj,0.00637256,0.01000,0.142
7,self_attn.o_proj,0.00216803,0.01000,1.421
7,mlp.up_proj,0.00479016,0.01000,0.280
7,mlp.gate_proj,0.00473948,0.01000,0.287
7,mlp.down_proj,0.00823352,0.01000,0.831
8,self_attn.k_proj,0.00214538,0.01000,1.666
8,self_attn.v_proj,0.00103131,0.01000,1.952
8,self_attn.q_proj,0.00540090,0.01000,1.636
8,self_attn.o_proj,0.00283757,0.01000,0.303
8,mlp.up_proj,0.00546549,0.01000,0.274
8,mlp.gate_proj,0.00495393,0.01000,0.275
8,mlp.down_proj,0.01154038,0.01000,6.464
9,self_attn.k_proj,0.00147208,0.01000,1.818
9,self_attn.v_proj,0.00058141,0.01000,1.731
9,self_attn.q_proj,0.00394661,0.01000,1.675
9,self_attn.o_proj,0.00251221,0.01000,0.324
9,mlp.up_proj,0.00595842,0.01000,0.347
9,mlp.gate_proj,0.00489875,0.01000,0.343
9,mlp.down_proj,0.01428184,0.01000,0.904
10,self_attn.k_proj,0.00132155,0.01000,2.685
10,self_attn.v_proj,0.00068617,0.01000,2.503
10,self_attn.q_proj,0.00363028,0.01000,1.752
10,self_attn.o_proj,0.00545926,0.01000,0.408
10,mlp.up_proj,0.00611763,0.01000,1.632
10,mlp.gate_proj,0.00474317,0.01000,1.328
10,mlp.down_proj,0.01347071,0.01000,2.937
11,self_attn.k_proj,0.00115821,0.01000,3.339
11,self_attn.v_proj,0.00065106,0.01000,2.422
11,self_attn.q_proj,0.00344706,0.01000,2.382
11,self_attn.o_proj,0.00740811,0.01000,2.400
11,mlp.up_proj,0.00620620,0.01000,2.718
11,mlp.gate_proj,0.00449832,0.01000,2.710
11,mlp.down_proj,0.27257532,0.01000,5.754
12,self_attn.k_proj,0.00163961,0.01000,0.344
12,self_attn.v_proj,0.00094356,0.01000,0.337
12,self_attn.q_proj,0.00456318,0.01000,0.338
12,self_attn.o_proj,0.00419531,0.01000,1.311
12,mlp.up_proj,0.00565002,0.01000,0.279
12,mlp.gate_proj,0.00445975,0.01000,1.091
12,mlp.down_proj,0.01192240,0.01000,4.327
13,self_attn.k_proj,0.00174242,0.01000,0.339
13,self_attn.v_proj,0.00083272,0.01000,0.344
13,self_attn.q_proj,0.00502530,0.01000,0.395
13,self_attn.o_proj,0.00500150,0.01000,0.343
13,mlp.up_proj,0.00570113,0.01000,1.926
13,mlp.gate_proj,0.00524486,0.01000,1.750
13,mlp.down_proj,0.01178209,0.01000,2.821
14,self_attn.k_proj,0.00200629,0.01000,0.361
14,self_attn.v_proj,0.00157519,0.01000,0.359
14,self_attn.q_proj,0.00566488,0.01000,0.366
14,self_attn.o_proj,0.00620107,0.01000,2.248
14,mlp.up_proj,0.00577955,0.01000,4.655
14,mlp.gate_proj,0.00547774,0.01000,5.042
14,mlp.down_proj,0.01469438,0.01000,8.832
15,self_attn.k_proj,0.00194205,0.01000,0.349
15,self_attn.v_proj,0.00151308,0.01000,0.345
15,self_attn.q_proj,0.00563300,0.01000,0.342
15,self_attn.o_proj,0.00601548,0.01000,0.344
15,mlp.up_proj,0.00601284,0.01000,0.342
15,mlp.gate_proj,0.00594717,0.01000,0.336
15,mlp.down_proj,0.01753610,0.01000,5.689
16,self_attn.k_proj,0.00155090,0.01000,1.763
16,self_attn.v_proj,0.00110804,0.01000,0.365
16,self_attn.q_proj,0.00422240,0.01000,0.357
16,self_attn.o_proj,0.00903260,0.01000,0.345
16,mlp.up_proj,0.00553630,0.01000,1.181
16,mlp.gate_proj,0.00532908,0.01000,1.499
16,mlp.down_proj,0.01532181,0.01000,5.315
17,self_attn.k_proj,0.00241632,0.01000,0.830
17,self_attn.v_proj,0.00194845,0.01000,2.641
17,self_attn.q_proj,0.00834111,0.01000,4.413
17,self_attn.o_proj,0.01061929,0.01000,2.746
17,mlp.up_proj,0.00562216,0.01000,2.742
17,mlp.gate_proj,0.00506327,0.01000,1.101
17,mlp.down_proj,0.01818097,0.01000,4.789
18,self_attn.k_proj,0.00273163,0.01000,2.613
18,self_attn.v_proj,0.00311299,0.01000,1.891
18,self_attn.q_proj,0.00828936,0.01000,0.344
18,self_attn.o_proj,0.00938506,0.01000,0.345
18,mlp.up_proj,0.00625932,0.01000,0.344
18,mlp.gate_proj,0.00583430,0.01000,0.339
18,mlp.down_proj,0.03318551,0.01000,2.234
19,self_attn.k_proj,0.00133622,0.01000,0.326
19,self_attn.v_proj,0.00225405,0.01000,0.800
19,self_attn.q_proj,0.00550781,0.01000,1.800
19,self_attn.o_proj,0.01567704,0.01000,0.449
19,mlp.up_proj,0.00725614,0.01000,2.903
19,mlp.gate_proj,0.00687203,0.01000,2.471
19,mlp.down_proj,0.03395692,0.01000,2.946
20,self_attn.k_proj,0.00182818,0.01000,0.388
20,self_attn.v_proj,0.00369986,0.01000,1.045
20,self_attn.q_proj,0.00668970,0.01000,3.772
20,self_attn.o_proj,0.01447436,0.01000,3.580
20,mlp.up_proj,0.00868652,0.01000,2.710
20,mlp.gate_proj,0.00763109,0.01000,1.037
20,mlp.down_proj,0.06614500,0.01000,3.153
21,self_attn.k_proj,0.00169165,0.01000,0.353
21,self_attn.v_proj,0.00278996,0.01000,1.556
21,self_attn.q_proj,0.00603606,0.01000,2.608
21,self_attn.o_proj,0.01160419,0.01000,2.633
21,mlp.up_proj,0.00941546,0.01000,2.761
21,mlp.gate_proj,0.00857336,0.01000,1.637
21,mlp.down_proj,0.05236044,0.01000,3.023
22,self_attn.k_proj,0.00173458,0.01000,0.340
22,self_attn.v_proj,0.00304587,0.01000,0.335
22,self_attn.q_proj,0.00609978,0.01000,1.500
22,self_attn.o_proj,0.01699413,0.01000,0.329
22,mlp.up_proj,0.01043702,0.01000,3.157
22,mlp.gate_proj,0.00901166,0.01000,2.403
22,mlp.down_proj,0.08635419,0.01000,2.277
23,self_attn.k_proj,0.00235798,0.01000,2.724
23,self_attn.v_proj,0.00853371,0.01000,2.700
23,self_attn.q_proj,0.00731025,0.01000,2.679
23,self_attn.o_proj,0.04595792,0.01000,0.347
23,mlp.up_proj,0.01267573,0.01000,1.922
23,mlp.gate_proj,0.00977481,0.01000,1.572
23,mlp.down_proj,0.09878369,0.01000,1.992
24,self_attn.k_proj,0.00193833,0.01000,0.352
24,self_attn.v_proj,0.00926276,0.01000,0.343
24,self_attn.q_proj,0.00732911,0.01000,0.354
24,self_attn.o_proj,0.02490180,0.01000,0.294
24,mlp.up_proj,0.01275103,0.01000,3.643
24,mlp.gate_proj,0.00968059,0.01000,4.339
24,mlp.down_proj,0.13135986,0.01000,6.748
25,self_attn.k_proj,0.00188807,0.01000,1.592
25,self_attn.v_proj,0.00410724,0.01000,1.087
25,self_attn.q_proj,0.00648702,0.01000,0.338
25,self_attn.o_proj,0.01829978,0.01000,1.828
25,mlp.up_proj,0.01323432,0.01000,0.353
25,mlp.gate_proj,0.01043347,0.01000,0.343
25,mlp.down_proj,0.10982227,0.01000,6.597
26,self_attn.k_proj,0.00186195,0.01000,3.885
26,self_attn.v_proj,0.00593649,0.01000,2.686
26,self_attn.q_proj,0.00663982,0.01000,0.818
26,self_attn.o_proj,0.02385299,0.01000,0.346
26,mlp.up_proj,0.01519259,0.01000,0.357
26,mlp.gate_proj,0.01179895,0.01000,0.383
26,mlp.down_proj,0.16240232,0.01000,2.805
27,self_attn.k_proj,0.00188216,0.01000,0.753
27,self_attn.v_proj,0.00480582,0.01000,2.568
27,self_attn.q_proj,0.00687713,0.01000,3.243
27,self_attn.o_proj,0.03130198,0.01000,1.944
27,mlp.up_proj,0.01527163,0.01000,0.361
27,mlp.gate_proj,0.01144433,0.01000,0.350
27,mlp.down_proj,0.20937583,0.01000,6.981
28,self_attn.k_proj,0.00163398,0.01000,2.274
28,self_attn.v_proj,0.00619308,0.01000,0.347
28,self_attn.q_proj,0.00561940,0.01000,1.200
28,self_attn.o_proj,0.02704479,0.01000,0.391
28,mlp.up_proj,0.01647252,0.01000,0.362
28,mlp.gate_proj,0.01167521,0.01000,0.348
28,mlp.down_proj,3.19434714,0.01000,7.166
29,self_attn.k_proj,0.00153822,0.01000,1.574
29,self_attn.v_proj,0.00717453,0.01000,0.978
29,self_attn.q_proj,0.00649254,0.01000,1.795
29,self_attn.o_proj,0.06275121,0.01000,0.949
29,mlp.up_proj,0.02440672,0.01000,2.122
29,mlp.gate_proj,0.01807862,0.01000,0.632
29,mlp.down_proj,0.86159390,0.01000,0.909