File size: 9,067 Bytes
c5c0a20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
layer,module,loss,damp,time
0,self_attn.q_proj,0.0000044066,0.01000,0.476
0,self_attn.k_proj,0.0000019805,0.01000,0.236
0,self_attn.v_proj,0.0000015923,0.01000,0.235
0,self_attn.o_proj,0.0000012302,0.01000,0.467
0,mlp.gate_proj,0.0000475180,0.01000,0.230
0,mlp.up_proj,0.0000243452,0.01000,0.230
0,mlp.down_proj,0.0000015617,0.01000,0.697
1,self_attn.q_proj,0.0000019853,0.01000,0.342
1,self_attn.k_proj,0.0000008835,0.01000,0.291
1,self_attn.v_proj,0.0000008538,0.01000,0.266
1,self_attn.o_proj,0.0000003472,0.01000,0.471
1,mlp.gate_proj,0.0002938726,0.01000,0.234
1,mlp.up_proj,0.0000850689,0.01000,0.233
1,mlp.down_proj,0.0000021194,0.01000,0.699
2,self_attn.q_proj,0.0000038910,0.01000,0.279
2,self_attn.k_proj,0.0000016648,0.01000,0.231
2,self_attn.v_proj,0.0000016415,0.01000,0.231
2,self_attn.o_proj,0.0000005526,0.01000,0.462
2,mlp.gate_proj,0.0001997803,0.01000,0.232
2,mlp.up_proj,0.0000713199,0.01000,0.235
2,mlp.down_proj,0.0008174617,0.01000,0.696
3,self_attn.q_proj,0.0000274823,0.01000,0.270
3,self_attn.k_proj,0.0000134228,0.01000,0.237
3,self_attn.v_proj,0.0000133831,0.01000,0.237
3,self_attn.o_proj,0.0000007627,0.01000,0.471
3,mlp.gate_proj,0.0002638667,0.01000,0.251
3,mlp.up_proj,0.0001012415,0.01000,0.252
3,mlp.down_proj,0.0000053550,0.01000,0.701
4,self_attn.q_proj,0.0000261886,0.01000,0.255
4,self_attn.k_proj,0.0000123612,0.01000,0.229
4,self_attn.v_proj,0.0000132321,0.01000,0.230
4,self_attn.o_proj,0.0000017564,0.01000,0.463
4,mlp.gate_proj,0.0002446483,0.01000,0.234
4,mlp.up_proj,0.0001072414,0.01000,0.233
4,mlp.down_proj,0.0000070149,0.01000,0.696
5,self_attn.q_proj,0.0000465366,0.01000,0.254
5,self_attn.k_proj,0.0000193318,0.01000,0.231
5,self_attn.v_proj,0.0000204175,0.01000,0.231
5,self_attn.o_proj,0.0000022898,0.01000,0.462
5,mlp.gate_proj,0.0001662723,0.01000,0.231
5,mlp.up_proj,0.0000992902,0.01000,0.231
5,mlp.down_proj,0.0000078411,0.01000,0.695
6,self_attn.q_proj,0.0000313367,0.01000,0.256
6,self_attn.k_proj,0.0000139953,0.01000,0.229
6,self_attn.v_proj,0.0000134137,0.01000,0.230
6,self_attn.o_proj,0.0000019070,0.01000,0.462
6,mlp.gate_proj,0.0001977648,0.01000,0.229
6,mlp.up_proj,0.0001242954,0.01000,0.229
6,mlp.down_proj,0.0000100923,0.01000,0.691
7,self_attn.q_proj,0.0000582700,0.01000,0.255
7,self_attn.k_proj,0.0000240924,0.01000,0.229
7,self_attn.v_proj,0.0000268970,0.01000,0.229
7,self_attn.o_proj,0.0000028745,0.01000,0.460
7,mlp.gate_proj,0.0002205437,0.01000,0.231
7,mlp.up_proj,0.0001362631,0.01000,0.230
7,mlp.down_proj,0.0000117519,0.01000,0.694
8,self_attn.q_proj,0.0000694278,0.01000,0.255
8,self_attn.k_proj,0.0000311668,0.01000,0.227
8,self_attn.v_proj,0.0000296902,0.01000,0.229
8,self_attn.o_proj,0.0000033860,0.01000,0.460
8,mlp.gate_proj,0.0002141479,0.01000,0.230
8,mlp.up_proj,0.0001383425,0.01000,0.230
8,mlp.down_proj,0.0000117612,0.01000,0.693
9,self_attn.q_proj,0.0001289912,0.01000,0.253
9,self_attn.k_proj,0.0000529027,0.01000,0.228
9,self_attn.v_proj,0.0000542715,0.01000,0.226
9,self_attn.o_proj,0.0000050044,0.01000,0.459
9,mlp.gate_proj,0.0002396212,0.01000,0.231
9,mlp.up_proj,0.0001509409,0.01000,0.230
9,mlp.down_proj,0.0000166260,0.01000,0.687
10,self_attn.q_proj,0.0001100987,0.01000,0.253
10,self_attn.k_proj,0.0000461426,0.01000,0.226
10,self_attn.v_proj,0.0000473932,0.01000,0.226
10,self_attn.o_proj,0.0000052176,0.01000,0.462
10,mlp.gate_proj,0.0002404488,0.01000,0.229
10,mlp.up_proj,0.0001511854,0.01000,0.228
10,mlp.down_proj,0.0000251323,0.01000,0.700
11,self_attn.q_proj,0.0002361989,0.01000,0.231
11,self_attn.k_proj,0.0000922243,0.01000,0.227
11,self_attn.v_proj,0.0000842471,0.01000,0.227
11,self_attn.o_proj,0.0000151694,0.01000,0.459
11,mlp.gate_proj,0.0001903001,0.01000,0.229
11,mlp.up_proj,0.0001477866,0.01000,0.229
11,mlp.down_proj,0.0000251768,0.01000,0.694
12,self_attn.q_proj,0.0002058949,0.01000,0.256
12,self_attn.k_proj,0.0000757297,0.01000,0.230
12,self_attn.v_proj,0.0000796396,0.01000,0.228
12,self_attn.o_proj,0.0000055696,0.01000,0.460
12,mlp.gate_proj,0.0001705175,0.01000,0.231
12,mlp.up_proj,0.0001429938,0.01000,0.229
12,mlp.down_proj,0.0000244117,0.01000,0.694
13,self_attn.q_proj,0.0002131272,0.01000,0.254
13,self_attn.k_proj,0.0000752313,0.01000,0.228
13,self_attn.v_proj,0.0000870234,0.01000,0.226
13,self_attn.o_proj,0.0000073983,0.01000,0.458
13,mlp.gate_proj,0.0001896553,0.01000,0.227
13,mlp.up_proj,0.0001563918,0.01000,0.229
13,mlp.down_proj,0.0000264410,0.01000,0.687
14,self_attn.q_proj,0.0002928032,0.01000,0.256
14,self_attn.k_proj,0.0001088351,0.01000,0.229
14,self_attn.v_proj,0.0001156139,0.01000,0.228
14,self_attn.o_proj,0.0000082547,0.01000,0.462
14,mlp.gate_proj,0.0002012217,0.01000,0.227
14,mlp.up_proj,0.0001681767,0.01000,0.227
14,mlp.down_proj,0.0000352519,0.01000,0.690
15,self_attn.q_proj,0.0005602758,0.01000,0.232
15,self_attn.k_proj,0.0001800764,0.01000,0.229
15,self_attn.v_proj,0.0002261114,0.01000,0.229
15,self_attn.o_proj,0.0000099340,0.01000,0.461
15,mlp.gate_proj,0.0002238231,0.01000,0.230
15,mlp.up_proj,0.0001888835,0.01000,0.234
15,mlp.down_proj,0.0000422985,0.01000,0.696
16,self_attn.q_proj,0.0007166465,0.01000,0.240
16,self_attn.k_proj,0.0002515462,0.01000,0.238
16,self_attn.v_proj,0.0002401675,0.01000,0.228
16,self_attn.o_proj,0.0000150204,0.01000,0.461
16,mlp.gate_proj,0.0002338325,0.01000,0.231
16,mlp.up_proj,0.0002137495,0.01000,0.227
16,mlp.down_proj,0.0000872017,0.01000,0.693
17,self_attn.q_proj,0.0016075134,0.01000,0.242
17,self_attn.k_proj,0.0005267631,0.01000,0.229
17,self_attn.v_proj,0.0006408359,0.01000,0.230
17,self_attn.o_proj,0.0000315791,0.01000,0.464
17,mlp.gate_proj,0.0003384420,0.01000,0.229
17,mlp.up_proj,0.0003089405,0.01000,0.232
17,mlp.down_proj,0.0001076587,0.01000,0.700
18,self_attn.q_proj,0.0015861574,0.01000,0.254
18,self_attn.k_proj,0.0005132939,0.01000,0.228
18,self_attn.v_proj,0.0006109758,0.01000,0.228
18,self_attn.o_proj,0.0000254093,0.01000,0.461
18,mlp.gate_proj,0.0004072874,0.01000,0.228
18,mlp.up_proj,0.0003803636,0.01000,0.227
18,mlp.down_proj,0.0001712097,0.01000,0.690
19,self_attn.q_proj,0.0027800560,0.01000,0.252
19,self_attn.k_proj,0.0008529581,0.01000,0.226
19,self_attn.v_proj,0.0010568366,0.01000,0.226
19,self_attn.o_proj,0.0000415092,0.01000,0.457
19,mlp.gate_proj,0.0004365114,0.01000,0.227
19,mlp.up_proj,0.0004723935,0.01000,0.226
19,mlp.down_proj,0.0003228430,0.01000,0.693
20,self_attn.q_proj,0.0036227780,0.01000,0.254
20,self_attn.k_proj,0.0012287319,0.01000,0.228
20,self_attn.v_proj,0.0015251022,0.01000,0.226
20,self_attn.o_proj,0.0000489605,0.01000,0.462
20,mlp.gate_proj,0.0004963362,0.01000,0.228
20,mlp.up_proj,0.0005648018,0.01000,0.225
20,mlp.down_proj,0.0004068310,0.01000,0.702
21,self_attn.q_proj,0.0065157214,0.01000,0.239
21,self_attn.k_proj,0.0021859053,0.01000,0.226
21,self_attn.v_proj,0.0027217032,0.01000,0.226
21,self_attn.o_proj,0.0000782762,0.01000,0.462
21,mlp.gate_proj,0.0005434924,0.01000,0.227
21,mlp.up_proj,0.0006905879,0.01000,0.227
21,mlp.down_proj,0.0005955849,0.01000,0.687
22,self_attn.q_proj,0.0066680043,0.01000,0.239
22,self_attn.k_proj,0.0023850383,0.01000,0.228
22,self_attn.v_proj,0.0032360287,0.01000,0.228
22,self_attn.o_proj,0.0000882234,0.01000,0.463
22,mlp.gate_proj,0.0005762426,0.01000,0.229
22,mlp.up_proj,0.0007525707,0.01000,0.229
22,mlp.down_proj,0.0006313954,0.01000,0.699
23,self_attn.q_proj,0.0073616655,0.01000,0.235
23,self_attn.k_proj,0.0030943265,0.01000,0.226
23,self_attn.v_proj,0.0036315418,0.01000,0.227
23,self_attn.o_proj,0.0001049786,0.01000,0.460
23,mlp.gate_proj,0.0006277931,0.01000,0.230
23,mlp.up_proj,0.0008375677,0.01000,0.229
23,mlp.down_proj,0.0006724397,0.01000,0.693
24,self_attn.q_proj,0.0149952166,0.01000,0.240
24,self_attn.k_proj,0.0053064398,0.01000,0.230
24,self_attn.v_proj,0.0057998489,0.01000,0.229
24,self_attn.o_proj,0.0001213201,0.01000,0.455
24,mlp.gate_proj,0.0005788480,0.01000,0.230
24,mlp.up_proj,0.0008078051,0.01000,0.230
24,mlp.down_proj,0.0006965869,0.01000,0.703
25,self_attn.q_proj,0.0209445632,0.01000,0.240
25,self_attn.k_proj,0.0065191538,0.01000,0.233
25,self_attn.v_proj,0.0095592763,0.01000,0.231
25,self_attn.o_proj,0.0001847470,0.01000,0.466
25,mlp.gate_proj,0.0005431011,0.01000,0.231
25,mlp.up_proj,0.0007976848,0.01000,0.232
25,mlp.down_proj,0.0008871590,0.01000,0.700
26,self_attn.q_proj,0.0261648699,0.01000,0.238
26,self_attn.k_proj,0.0069253001,0.01000,0.233
26,self_attn.v_proj,0.0095860545,0.01000,0.232
26,self_attn.o_proj,0.0007540099,0.01000,0.463
26,mlp.gate_proj,0.0006003001,0.01000,0.228
26,mlp.up_proj,0.0008642617,0.01000,0.228
26,mlp.down_proj,0.0012626921,0.01000,0.693
27,self_attn.q_proj,0.0119673502,0.01000,0.230
27,self_attn.k_proj,0.0052954315,0.01000,0.227
27,self_attn.v_proj,0.0064633451,0.01000,0.226
27,self_attn.o_proj,0.0004531447,0.01000,0.460
27,mlp.gate_proj,0.0014340435,0.01000,0.227
27,mlp.up_proj,0.0016221918,0.01000,0.227
27,mlp.down_proj,0.0019386779,0.01000,0.691