File size: 8,680 Bytes
bb44350
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00034001,0.01000,0.702
0,self_attn.v_proj,0.00026275,0.01000,0.516
0,self_attn.q_proj,0.00078015,0.01000,0.472
0,self_attn.o_proj,0.00021305,0.01000,0.944
0,mlp.up_proj,0.00412678,0.01000,0.466
0,mlp.gate_proj,0.00822148,0.01000,0.479
0,mlp.down_proj,0.00023430,0.01000,1.461
1,self_attn.k_proj,0.00014082,0.01000,0.490
1,self_attn.v_proj,0.00013241,0.01000,0.586
1,self_attn.q_proj,0.00031780,0.01000,0.512
1,self_attn.o_proj,0.00004038,0.01000,1.020
1,mlp.up_proj,0.01444682,0.01000,0.496
1,mlp.gate_proj,0.04915192,0.01000,0.495
1,mlp.down_proj,0.00029908,0.01000,1.443
2,self_attn.k_proj,0.00026053,0.01000,0.468
2,self_attn.v_proj,0.00024813,0.01000,0.477
2,self_attn.q_proj,0.00060980,0.01000,0.515
2,self_attn.o_proj,0.00006841,0.01000,1.000
2,mlp.up_proj,0.01214469,0.01000,0.488
2,mlp.gate_proj,0.03373746,0.01000,0.526
2,mlp.down_proj,0.01297616,0.01000,1.444
3,self_attn.k_proj,0.00230989,0.01000,0.465
3,self_attn.v_proj,0.00233178,0.01000,0.470
3,self_attn.q_proj,0.00470302,0.01000,0.480
3,self_attn.o_proj,0.00012092,0.01000,1.027
3,mlp.up_proj,0.01660008,0.01000,0.603
3,mlp.gate_proj,0.04289370,0.01000,0.484
3,mlp.down_proj,0.00092249,0.01000,1.553
4,self_attn.k_proj,0.00206668,0.01000,0.468
4,self_attn.v_proj,0.00214147,0.01000,0.476
4,self_attn.q_proj,0.00418732,0.01000,-1.693
4,self_attn.o_proj,0.00030304,0.01000,0.958
4,mlp.up_proj,0.01767924,0.01000,0.577
4,mlp.gate_proj,0.04030780,0.01000,0.628
4,mlp.down_proj,0.00111819,0.01000,1.658
5,self_attn.k_proj,0.00309932,0.01000,0.472
5,self_attn.v_proj,0.00331202,0.01000,0.475
5,self_attn.q_proj,0.00744162,0.01000,0.474
5,self_attn.o_proj,0.00036463,0.01000,0.938
5,mlp.up_proj,0.01660982,0.01000,0.518
5,mlp.gate_proj,0.02776664,0.01000,0.543
5,mlp.down_proj,0.00127475,0.01000,1.419
6,self_attn.k_proj,0.00246792,0.01000,0.541
6,self_attn.v_proj,0.00227531,0.01000,0.496
6,self_attn.q_proj,0.00543098,0.01000,0.474
6,self_attn.o_proj,0.00031531,0.01000,0.913
6,mlp.up_proj,0.02119459,0.01000,0.491
6,mlp.gate_proj,0.03364027,0.01000,0.556
6,mlp.down_proj,0.00169318,0.01000,1.440
7,self_attn.k_proj,0.00427833,0.01000,0.467
7,self_attn.v_proj,0.00491385,0.01000,0.468
7,self_attn.q_proj,0.01039105,0.01000,0.461
7,self_attn.o_proj,0.00045247,0.01000,1.037
7,mlp.up_proj,0.02380912,0.01000,0.474
7,mlp.gate_proj,0.03846249,0.01000,0.477
7,mlp.down_proj,0.00207670,0.01000,1.418
8,self_attn.k_proj,0.00580886,0.01000,0.458
8,self_attn.v_proj,0.00546446,0.01000,0.457
8,self_attn.q_proj,0.01283393,0.01000,0.464
8,self_attn.o_proj,0.00049309,0.01000,0.930
8,mlp.up_proj,0.02529081,0.01000,0.506
8,mlp.gate_proj,0.03940681,0.01000,0.549
8,mlp.down_proj,0.00239061,0.01000,1.463
9,self_attn.k_proj,0.01022408,0.01000,0.466
9,self_attn.v_proj,0.01063569,0.01000,0.464
9,self_attn.q_proj,0.02464896,0.01000,0.456
9,self_attn.o_proj,0.00082228,0.01000,0.913
9,mlp.up_proj,0.02869781,0.01000,0.475
9,mlp.gate_proj,0.04569711,0.01000,0.495
9,mlp.down_proj,0.00334036,0.01000,1.488
10,self_attn.k_proj,0.00897335,0.01000,0.463
10,self_attn.v_proj,0.00938525,0.01000,0.476
10,self_attn.q_proj,0.02165450,0.01000,0.472
10,self_attn.o_proj,0.00080374,0.01000,0.915
10,mlp.up_proj,0.02908845,0.01000,0.459
10,mlp.gate_proj,0.04619259,0.01000,0.469
10,mlp.down_proj,0.00457235,0.01000,1.560
11,self_attn.k_proj,0.01702636,0.01000,0.470
11,self_attn.v_proj,0.01571462,0.01000,0.448
11,self_attn.q_proj,0.04408321,0.01000,0.460
11,self_attn.o_proj,0.00194463,0.01000,0.917
11,mlp.up_proj,0.02965630,0.01000,0.471
11,mlp.gate_proj,0.03877314,0.01000,0.465
11,mlp.down_proj,0.00576400,0.01000,-0.688
12,self_attn.k_proj,0.01535154,0.01000,0.461
12,self_attn.v_proj,0.01573815,0.01000,0.463
12,self_attn.q_proj,0.04120466,0.01000,0.464
12,self_attn.o_proj,0.00082521,0.01000,0.993
12,mlp.up_proj,0.02786373,0.01000,0.508
12,mlp.gate_proj,0.03390844,0.01000,0.500
12,mlp.down_proj,0.00530050,0.01000,1.504
13,self_attn.k_proj,0.01469768,0.01000,0.532
13,self_attn.v_proj,0.01746682,0.01000,0.644
13,self_attn.q_proj,0.04317660,0.01000,0.650
13,self_attn.o_proj,0.00115520,0.01000,0.997
13,mlp.up_proj,0.02967896,0.01000,0.475
13,mlp.gate_proj,0.03677811,0.01000,0.458
13,mlp.down_proj,0.00540835,0.01000,1.386
14,self_attn.k_proj,0.01980565,0.01000,0.452
14,self_attn.v_proj,0.02136633,0.01000,0.458
14,self_attn.q_proj,0.05437878,0.01000,0.463
14,self_attn.o_proj,0.00118582,0.01000,0.909
14,mlp.up_proj,0.03194932,0.01000,0.581
14,mlp.gate_proj,0.03921878,0.01000,0.569
14,mlp.down_proj,0.00719125,0.01000,1.398
15,self_attn.k_proj,0.03463616,0.01000,0.614
15,self_attn.v_proj,0.04363632,0.01000,0.560
15,self_attn.q_proj,0.10855717,0.01000,0.587
15,self_attn.o_proj,0.00174209,0.01000,1.039
15,mlp.up_proj,0.03514949,0.01000,0.517
15,mlp.gate_proj,0.04189382,0.01000,0.461
15,mlp.down_proj,0.00778224,0.01000,1.585
16,self_attn.k_proj,0.05131978,0.01000,0.457
16,self_attn.v_proj,0.04501638,0.01000,0.453
16,self_attn.q_proj,0.13748899,0.01000,0.460
16,self_attn.o_proj,0.00201723,0.01000,0.920
16,mlp.up_proj,0.04067000,0.01000,0.425
16,mlp.gate_proj,0.04500043,0.01000,0.482
16,mlp.down_proj,0.01533213,0.01000,-0.971
17,self_attn.k_proj,0.10121436,0.01000,0.362
17,self_attn.v_proj,0.12345707,0.01000,0.434
17,self_attn.q_proj,0.30684415,0.01000,0.469
17,self_attn.o_proj,0.00474120,0.01000,0.883
17,mlp.up_proj,0.05722951,0.01000,0.361
17,mlp.gate_proj,0.06477357,0.01000,0.368
17,mlp.down_proj,0.01754329,0.01000,1.108
18,self_attn.k_proj,0.09428492,0.01000,0.359
18,self_attn.v_proj,0.10053023,0.01000,-1.804
18,self_attn.q_proj,0.29437009,0.01000,0.374
18,self_attn.o_proj,0.00352678,0.01000,0.796
18,mlp.up_proj,0.06900685,0.01000,0.379
18,mlp.gate_proj,0.07904451,0.01000,0.397
18,mlp.down_proj,0.02755920,0.01000,1.105
19,self_attn.k_proj,0.16187871,0.01000,0.356
19,self_attn.v_proj,0.20003729,0.01000,0.351
19,self_attn.q_proj,0.52686477,0.01000,0.369
19,self_attn.o_proj,0.00656477,0.01000,0.893
19,mlp.up_proj,0.08853976,0.01000,0.449
19,mlp.gate_proj,0.08336402,0.01000,0.426
19,mlp.down_proj,0.05588865,0.01000,1.080
20,self_attn.k_proj,0.22524926,0.01000,-2.716
20,self_attn.v_proj,0.26741582,0.01000,0.359
20,self_attn.q_proj,0.65623856,0.01000,0.358
20,self_attn.o_proj,0.00873903,0.01000,0.703
20,mlp.up_proj,0.09712939,0.01000,0.365
20,mlp.gate_proj,0.08698984,0.01000,0.385
20,mlp.down_proj,0.06682739,0.01000,1.080
21,self_attn.k_proj,0.39126575,0.01000,0.358
21,self_attn.v_proj,0.50307965,0.01000,0.393
21,self_attn.q_proj,1.09633744,0.01000,0.364
21,self_attn.o_proj,0.01702069,0.01000,0.759
21,mlp.up_proj,0.11749193,0.01000,0.390
21,mlp.gate_proj,0.09473881,0.01000,0.367
21,mlp.down_proj,0.09391166,0.01000,1.339
22,self_attn.k_proj,0.42912284,0.01000,0.366
22,self_attn.v_proj,0.62853205,0.01000,0.363
22,self_attn.q_proj,1.13549972,0.01000,0.362
22,self_attn.o_proj,0.01342478,0.01000,0.734
22,mlp.up_proj,0.12709107,0.01000,0.371
22,mlp.gate_proj,0.10018895,0.01000,0.380
22,mlp.down_proj,0.10143830,0.01000,1.094
23,self_attn.k_proj,0.59195518,0.01000,0.474
23,self_attn.v_proj,0.68701136,0.01000,0.384
23,self_attn.q_proj,1.32605648,0.01000,0.414
23,self_attn.o_proj,0.01738492,0.01000,0.719
23,mlp.up_proj,0.14314744,0.01000,0.361
23,mlp.gate_proj,0.11007850,0.01000,0.408
23,mlp.down_proj,0.10754839,0.01000,1.478
24,self_attn.k_proj,1.00415301,0.01000,0.361
24,self_attn.v_proj,1.12105525,0.01000,0.355
24,self_attn.q_proj,2.56474996,0.01000,0.358
24,self_attn.o_proj,0.02551685,0.01000,0.712
24,mlp.up_proj,0.13545924,0.01000,0.408
24,mlp.gate_proj,0.10024798,0.01000,0.363
24,mlp.down_proj,0.10790002,0.01000,1.191
25,self_attn.k_proj,1.19017565,0.01000,0.356
25,self_attn.v_proj,1.88630354,0.01000,0.358
25,self_attn.q_proj,3.16219616,0.01000,0.353
25,self_attn.o_proj,0.03715168,0.01000,0.753
25,mlp.up_proj,0.13330801,0.01000,0.360
25,mlp.gate_proj,0.09387642,0.01000,0.368
25,mlp.down_proj,0.13108285,0.01000,1.079
26,self_attn.k_proj,1.18263948,0.01000,0.436
26,self_attn.v_proj,1.67280781,0.01000,0.470
26,self_attn.q_proj,3.34765911,0.01000,0.454
26,self_attn.o_proj,0.09499875,0.01000,0.728
26,mlp.up_proj,0.14457943,0.01000,0.355
26,mlp.gate_proj,0.10359854,0.01000,0.367
26,mlp.down_proj,0.20188543,0.01000,1.095
27,self_attn.k_proj,0.88096058,0.01000,0.350
27,self_attn.v_proj,1.04464459,0.01000,0.357
27,self_attn.q_proj,1.89896679,0.01000,0.349
27,self_attn.o_proj,0.05569953,0.01000,0.722
27,mlp.up_proj,0.25829488,0.01000,0.365
27,mlp.gate_proj,0.24046963,0.01000,0.367
27,mlp.down_proj,0.23538056,0.01000,1.094