File size: 7,440 Bytes
ba242ea
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
layer,module,loss,damp,time
0,self_attn.k_proj,0.00268859,0.01000,2.297
0,self_attn.v_proj,0.00012146,0.01000,1.532
0,self_attn.q_proj,0.00339818,0.01000,1.401
0,self_attn.o_proj,0.00007466,0.01000,3.458
0,mlp.up_proj,0.00165959,0.01000,3.002
0,mlp.gate_proj,0.00176081,0.01000,2.685
0,mlp.down_proj,0.00171541,0.01000,19.171
1,self_attn.k_proj,0.00514033,0.01000,3.422
1,self_attn.v_proj,0.00119326,0.01000,3.608
1,self_attn.q_proj,0.00603395,0.01000,1.613
1,self_attn.o_proj,0.00048323,0.01000,3.834
1,mlp.up_proj,0.00365061,0.01000,1.590
1,mlp.gate_proj,0.00421130,0.01000,6.380
1,mlp.down_proj,0.02673751,0.01000,7.127
2,self_attn.k_proj,0.00933676,0.01000,1.540
2,self_attn.v_proj,0.00363998,0.01000,2.579
2,self_attn.q_proj,0.01070433,0.01000,3.024
2,self_attn.o_proj,0.00095308,0.01000,1.640
2,mlp.up_proj,0.00610160,0.01000,10.450
2,mlp.gate_proj,0.00684849,0.01000,3.323
2,mlp.down_proj,0.00416326,0.01000,11.194
3,self_attn.k_proj,0.01245183,0.01000,3.158
3,self_attn.v_proj,0.00521770,0.01000,3.034
3,self_attn.q_proj,0.01259811,0.01000,3.280
3,self_attn.o_proj,0.00154380,0.01000,8.060
3,mlp.up_proj,0.00826654,0.01000,1.420
3,mlp.gate_proj,0.00868698,0.01000,1.575
3,mlp.down_proj,0.00818474,0.01000,12.702
4,self_attn.k_proj,0.01399883,0.01000,2.538
4,self_attn.v_proj,0.00609351,0.01000,9.978
4,self_attn.q_proj,0.01455349,0.01000,4.893
4,self_attn.o_proj,0.00308353,0.01000,1.867
4,mlp.up_proj,0.01101172,0.01000,1.507
4,mlp.gate_proj,0.01136096,0.01000,3.298
4,mlp.down_proj,0.01204515,0.01000,11.278
5,self_attn.k_proj,0.01381846,0.01000,5.158
5,self_attn.v_proj,0.00638836,0.01000,1.610
5,self_attn.q_proj,0.01450016,0.01000,1.798
5,self_attn.o_proj,0.00360254,0.01000,1.624
5,mlp.up_proj,0.01348488,0.01000,4.580
5,mlp.gate_proj,0.01340446,0.01000,1.761
5,mlp.down_proj,0.01536761,0.01000,22.166
6,self_attn.k_proj,0.01536616,0.01000,1.813
6,self_attn.v_proj,0.00765775,0.01000,1.057
6,self_attn.q_proj,0.01647044,0.01000,1.589
6,self_attn.o_proj,0.00484225,0.01000,1.817
6,mlp.up_proj,0.01586073,0.01000,2.670
6,mlp.gate_proj,0.01545403,0.01000,2.092
6,mlp.down_proj,0.01897714,0.01000,16.333
7,self_attn.k_proj,0.01551268,0.01000,2.392
7,self_attn.v_proj,0.00767670,0.01000,0.989
7,self_attn.q_proj,0.01955890,0.01000,2.897
7,self_attn.o_proj,0.00776187,0.01000,3.109
7,mlp.up_proj,0.02011534,0.01000,5.595
7,mlp.gate_proj,0.01881913,0.01000,8.879
7,mlp.down_proj,0.13795254,0.01000,5.252
8,self_attn.k_proj,0.01517920,0.01000,2.907
8,self_attn.v_proj,0.01077128,0.01000,3.195
8,self_attn.q_proj,0.01539815,0.01000,0.929
8,self_attn.o_proj,0.01244297,0.01000,8.706
8,mlp.up_proj,0.02336273,0.01000,1.006
8,mlp.gate_proj,0.02230725,0.01000,0.914
8,mlp.down_proj,0.03689886,0.01000,7.602
9,self_attn.k_proj,0.01419967,0.01000,3.176
9,self_attn.v_proj,0.00935659,0.01000,0.916
9,self_attn.q_proj,0.01437793,0.01000,7.752
9,self_attn.o_proj,0.01545753,0.01000,1.956
9,mlp.up_proj,0.02452471,0.01000,1.045
9,mlp.gate_proj,0.02163836,0.01000,0.934
9,mlp.down_proj,0.04093376,0.01000,8.590
10,self_attn.k_proj,0.01597095,0.01000,7.668
10,self_attn.v_proj,0.01030280,0.01000,0.955
10,self_attn.q_proj,0.01661386,0.01000,0.953
10,self_attn.o_proj,0.02046761,0.01000,0.961
10,mlp.up_proj,0.02449678,0.01000,1.783
10,mlp.gate_proj,0.02200876,0.01000,3.467
10,mlp.down_proj,0.04767245,0.01000,12.654
11,self_attn.k_proj,0.01583570,0.01000,0.988
11,self_attn.v_proj,0.01004474,0.01000,1.007
11,self_attn.q_proj,0.01681633,0.01000,0.953
11,self_attn.o_proj,0.02400013,0.01000,0.944
11,mlp.up_proj,0.02487121,0.01000,2.184
11,mlp.gate_proj,0.02244228,0.01000,0.996
11,mlp.down_proj,0.05173288,0.01000,18.105
12,self_attn.k_proj,0.01769731,0.01000,0.839
12,self_attn.v_proj,0.01472340,0.01000,0.551
12,self_attn.q_proj,0.01947594,0.01000,0.509
12,self_attn.o_proj,0.03308697,0.01000,0.642
12,mlp.up_proj,0.02705463,0.01000,0.573
12,mlp.gate_proj,0.02433215,0.01000,0.640
12,mlp.down_proj,0.06660484,0.01000,2.787
13,self_attn.k_proj,0.01724737,0.01000,0.509
13,self_attn.v_proj,0.01275570,0.01000,0.494
13,self_attn.q_proj,0.01846544,0.01000,0.557
13,self_attn.o_proj,0.02876754,0.01000,0.545
13,mlp.up_proj,0.02806181,0.01000,0.560
13,mlp.gate_proj,0.02527489,0.01000,0.524
13,mlp.down_proj,0.07755652,0.01000,2.416
14,self_attn.k_proj,0.01810676,0.01000,0.578
14,self_attn.v_proj,0.01431919,0.01000,0.505
14,self_attn.q_proj,0.01790303,0.01000,0.502
14,self_attn.o_proj,0.03729445,0.01000,0.527
14,mlp.up_proj,0.03043460,0.01000,0.550
14,mlp.gate_proj,0.02668553,0.01000,0.534
14,mlp.down_proj,0.10596363,0.01000,2.331
15,self_attn.k_proj,0.01930179,0.01000,0.515
15,self_attn.v_proj,0.02241649,0.01000,0.496
15,self_attn.q_proj,0.02011626,0.01000,0.497
15,self_attn.o_proj,0.05061907,0.01000,0.566
15,mlp.up_proj,0.03395730,0.01000,0.569
15,mlp.gate_proj,0.02911986,0.01000,0.593
15,mlp.down_proj,0.14194915,0.01000,2.274
16,self_attn.k_proj,0.02059570,0.01000,0.511
16,self_attn.v_proj,0.02086210,0.01000,0.496
16,self_attn.q_proj,0.02103812,0.01000,0.489
16,self_attn.o_proj,0.05604012,0.01000,0.514
16,mlp.up_proj,0.04187595,0.01000,0.539
16,mlp.gate_proj,0.03528344,0.01000,0.510
16,mlp.down_proj,0.21391028,0.01000,2.362
17,self_attn.k_proj,0.01972736,0.01000,0.528
17,self_attn.v_proj,0.02926025,0.01000,0.498
17,self_attn.q_proj,0.02005677,0.01000,0.498
17,self_attn.o_proj,0.09542210,0.01000,0.517
17,mlp.up_proj,0.04948561,0.01000,0.617
17,mlp.gate_proj,0.04208370,0.01000,0.527
17,mlp.down_proj,0.30404621,0.01000,2.336
18,self_attn.k_proj,0.01914989,0.01000,0.672
18,self_attn.v_proj,0.03310600,0.01000,0.540
18,self_attn.q_proj,0.02003000,0.01000,0.524
18,self_attn.o_proj,0.10906528,0.01000,0.543
18,mlp.up_proj,0.06152352,0.01000,0.530
18,mlp.gate_proj,0.05048580,0.01000,0.507
18,mlp.down_proj,0.47315487,0.01000,2.273
19,self_attn.k_proj,0.01988266,0.01000,0.521
19,self_attn.v_proj,0.04468218,0.01000,0.504
19,self_attn.q_proj,0.02098379,0.01000,0.499
19,self_attn.o_proj,0.11830558,0.01000,0.524
19,mlp.up_proj,0.07140406,0.01000,0.569
19,mlp.gate_proj,0.05682839,0.01000,0.516
19,mlp.down_proj,0.64388824,0.01000,2.303
20,self_attn.k_proj,0.01980521,0.01000,0.517
20,self_attn.v_proj,0.05296587,0.01000,0.492
20,self_attn.q_proj,0.02124322,0.01000,0.521
20,self_attn.o_proj,0.11964528,0.01000,0.517
20,mlp.up_proj,0.07959354,0.01000,0.533
20,mlp.gate_proj,0.06235816,0.01000,0.511
20,mlp.down_proj,0.80122459,0.01000,2.308
21,self_attn.k_proj,0.02273879,0.01000,0.526
21,self_attn.v_proj,0.06846954,0.01000,0.494
21,self_attn.q_proj,0.02335146,0.01000,0.498
21,self_attn.o_proj,0.21736440,0.01000,0.515
21,mlp.up_proj,0.09114946,0.01000,0.533
21,mlp.gate_proj,0.07021903,0.01000,0.509
21,mlp.down_proj,1.01436162,0.01000,2.285
22,self_attn.k_proj,0.02368175,0.01000,0.515
22,self_attn.v_proj,0.07183458,0.01000,0.500
22,self_attn.q_proj,0.02609063,0.01000,0.585
22,self_attn.o_proj,0.34090981,0.01000,0.516
22,mlp.up_proj,0.10087807,0.01000,0.555
22,mlp.gate_proj,0.07864191,0.01000,0.506
22,mlp.down_proj,1.41661644,0.01000,2.276
23,self_attn.k_proj,0.02159666,0.01000,0.523
23,self_attn.v_proj,0.08762348,0.01000,0.498
23,self_attn.q_proj,0.02072346,0.01000,0.494
23,self_attn.o_proj,0.76461768,0.01000,0.515
23,mlp.up_proj,0.09932031,0.01000,0.525
23,mlp.gate_proj,0.08260745,0.01000,0.506
23,mlp.down_proj,2.73030257,0.01000,2.283