File size: 7,379 Bytes
ba2b22a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
layer,module,loss,damp,time
0,self_attn.qkv_proj,0.0000029813,0.05000,2.185
0,self_attn.o_proj,0.0000001116,0.05000,1.084
0,mlp.gate_proj,0.0000072175,0.05000,2.485
0,mlp.up_proj,0.0000068269,0.05000,2.472
0,mlp.down_proj,0.0000003002,0.05000,2.818
1,self_attn.qkv_proj,0.0000198021,0.05000,1.178
1,self_attn.o_proj,0.0000000840,0.05000,1.074
1,mlp.gate_proj,0.0000090921,0.05000,2.970
1,mlp.up_proj,0.0000082698,0.05000,3.030
1,mlp.down_proj,0.0000004386,0.05000,3.012
2,self_attn.qkv_proj,0.0000369951,0.05000,1.042
2,self_attn.o_proj,0.0000001405,0.05000,1.034
2,mlp.gate_proj,0.0000112209,0.05000,3.049
2,mlp.up_proj,0.0000100619,0.05000,3.136
2,mlp.down_proj,0.0000003945,0.05000,2.978
3,self_attn.qkv_proj,0.0000493181,0.05000,1.000
3,self_attn.o_proj,0.0000001907,0.05000,1.057
3,mlp.gate_proj,0.0000116083,0.05000,2.194
3,mlp.up_proj,0.0000099847,0.05000,2.211
3,mlp.down_proj,0.0001575425,0.05000,2.915
4,self_attn.qkv_proj,0.0000429134,0.05000,1.015
4,self_attn.o_proj,0.0000005166,0.05000,1.036
4,mlp.gate_proj,0.0000153442,0.05000,2.213
4,mlp.up_proj,0.0000123836,0.05000,2.234
4,mlp.down_proj,0.0000009558,0.05000,2.901
5,self_attn.qkv_proj,0.0000511098,0.05000,1.029
5,self_attn.o_proj,0.0000007915,0.05000,0.992
5,mlp.gate_proj,0.0000157261,0.05000,2.142
5,mlp.up_proj,0.0000123270,0.05000,2.167
5,mlp.down_proj,0.0000011092,0.05000,2.916
6,self_attn.qkv_proj,0.0000368397,0.05000,1.005
6,self_attn.o_proj,0.0000010816,0.05000,1.004
6,mlp.gate_proj,0.0000144746,0.05000,2.321
6,mlp.up_proj,0.0000120766,0.05000,2.343
6,mlp.down_proj,0.0000013575,0.05000,2.901
7,self_attn.qkv_proj,0.0000558010,0.05000,0.997
7,self_attn.o_proj,0.0000015489,0.05000,1.001
7,mlp.up_proj,0.0000107158,0.05000,2.283
7,mlp.gate_proj,0.0000121614,0.05000,2.292
7,mlp.down_proj,0.0000013054,0.05000,2.919
8,self_attn.qkv_proj,0.0000478846,0.05000,1.005
8,self_attn.o_proj,0.0000010530,0.05000,1.015
8,mlp.gate_proj,0.0000116524,0.05000,2.327
8,mlp.up_proj,0.0000112374,0.05000,2.347
8,mlp.down_proj,0.0000012097,0.05000,2.928
9,self_attn.qkv_proj,0.0000377997,0.05000,1.027
9,self_attn.o_proj,0.0000008833,0.05000,1.020
9,mlp.up_proj,0.0000130112,0.05000,2.346
9,mlp.gate_proj,0.0000130494,0.05000,2.366
9,mlp.down_proj,0.0000013272,0.05000,2.956
10,self_attn.qkv_proj,0.0000416774,0.05000,1.002
10,self_attn.o_proj,0.0000014399,0.05000,0.995
10,mlp.gate_proj,0.0000147789,0.05000,2.278
10,mlp.up_proj,0.0000146073,0.05000,2.298
10,mlp.down_proj,0.0000016522,0.05000,2.917
11,self_attn.qkv_proj,0.0000451865,0.05000,0.999
11,self_attn.o_proj,0.0000025101,0.05000,1.019
11,mlp.up_proj,0.0000155388,0.05000,2.297
11,mlp.gate_proj,0.0000147828,0.05000,2.319
11,mlp.down_proj,0.0000018731,0.05000,2.878
12,self_attn.qkv_proj,0.0000411135,0.05000,0.997
12,self_attn.o_proj,0.0000016274,0.05000,0.984
12,mlp.gate_proj,0.0000138808,0.05000,2.238
12,mlp.up_proj,0.0000153072,0.05000,2.255
12,mlp.down_proj,0.0000019512,0.05000,2.913
13,self_attn.qkv_proj,0.0000524880,0.05000,1.055
13,self_attn.o_proj,0.0000025486,0.05000,0.983
13,mlp.gate_proj,0.0000134808,0.05000,2.241
13,mlp.up_proj,0.0000157018,0.05000,2.267
13,mlp.down_proj,0.0000017552,0.05000,2.904
14,self_attn.qkv_proj,0.0000434523,0.05000,1.007
14,self_attn.o_proj,0.0000018440,0.05000,1.004
14,mlp.up_proj,0.0000157787,0.05000,2.369
14,mlp.gate_proj,0.0000136520,0.05000,2.391
14,mlp.down_proj,0.0000018066,0.05000,2.874
15,self_attn.qkv_proj,0.0000482138,0.05000,1.006
15,self_attn.o_proj,0.0000023607,0.05000,0.996
15,mlp.up_proj,0.0000184480,0.05000,2.258
15,mlp.gate_proj,0.0000159979,0.05000,2.285
15,mlp.down_proj,0.0000022394,0.05000,2.879
16,self_attn.qkv_proj,0.0000460684,0.05000,1.004
16,self_attn.o_proj,0.0000029966,0.05000,0.996
16,mlp.up_proj,0.0000173775,0.05000,2.229
16,mlp.gate_proj,0.0000149928,0.05000,2.250
16,mlp.down_proj,0.0000026397,0.05000,2.927
17,self_attn.qkv_proj,0.0000391842,0.05000,1.013
17,self_attn.o_proj,0.0000019919,0.05000,1.004
17,mlp.gate_proj,0.0000157793,0.05000,2.170
17,mlp.up_proj,0.0000185717,0.05000,2.195
17,mlp.down_proj,0.0000032989,0.05000,2.975
18,self_attn.qkv_proj,0.0000400155,0.05000,1.004
18,self_attn.o_proj,0.0000047167,0.05000,1.026
18,mlp.gate_proj,0.0000173240,0.05000,2.357
18,mlp.up_proj,0.0000200385,0.05000,2.378
18,mlp.down_proj,0.0000046034,0.05000,2.894
19,self_attn.qkv_proj,0.0000434654,0.05000,0.989
19,self_attn.o_proj,0.0000067645,0.05000,1.010
19,mlp.gate_proj,0.0000196353,0.05000,2.235
19,mlp.up_proj,0.0000223742,0.05000,2.258
19,mlp.down_proj,0.0000056410,0.05000,2.882
20,self_attn.qkv_proj,0.0000463234,0.05000,1.051
20,self_attn.o_proj,0.0000086217,0.05000,0.987
20,mlp.gate_proj,0.0000240742,0.05000,2.232
20,mlp.up_proj,0.0000274313,0.05000,2.254
20,mlp.down_proj,0.0000060875,0.05000,2.883
21,self_attn.qkv_proj,0.0000501621,0.05000,1.009
21,self_attn.o_proj,0.0000087416,0.05000,1.061
21,mlp.gate_proj,0.0000260591,0.05000,2.269
21,mlp.up_proj,0.0000302359,0.05000,2.288
21,mlp.down_proj,0.0000079578,0.05000,2.881
22,self_attn.qkv_proj,0.0000489731,0.05000,1.012
22,self_attn.o_proj,0.0000178103,0.05000,1.010
22,mlp.gate_proj,0.0000266433,0.05000,2.329
22,mlp.up_proj,0.0000314974,0.05000,2.348
22,mlp.down_proj,0.0000063287,0.05000,2.896
23,self_attn.qkv_proj,0.0000455062,0.05000,1.014
23,self_attn.o_proj,0.0000040400,0.05000,1.016
23,mlp.gate_proj,0.0000260997,0.05000,2.268
23,mlp.up_proj,0.0000305928,0.05000,2.296
23,mlp.down_proj,0.0000047429,0.05000,2.939
24,self_attn.qkv_proj,0.0000446666,0.05000,1.041
24,self_attn.o_proj,0.0000039479,0.05000,1.019
24,mlp.gate_proj,0.0000253762,0.05000,2.208
24,mlp.up_proj,0.0000301786,0.05000,2.233
24,mlp.down_proj,0.0000058199,0.05000,2.930
25,self_attn.qkv_proj,0.0000491577,0.05000,1.018
25,self_attn.o_proj,0.0000154031,0.05000,0.992
25,mlp.up_proj,0.0000329190,0.05000,2.297
25,mlp.gate_proj,0.0000275557,0.05000,2.325
25,mlp.down_proj,0.0000069694,0.05000,2.888
26,self_attn.qkv_proj,0.0000472160,0.05000,1.000
26,self_attn.o_proj,0.0000240206,0.05000,1.013
26,mlp.up_proj,0.0000331026,0.05000,2.370
26,mlp.gate_proj,0.0000278213,0.05000,2.383
26,mlp.down_proj,0.0000075888,0.05000,2.879
27,self_attn.qkv_proj,0.0000390911,0.05000,0.997
27,self_attn.o_proj,0.0000069230,0.05000,0.982
27,mlp.up_proj,0.0000385140,0.05000,2.292
27,mlp.gate_proj,0.0000329811,0.05000,2.326
27,mlp.down_proj,0.0000150313,0.05000,2.866
28,self_attn.qkv_proj,0.0000598709,0.05000,1.005
28,self_attn.o_proj,0.0000301717,0.05000,0.998
28,mlp.up_proj,0.0000483479,0.05000,2.217
28,mlp.gate_proj,0.0000434695,0.05000,2.222
28,mlp.down_proj,0.0000254065,0.05000,2.887
29,self_attn.qkv_proj,0.0000556419,0.05000,1.006
29,self_attn.o_proj,0.0000174969,0.05000,0.994
29,mlp.up_proj,0.0000489981,0.05000,2.362
29,mlp.gate_proj,0.0000497381,0.05000,2.376
29,mlp.down_proj,0.0000467694,0.05000,2.925
30,self_attn.qkv_proj,0.0000398120,0.05000,1.037
30,self_attn.o_proj,0.0000189608,0.05000,0.996
30,mlp.up_proj,0.0000495070,0.05000,2.266
30,mlp.gate_proj,0.0000596360,0.05000,2.280
30,mlp.down_proj,0.0003538760,0.05000,2.929
31,self_attn.qkv_proj,0.0000012725,0.05000,1.016
31,self_attn.o_proj,0.0000023444,0.05000,0.995
31,mlp.up_proj,0.0000169833,0.05000,2.230
31,mlp.gate_proj,0.0000333658,0.05000,2.260
31,mlp.down_proj,0.0001084470,0.05000,2.915