File size: 7,379 Bytes
f09e7d3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
layer,module,loss,samples,damp,time
0,self_attn.qkv_proj,0.0000036928,0.05000,1.790
0,self_attn.o_proj,0.0000001945,0.05000,1.331
0,mlp.up_proj,0.0000102390,0.05000,2.562
0,mlp.gate_proj,0.0000106993,0.05000,2.597
0,mlp.down_proj,0.0000007873,0.05000,3.140
1,self_attn.qkv_proj,0.0000288658,0.05000,1.350
1,self_attn.o_proj,0.0000003944,0.05000,1.314
1,mlp.up_proj,0.0000151884,0.05000,3.192
1,mlp.gate_proj,0.0000162423,0.05000,3.248
1,mlp.down_proj,0.0000017862,0.05000,3.335
2,self_attn.qkv_proj,0.0000672307,0.05000,1.265
2,self_attn.o_proj,0.0000004262,0.05000,1.162
2,mlp.up_proj,0.0000219007,0.05000,2.728
2,mlp.gate_proj,0.0000236388,0.05000,2.739
2,mlp.down_proj,0.0000015235,0.05000,3.191
3,self_attn.qkv_proj,0.0000958284,0.05000,1.113
3,self_attn.o_proj,0.0000007994,0.05000,1.071
3,mlp.gate_proj,0.0000320000,0.05000,2.401
3,mlp.up_proj,0.0000289537,0.05000,2.435
3,mlp.down_proj,0.0003337474,0.05000,3.272
4,self_attn.qkv_proj,0.0000909789,0.05000,1.106
4,self_attn.o_proj,0.0000012312,0.05000,1.100
4,mlp.up_proj,0.0000345329,0.05000,2.538
4,mlp.gate_proj,0.0000400292,0.05000,2.554
4,mlp.down_proj,0.0000039765,0.05000,3.210
5,self_attn.qkv_proj,0.0001159516,0.05000,1.133
5,self_attn.o_proj,0.0000017395,0.05000,1.128
5,mlp.up_proj,0.0000430088,0.05000,2.448
5,mlp.gate_proj,0.0000509520,0.05000,2.467
5,mlp.down_proj,0.0000057463,0.05000,3.189
6,self_attn.qkv_proj,0.0000961327,0.05000,1.115
6,self_attn.o_proj,0.0000022428,0.05000,1.125
6,mlp.up_proj,0.0000430322,0.05000,2.552
6,mlp.gate_proj,0.0000487083,0.05000,2.587
6,mlp.down_proj,0.0000063000,0.05000,3.109
7,self_attn.qkv_proj,0.0001434261,0.05000,1.093
7,self_attn.o_proj,0.0000029053,0.05000,1.076
7,mlp.up_proj,0.0000461718,0.05000,2.553
7,mlp.gate_proj,0.0000501546,0.05000,2.579
7,mlp.down_proj,0.0000080737,0.05000,3.201
8,self_attn.qkv_proj,0.0001350463,0.05000,1.091
8,self_attn.o_proj,0.0000040604,0.05000,1.109
8,mlp.up_proj,0.0000482156,0.05000,2.403
8,mlp.gate_proj,0.0000492231,0.05000,2.431
8,mlp.down_proj,0.0000089525,0.05000,3.215
9,self_attn.qkv_proj,0.0001197565,0.05000,1.137
9,self_attn.o_proj,0.0000039595,0.05000,1.111
9,mlp.up_proj,0.0000522804,0.05000,2.498
9,mlp.gate_proj,0.0000520745,0.05000,2.531
9,mlp.down_proj,0.0000084691,0.05000,3.158
10,self_attn.qkv_proj,0.0001285350,0.05000,1.141
10,self_attn.o_proj,0.0000056212,0.05000,1.134
10,mlp.up_proj,0.0000538686,0.05000,2.537
10,mlp.gate_proj,0.0000539127,0.05000,2.535
10,mlp.down_proj,0.0000092388,0.05000,3.212
11,self_attn.qkv_proj,0.0001265468,0.05000,1.102
11,self_attn.o_proj,0.0000049263,0.05000,1.106
11,mlp.up_proj,0.0000561754,0.05000,2.543
11,mlp.gate_proj,0.0000538750,0.05000,2.569
11,mlp.down_proj,0.0000098257,0.05000,3.231
12,self_attn.qkv_proj,0.0001307771,0.05000,1.150
12,self_attn.o_proj,0.0000049451,0.05000,1.125
12,mlp.gate_proj,0.0000524987,0.05000,2.460
12,mlp.up_proj,0.0000571596,0.05000,2.484
12,mlp.down_proj,0.0000116566,0.05000,3.190
13,self_attn.qkv_proj,0.0001563531,0.05000,1.108
13,self_attn.o_proj,0.0000065090,0.05000,1.103
13,mlp.up_proj,0.0000612276,0.05000,2.490
13,mlp.gate_proj,0.0000543759,0.05000,2.508
13,mlp.down_proj,0.0000127317,0.05000,3.187
14,self_attn.qkv_proj,0.0001393042,0.05000,1.131
14,self_attn.o_proj,0.0000061571,0.05000,1.116
14,mlp.gate_proj,0.0000600704,0.05000,2.562
14,mlp.up_proj,0.0000672100,0.05000,2.584
14,mlp.down_proj,0.0000145146,0.05000,3.154
15,self_attn.qkv_proj,0.0001545983,0.05000,1.100
15,self_attn.o_proj,0.0000057894,0.05000,1.103
15,mlp.gate_proj,0.0000662487,0.05000,2.484
15,mlp.up_proj,0.0000739427,0.05000,2.506
15,mlp.down_proj,0.0000164698,0.05000,3.217
16,self_attn.qkv_proj,0.0001466132,0.05000,1.126
16,self_attn.o_proj,0.0000097625,0.05000,1.116
16,mlp.up_proj,0.0000786630,0.05000,2.562
16,mlp.gate_proj,0.0000699401,0.05000,2.584
16,mlp.down_proj,0.0000218803,0.05000,3.116
17,self_attn.qkv_proj,0.0001490546,0.05000,1.142
17,self_attn.o_proj,0.0000076505,0.05000,1.103
17,mlp.up_proj,0.0000841039,0.05000,2.591
17,mlp.gate_proj,0.0000739672,0.05000,2.615
17,mlp.down_proj,0.0000262042,0.05000,3.182
18,self_attn.qkv_proj,0.0001470632,0.05000,1.166
18,self_attn.o_proj,0.0000125533,0.05000,1.141
18,mlp.up_proj,0.0000932287,0.05000,2.532
18,mlp.gate_proj,0.0000829974,0.05000,2.548
18,mlp.down_proj,0.0000385317,0.05000,3.301
19,self_attn.qkv_proj,0.0001654606,0.05000,1.171
19,self_attn.o_proj,0.0000149239,0.05000,1.165
19,mlp.up_proj,0.0000991290,0.05000,2.623
19,mlp.gate_proj,0.0000894585,0.05000,2.664
19,mlp.down_proj,0.0000435778,0.05000,3.377
20,self_attn.qkv_proj,0.0001578730,0.05000,1.156
20,self_attn.o_proj,0.0000184642,0.05000,1.195
20,mlp.up_proj,0.0001209617,0.05000,2.661
20,mlp.gate_proj,0.0001092768,0.05000,2.687
20,mlp.down_proj,0.0000563793,0.05000,3.294
21,self_attn.qkv_proj,0.0001870555,0.05000,1.213
21,self_attn.o_proj,0.0000136906,0.05000,1.101
21,mlp.gate_proj,0.0001159161,0.05000,2.587
21,mlp.up_proj,0.0001299713,0.05000,2.605
21,mlp.down_proj,0.0000704598,0.05000,3.190
22,self_attn.qkv_proj,0.0001782628,0.05000,1.132
22,self_attn.o_proj,0.0000249007,0.05000,1.132
22,mlp.up_proj,0.0001397206,0.05000,2.564
22,mlp.gate_proj,0.0001231925,0.05000,2.572
22,mlp.down_proj,0.0000832951,0.05000,3.299
23,self_attn.qkv_proj,0.0001967909,0.05000,1.156
23,self_attn.o_proj,0.0000105388,0.05000,1.119
23,mlp.gate_proj,0.0001326374,0.05000,2.511
23,mlp.up_proj,0.0001492243,0.05000,2.540
23,mlp.down_proj,0.0000830157,0.05000,3.201
24,self_attn.qkv_proj,0.0002110393,0.05000,1.125
24,self_attn.o_proj,0.0000124396,0.05000,1.090
24,mlp.up_proj,0.0001615396,0.05000,2.512
24,mlp.gate_proj,0.0001421848,0.05000,2.535
24,mlp.down_proj,0.0000963378,0.05000,3.219
25,self_attn.qkv_proj,0.0002265083,0.05000,1.141
25,self_attn.o_proj,0.0000209731,0.05000,1.112
25,mlp.gate_proj,0.0001558134,0.05000,2.658
25,mlp.up_proj,0.0001774229,0.05000,2.676
25,mlp.down_proj,0.0001089506,0.05000,3.236
26,self_attn.qkv_proj,0.0001990848,0.05000,1.134
26,self_attn.o_proj,0.0000347294,0.05000,1.136
26,mlp.up_proj,0.0001846280,0.05000,2.560
26,mlp.gate_proj,0.0001625094,0.05000,2.582
26,mlp.down_proj,0.0001322558,0.05000,3.308
27,self_attn.qkv_proj,0.0001973591,0.05000,1.118
27,self_attn.o_proj,0.0000244647,0.05000,1.148
27,mlp.gate_proj,0.0001797843,0.05000,2.541
27,mlp.up_proj,0.0002011022,0.05000,2.557
27,mlp.down_proj,0.0001692445,0.05000,3.208
28,self_attn.qkv_proj,0.0002489807,0.05000,1.203
28,self_attn.o_proj,0.0000308398,0.05000,1.119
28,mlp.up_proj,0.0002172940,0.05000,2.558
28,mlp.gate_proj,0.0002009149,0.05000,2.579
28,mlp.down_proj,0.0002246512,0.05000,3.171
29,self_attn.qkv_proj,0.0002247108,0.05000,1.150
29,self_attn.o_proj,0.0000370290,0.05000,1.123
29,mlp.gate_proj,0.0002232223,0.05000,2.595
29,mlp.up_proj,0.0002207740,0.05000,2.619
29,mlp.down_proj,0.0003816118,0.05000,3.237
30,self_attn.qkv_proj,0.0001591859,0.05000,1.131
30,self_attn.o_proj,0.0000362225,0.05000,1.087
30,mlp.gate_proj,0.0002359733,0.05000,2.611
30,mlp.up_proj,0.0002075650,0.05000,2.634
30,mlp.down_proj,0.0014728911,0.05000,3.272
31,self_attn.qkv_proj,0.0000035844,0.05000,1.131
31,self_attn.o_proj,0.0000039555,0.05000,1.124
31,mlp.gate_proj,0.0001033877,0.05000,2.621
31,mlp.up_proj,0.0000604577,0.05000,2.628
31,mlp.down_proj,0.0004907257,0.05000,3.331