File size: 8,233 Bytes
e91eb74
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
layer,module,loss,samples,damp,time
0,self_attn.q_proj,0.00143004,0.01000,1.666
0,self_attn.k_proj,0.00152641,0.01000,1.244
0,self_attn.v_proj,0.00055014,0.01000,1.224
0,self_attn.dense,0.00040645,0.01000,1.199
0,mlp.fc1,0.00156395,0.01000,1.471
0,mlp.fc2,45.18684896,0.01250,8.215
1,self_attn.q_proj,0.00098901,0.01000,1.230
1,self_attn.k_proj,0.00098037,0.01000,1.193
1,self_attn.v_proj,0.00025730,0.01000,1.200
1,self_attn.dense,0.00010639,0.01000,1.247
1,mlp.fc1,0.00321254,0.01000,1.491
1,mlp.fc2,47.71025594,0.01250,8.363
2,self_attn.q_proj,0.00124894,0.01000,1.345
2,self_attn.k_proj,0.00125460,0.01000,1.299
2,self_attn.v_proj,0.00052309,0.01000,1.253
2,self_attn.dense,0.00011987,0.01000,1.390
2,mlp.fc1,0.00455974,0.01000,1.709
2,mlp.fc2,51.62885539,0.01250,8.104
3,self_attn.q_proj,0.00130572,0.01000,1.189
3,self_attn.k_proj,0.00125844,0.01000,1.239
3,self_attn.v_proj,0.00100104,0.01000,1.399
3,self_attn.dense,0.00010456,0.01000,1.400
3,mlp.fc1,0.00656331,0.01000,1.650
3,mlp.fc2,52.00990804,0.01250,8.130
4,self_attn.q_proj,0.00165055,0.01000,1.275
4,self_attn.k_proj,0.00151279,0.01000,1.267
4,self_attn.v_proj,0.00109894,0.01000,1.210
4,self_attn.dense,0.00008104,0.01000,1.164
4,mlp.fc1,0.00635077,0.01000,1.470
4,mlp.fc2,45.79121908,0.01250,7.909
5,self_attn.q_proj,0.00146975,0.01000,1.218
5,self_attn.k_proj,0.00134510,0.01000,1.212
5,self_attn.v_proj,0.00096357,0.01000,1.230
5,self_attn.dense,0.00009522,0.01000,1.167
5,mlp.fc1,0.00543682,0.01000,1.510
5,mlp.fc2,39.91021474,0.01250,8.151
6,self_attn.q_proj,0.00179219,0.01000,1.304
6,self_attn.k_proj,0.00164673,0.01000,1.153
6,self_attn.v_proj,0.00118458,0.01000,1.130
6,self_attn.dense,0.00008672,0.01000,1.179
6,mlp.fc1,0.00587255,0.01000,1.484
6,mlp.fc2,44.64824422,0.01250,8.148
7,self_attn.q_proj,0.00186776,0.01000,1.171
7,self_attn.k_proj,0.00177774,0.01000,1.137
7,self_attn.v_proj,0.00120310,0.01000,1.267
7,self_attn.dense,0.00006188,0.01000,1.291
7,mlp.fc1,0.00593133,0.01000,1.634
7,mlp.fc2,39.13363139,0.01250,8.085
8,self_attn.q_proj,0.00189651,0.01000,1.240
8,self_attn.k_proj,0.00176293,0.01000,1.228
8,self_attn.v_proj,0.00140262,0.01000,1.245
8,self_attn.dense,0.00006599,0.01000,1.192
8,mlp.fc1,0.00588503,0.01000,1.698
8,mlp.fc2,40.45288086,0.01250,8.500
9,self_attn.q_proj,0.00191524,0.01000,1.303
9,self_attn.k_proj,0.00177061,0.01000,1.146
9,self_attn.v_proj,0.00140069,0.01000,1.155
9,self_attn.dense,0.00008725,0.01000,1.173
9,mlp.fc1,0.00577327,0.01000,1.504
9,mlp.fc2,41.11215210,0.01250,8.315
10,self_attn.q_proj,0.00192486,0.01000,1.232
10,self_attn.k_proj,0.00184659,0.01000,1.287
10,self_attn.v_proj,0.00122425,0.01000,1.217
10,self_attn.dense,0.00008808,0.01000,1.212
10,mlp.fc1,0.00560408,0.01000,1.617
10,mlp.fc2,38.80376689,0.01250,8.274
11,self_attn.q_proj,0.00201942,0.01000,1.267
11,self_attn.k_proj,0.00193283,0.01000,1.240
11,self_attn.v_proj,0.00134693,0.01000,1.196
11,self_attn.dense,0.00010903,0.01000,1.279
11,mlp.fc1,0.00545754,0.01000,1.536
11,mlp.fc2,38.56307475,0.01250,7.950
12,self_attn.q_proj,0.00209887,0.01000,1.200
12,self_attn.k_proj,0.00200503,0.01000,1.235
12,self_attn.v_proj,0.00137541,0.01000,1.226
12,self_attn.dense,0.00008138,0.01000,1.221
12,mlp.fc1,0.00540713,0.01000,1.525
12,mlp.fc2,40.88318888,0.01250,8.217
13,self_attn.q_proj,0.00200631,0.01000,1.251
13,self_attn.k_proj,0.00194197,0.01000,1.219
13,self_attn.v_proj,0.00134296,0.01000,1.149
13,self_attn.dense,0.00007691,0.01000,1.237
13,mlp.fc1,0.00549893,0.01000,1.499
13,mlp.fc2,41.56899770,0.01250,8.045
14,self_attn.q_proj,0.00210726,0.01000,1.282
14,self_attn.k_proj,0.00314308,0.01000,1.203
14,self_attn.v_proj,0.00133068,0.01000,1.242
14,self_attn.dense,0.00009206,0.01000,1.209
14,mlp.fc1,0.00539970,0.01000,1.479
14,mlp.fc2,41.86838531,0.01250,8.351
15,self_attn.q_proj,0.00199632,0.01000,1.302
15,self_attn.k_proj,0.00192289,0.01000,1.252
15,self_attn.v_proj,0.00126881,0.01000,1.190
15,self_attn.dense,0.00010529,0.01000,1.233
15,mlp.fc1,0.00512260,0.01000,1.654
15,mlp.fc2,40.16023763,0.01250,8.171
16,self_attn.q_proj,0.00206465,0.01000,1.269
16,self_attn.k_proj,0.00198583,0.01000,1.272
16,self_attn.v_proj,0.00134773,0.01000,1.218
16,self_attn.dense,0.00011100,0.01000,1.248
16,mlp.fc1,0.00523687,0.01000,1.613
16,mlp.fc2,44.88688151,0.01250,8.167
17,self_attn.q_proj,0.00197861,0.01000,1.327
17,self_attn.k_proj,0.00189119,0.01000,1.293
17,self_attn.v_proj,0.00124682,0.01000,1.285
17,self_attn.dense,0.00008207,0.01000,1.278
17,mlp.fc1,0.00489658,0.01000,1.480
17,mlp.fc2,41.40846761,0.01250,8.204
18,self_attn.q_proj,0.00228992,0.01000,1.315
18,self_attn.k_proj,0.00217069,0.01000,1.268
18,self_attn.v_proj,0.00131716,0.01000,1.255
18,self_attn.dense,0.00008202,0.01000,1.252
18,mlp.fc1,0.00499909,0.01000,1.578
18,mlp.fc2,41.80710856,0.01250,8.319
19,self_attn.q_proj,0.00216272,0.01000,1.389
19,self_attn.k_proj,0.00209569,0.01000,1.459
19,self_attn.v_proj,0.00134877,0.01000,1.276
19,self_attn.dense,0.00010894,0.01000,1.240
19,mlp.fc1,0.00535385,0.01000,1.577
19,mlp.fc2,50.55662028,0.01250,8.463
20,self_attn.q_proj,0.00229107,0.01000,1.262
20,self_attn.k_proj,0.03851147,0.01000,1.216
20,self_attn.v_proj,0.00130100,0.01000,1.126
20,self_attn.dense,0.00012769,0.01000,1.188
20,mlp.fc1,0.00545297,0.01000,1.534
20,mlp.fc2,49.51214600,0.01250,8.264
21,self_attn.q_proj,0.00218866,0.01000,1.271
21,self_attn.k_proj,0.00204123,0.01000,1.301
21,self_attn.v_proj,0.00156515,0.01000,1.246
21,self_attn.dense,0.00012658,0.01000,1.226
21,mlp.fc1,0.00584921,0.01000,1.567
21,mlp.fc2,52.78467306,0.01250,8.395
22,self_attn.q_proj,0.00225957,0.01000,1.327
22,self_attn.k_proj,0.00357083,0.01000,1.294
22,self_attn.v_proj,0.00164564,0.01000,1.182
22,self_attn.dense,0.00010589,0.01000,1.298
22,mlp.fc1,0.00612155,0.01000,1.662
22,mlp.fc2,52.80789185,0.01250,8.462
23,self_attn.q_proj,0.00243160,0.01000,1.332
23,self_attn.k_proj,0.00276039,0.01000,1.332
23,self_attn.v_proj,0.00159178,0.01000,1.117
23,self_attn.dense,0.00016935,0.01000,1.254
23,mlp.fc1,0.00641046,0.01000,1.594
23,mlp.fc2,52.62599691,0.01250,8.410
24,self_attn.q_proj,0.00232852,0.01000,1.257
24,self_attn.k_proj,0.00215273,0.01000,1.328
24,self_attn.v_proj,0.00190273,0.01000,1.293
24,self_attn.dense,0.00019747,0.01000,1.250
24,mlp.fc1,0.00686966,0.01000,1.517
24,mlp.fc2,55.26352437,0.01250,8.156
25,self_attn.q_proj,0.00253579,0.01000,1.216
25,self_attn.k_proj,0.01635120,0.01000,1.195
25,self_attn.v_proj,0.00198928,0.01000,1.303
25,self_attn.dense,0.00024381,0.01000,1.295
25,mlp.fc1,0.00749265,0.01000,1.487
25,mlp.fc2,52.59010824,0.01250,8.389
26,self_attn.q_proj,0.00319071,0.01000,1.357
26,self_attn.k_proj,0.00231659,0.01000,1.326
26,self_attn.v_proj,0.00232149,0.01000,1.287
26,self_attn.dense,0.00024788,0.01000,1.330
26,mlp.fc1,0.00773018,0.01000,1.644
26,mlp.fc2,50.22942098,0.01250,8.381
27,self_attn.q_proj,0.00275840,0.01000,1.284
27,self_attn.k_proj,0.00304915,0.01000,1.255
27,self_attn.v_proj,0.00238565,0.01000,1.236
27,self_attn.dense,0.00028637,0.01000,1.232
27,mlp.fc1,0.00808649,0.01000,1.501
27,mlp.fc2,48.66911825,0.01250,8.210
28,self_attn.q_proj,0.00248579,0.01000,1.194
28,self_attn.k_proj,0.00226670,0.01000,1.181
28,self_attn.v_proj,0.00246282,0.01000,1.183
28,self_attn.dense,0.00041967,0.01000,1.281
28,mlp.fc1,0.00824952,0.01000,1.527
28,mlp.fc2,43.05557760,0.01250,8.224
29,self_attn.q_proj,0.11153113,0.01000,1.266
29,self_attn.k_proj,0.64342054,0.01000,1.226
29,self_attn.v_proj,0.00479308,0.01000,1.228
29,self_attn.dense,0.00025549,0.01000,1.224
29,mlp.fc1,0.03276892,0.01000,1.495
29,mlp.fc2,36.04873657,0.01250,8.129
30,self_attn.q_proj,0.06741060,0.01000,1.441
30,self_attn.k_proj,0.70108302,0.01000,1.260
30,self_attn.v_proj,0.00279436,0.01000,1.327
30,self_attn.dense,0.00033670,0.01000,1.297
30,mlp.fc1,0.02931402,0.01000,1.595
30,mlp.fc2,32.39466349,0.01250,8.556
31,self_attn.q_proj,0.03431750,0.01000,1.214
31,self_attn.k_proj,5.91425705,0.01000,1.192
31,self_attn.v_proj,0.00139703,0.01000,1.202
31,self_attn.dense,0.00031197,0.01000,1.166
31,mlp.fc1,0.01573335,0.01000,1.476
31,mlp.fc2,58.13183085,0.01250,8.144