File size: 6,025 Bytes
5a2de59
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
layer,module,loss,damp,time
0,self_attn.k_proj,0.00409379,0.01000,0.993
0,self_attn.v_proj,0.00072114,0.01000,1.013
0,self_attn.q_proj,0.00414090,0.01000,1.025
0,self_attn.out_proj,0.00001093,0.01000,0.995
0,fc1,0.01083721,0.01000,0.997
0,fc2,0.00014591,0.01000,4.290
1,self_attn.k_proj,0.00460731,0.01000,0.993
1,self_attn.v_proj,0.00057901,0.01000,0.989
1,self_attn.q_proj,0.00501648,0.01000,1.004
1,self_attn.out_proj,0.00000384,0.01000,0.980
1,fc1,0.01723385,0.01000,1.018
1,fc2,0.00027718,0.01000,4.274
2,self_attn.k_proj,0.00625587,0.01000,1.028
2,self_attn.v_proj,0.00100671,0.01000,0.992
2,self_attn.q_proj,0.00620751,0.01000,1.017
2,self_attn.out_proj,0.00001057,0.01000,0.986
2,fc1,0.01686204,0.01000,1.000
2,fc2,0.00013050,0.01000,4.262
3,self_attn.k_proj,0.00688523,0.01000,0.981
3,self_attn.v_proj,0.00138955,0.01000,0.989
3,self_attn.q_proj,0.00759731,0.01000,0.988
3,self_attn.out_proj,0.00001236,0.01000,0.998
3,fc1,0.01656991,0.01000,1.003
3,fc2,0.00012674,0.01000,4.207
4,self_attn.k_proj,0.01033037,0.01000,1.005
4,self_attn.v_proj,0.00170416,0.01000,0.988
4,self_attn.q_proj,0.01105807,0.01000,0.985
4,self_attn.out_proj,0.00002068,0.01000,0.996
4,fc1,0.01853193,0.01000,1.005
4,fc2,0.00013410,0.01000,4.235
5,self_attn.k_proj,0.01293353,0.01000,1.007
5,self_attn.v_proj,0.00222387,0.01000,0.989
5,self_attn.q_proj,0.01334210,0.01000,1.003
5,self_attn.out_proj,0.00002222,0.01000,1.007
5,fc1,0.02076346,0.01000,0.994
5,fc2,0.00014411,0.01000,4.170
6,self_attn.k_proj,0.01992640,0.01000,1.042
6,self_attn.v_proj,0.00283416,0.01000,1.005
6,self_attn.q_proj,0.01790950,0.01000,1.015
6,self_attn.out_proj,0.00004584,0.01000,0.994
6,fc1,0.02586313,0.01000,0.987
6,fc2,0.00019328,0.01000,4.243
7,self_attn.k_proj,0.02163527,0.01000,0.981
7,self_attn.v_proj,0.00339857,0.01000,0.978
7,self_attn.q_proj,0.01917062,0.01000,0.995
7,self_attn.out_proj,0.00005514,0.01000,0.994
7,fc1,0.03230386,0.01000,1.036
7,fc2,0.00027319,0.01000,4.248
8,self_attn.k_proj,0.02458253,0.01000,0.986
8,self_attn.v_proj,0.00393817,0.01000,0.977
8,self_attn.q_proj,0.02009545,0.01000,0.996
8,self_attn.out_proj,0.00007193,0.01000,0.990
8,fc1,0.03901298,0.01000,1.007
8,fc2,0.00036630,0.01000,4.221
9,self_attn.k_proj,0.02626408,0.01000,1.021
9,self_attn.v_proj,0.00449418,0.01000,0.980
9,self_attn.q_proj,0.02207199,0.01000,0.988
9,self_attn.out_proj,0.00009974,0.01000,0.992
9,fc1,0.04441365,0.01000,1.009
9,fc2,0.00049525,0.01000,4.350
10,self_attn.k_proj,0.02680579,0.01000,0.992
10,self_attn.v_proj,0.00567766,0.01000,0.980
10,self_attn.q_proj,0.02212340,0.01000,0.996
10,self_attn.out_proj,0.00013059,0.01000,0.977
10,fc1,0.05002769,0.01000,1.000
10,fc2,0.00073721,0.01000,4.189
11,self_attn.k_proj,0.02718079,0.01000,1.009
11,self_attn.v_proj,0.00700397,0.01000,0.978
11,self_attn.q_proj,0.02239926,0.01000,1.007
11,self_attn.out_proj,0.00017297,0.01000,1.003
11,fc1,0.05576458,0.01000,1.005
11,fc2,0.00095275,0.01000,4.233
12,self_attn.k_proj,0.03069451,0.01000,0.995
12,self_attn.v_proj,0.00774106,0.01000,0.989
12,self_attn.q_proj,0.02362737,0.01000,0.977
12,self_attn.out_proj,0.00025744,0.01000,0.994
12,fc1,0.05810564,0.01000,1.012
12,fc2,0.00123986,0.01000,4.256
13,self_attn.k_proj,0.03295046,0.01000,0.995
13,self_attn.v_proj,0.00860731,0.01000,0.977
13,self_attn.q_proj,0.02428213,0.01000,0.986
13,self_attn.out_proj,0.00027379,0.01000,1.068
13,fc1,0.06419239,0.01000,1.021
13,fc2,0.00162063,0.01000,4.230
14,self_attn.k_proj,0.03117430,0.01000,1.009
14,self_attn.v_proj,0.01099943,0.01000,0.983
14,self_attn.q_proj,0.02365817,0.01000,0.991
14,self_attn.out_proj,0.00030741,0.01000,0.996
14,fc1,0.07080662,0.01000,1.012
14,fc2,0.00221463,0.01000,4.206
15,self_attn.k_proj,0.02812890,0.01000,1.004
15,self_attn.v_proj,0.01401449,0.01000,0.977
15,self_attn.q_proj,0.02391200,0.01000,1.010
15,self_attn.out_proj,0.00029116,0.01000,0.986
15,fc1,0.07525838,0.01000,1.011
15,fc2,0.00280922,0.01000,4.259
16,self_attn.k_proj,0.02830217,0.01000,0.986
16,self_attn.v_proj,0.01540015,0.01000,0.994
16,self_attn.q_proj,0.02135721,0.01000,0.997
16,self_attn.out_proj,0.00044422,0.01000,0.996
16,fc1,0.08256883,0.01000,1.011
16,fc2,0.00352829,0.01000,4.263
17,self_attn.k_proj,0.02758769,0.01000,1.023
17,self_attn.v_proj,0.01700824,0.01000,0.972
17,self_attn.q_proj,0.02158560,0.01000,0.995
17,self_attn.out_proj,0.00051447,0.01000,0.989
17,fc1,0.09083328,0.01000,0.998
17,fc2,0.00448523,0.01000,4.202
18,self_attn.k_proj,0.02513609,0.01000,0.985
18,self_attn.v_proj,0.01950069,0.01000,0.998
18,self_attn.q_proj,0.02091608,0.01000,0.986
18,self_attn.out_proj,0.00059864,0.01000,1.026
18,fc1,0.09597015,0.01000,0.994
18,fc2,0.00544927,0.01000,4.187
19,self_attn.k_proj,0.02561334,0.01000,1.077
19,self_attn.v_proj,0.02522137,0.01000,1.002
19,self_attn.q_proj,0.02101323,0.01000,1.015
19,self_attn.out_proj,0.00087916,0.01000,0.984
19,fc1,0.10437368,0.01000,0.997
19,fc2,0.00673680,0.01000,4.163
20,self_attn.k_proj,0.02653702,0.01000,0.983
20,self_attn.v_proj,0.02878364,0.01000,0.993
20,self_attn.q_proj,0.02050654,0.01000,0.975
20,self_attn.out_proj,0.00057599,0.01000,0.986
20,fc1,0.10855858,0.01000,0.998
20,fc2,0.00745274,0.01000,4.255
21,self_attn.k_proj,0.02398171,0.01000,1.003
21,self_attn.v_proj,0.02851950,0.01000,0.985
21,self_attn.q_proj,0.02189942,0.01000,0.983
21,self_attn.out_proj,0.00025027,0.01000,0.998
21,fc1,0.10575759,0.01000,0.985
21,fc2,0.00817760,0.01000,4.237
22,self_attn.k_proj,0.02366718,0.01000,0.994
22,self_attn.v_proj,0.03047793,0.01000,0.985
22,self_attn.q_proj,0.02532681,0.01000,0.996
22,self_attn.out_proj,0.00129898,0.01000,1.022
22,fc1,0.10098480,0.01000,1.009
22,fc2,0.00862298,0.01000,4.217
23,self_attn.k_proj,0.02841244,0.01000,1.030
23,self_attn.v_proj,0.02046534,0.01000,1.014
23,self_attn.q_proj,0.05300370,0.01000,1.000
23,self_attn.out_proj,0.00440506,0.01000,0.987
23,fc1,0.09355172,0.01000,1.001
23,fc2,0.00552451,0.01000,4.275