File size: 6,025 Bytes
2c8413d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00409379,0.01000,1.000
0,self_attn.v_proj,0.00072114,0.01000,1.006
0,self_attn.q_proj,0.00414090,0.01000,0.980
0,self_attn.out_proj,0.00001473,0.01000,1.009
0,fc1,0.00906052,0.01000,0.986
0,fc2,0.00011689,0.01000,4.245
1,self_attn.k_proj,0.00241560,0.01000,0.998
1,self_attn.v_proj,0.00030304,0.01000,0.979
1,self_attn.q_proj,0.00263582,0.01000,0.991
1,self_attn.out_proj,0.00001348,0.01000,0.990
1,fc1,0.00911925,0.01000,1.001
1,fc2,0.00113884,0.01000,4.272
2,self_attn.k_proj,0.00382860,0.01000,1.008
2,self_attn.v_proj,0.00054063,0.01000,0.996
2,self_attn.q_proj,0.00378607,0.01000,0.999
2,self_attn.out_proj,0.00000811,0.01000,0.978
2,fc1,0.01030087,0.01000,1.010
2,fc2,0.00010722,0.01000,4.167
3,self_attn.k_proj,0.00392859,0.01000,0.990
3,self_attn.v_proj,0.00063046,0.01000,0.989
3,self_attn.q_proj,0.00420090,0.01000,0.973
3,self_attn.out_proj,0.00001649,0.01000,1.002
3,fc1,0.00846032,0.01000,0.985
3,fc2,0.00012199,0.01000,4.221
4,self_attn.k_proj,0.00556619,0.01000,0.996
4,self_attn.v_proj,0.00072275,0.01000,0.987
4,self_attn.q_proj,0.00558837,0.01000,0.993
4,self_attn.out_proj,0.00001731,0.01000,1.013
4,fc1,0.00879328,0.01000,0.989
4,fc2,0.00011329,0.01000,4.202
5,self_attn.k_proj,0.00716568,0.01000,0.991
5,self_attn.v_proj,0.00093275,0.01000,0.987
5,self_attn.q_proj,0.00673818,0.01000,1.002
5,self_attn.out_proj,0.00003818,0.01000,1.005
5,fc1,0.01022671,0.01000,0.978
5,fc2,0.00017304,0.01000,4.199
6,self_attn.k_proj,0.01196123,0.01000,1.025
6,self_attn.v_proj,0.00122724,0.01000,1.007
6,self_attn.q_proj,0.00925438,0.01000,1.007
6,self_attn.out_proj,0.00006164,0.01000,1.004
6,fc1,0.01337742,0.01000,0.994
6,fc2,0.00021436,0.01000,4.231
7,self_attn.k_proj,0.01336243,0.01000,0.995
7,self_attn.v_proj,0.00149999,0.01000,0.978
7,self_attn.q_proj,0.01013738,0.01000,0.991
7,self_attn.out_proj,0.00006549,0.01000,0.991
7,fc1,0.01671198,0.01000,0.994
7,fc2,0.00019174,0.01000,4.216
8,self_attn.k_proj,0.01508483,0.01000,0.983
8,self_attn.v_proj,0.00175653,0.01000,1.034
8,self_attn.q_proj,0.01071484,0.01000,0.995
8,self_attn.out_proj,0.00006830,0.01000,0.985
8,fc1,0.01985171,0.01000,0.993
8,fc2,0.00024323,0.01000,4.181
9,self_attn.k_proj,0.01629625,0.01000,0.994
9,self_attn.v_proj,0.00207414,0.01000,0.989
9,self_attn.q_proj,0.01226537,0.01000,0.987
9,self_attn.out_proj,0.00007884,0.01000,1.017
9,fc1,0.02325909,0.01000,0.996
9,fc2,0.00029927,0.01000,4.260
10,self_attn.k_proj,0.01694436,0.01000,0.984
10,self_attn.v_proj,0.00279443,0.01000,1.003
10,self_attn.q_proj,0.01290223,0.01000,1.009
10,self_attn.out_proj,0.00008043,0.01000,0.984
10,fc1,0.02705885,0.01000,1.041
10,fc2,0.00040550,0.01000,4.158
11,self_attn.k_proj,0.01743016,0.01000,0.992
11,self_attn.v_proj,0.00366602,0.01000,0.991
11,self_attn.q_proj,0.01367142,0.01000,1.000
11,self_attn.out_proj,0.00010108,0.01000,0.988
11,fc1,0.03210959,0.01000,1.008
11,fc2,0.00055330,0.01000,4.275
12,self_attn.k_proj,0.02062906,0.01000,0.982
12,self_attn.v_proj,0.00437126,0.01000,0.979
12,self_attn.q_proj,0.01520991,0.01000,0.995
12,self_attn.out_proj,0.00014373,0.01000,0.980
12,fc1,0.03572238,0.01000,1.010
12,fc2,0.00066190,0.01000,4.168
13,self_attn.k_proj,0.02250100,0.01000,0.984
13,self_attn.v_proj,0.00493668,0.01000,1.048
13,self_attn.q_proj,0.01598719,0.01000,1.047
13,self_attn.out_proj,0.00015132,0.01000,0.999
13,fc1,0.03995991,0.01000,1.019
13,fc2,0.00083408,0.01000,4.255
14,self_attn.k_proj,0.02120009,0.01000,0.979
14,self_attn.v_proj,0.00648613,0.01000,0.987
14,self_attn.q_proj,0.01573154,0.01000,0.990
14,self_attn.out_proj,0.00017486,0.01000,1.005
14,fc1,0.04477219,0.01000,0.981
14,fc2,0.00120158,0.01000,4.182
15,self_attn.k_proj,0.01888706,0.01000,0.996
15,self_attn.v_proj,0.00828507,0.01000,0.989
15,self_attn.q_proj,0.01590251,0.01000,1.019
15,self_attn.out_proj,0.00018840,0.01000,1.015
15,fc1,0.04777357,0.01000,1.004
15,fc2,0.00149223,0.01000,4.271
16,self_attn.k_proj,0.01895629,0.01000,0.994
16,self_attn.v_proj,0.00919615,0.01000,0.988
16,self_attn.q_proj,0.01408941,0.01000,0.987
16,self_attn.out_proj,0.00027497,0.01000,0.993
16,fc1,0.05255585,0.01000,0.994
16,fc2,0.00180443,0.01000,4.196
17,self_attn.k_proj,0.01800555,0.01000,0.990
17,self_attn.v_proj,0.01010960,0.01000,0.976
17,self_attn.q_proj,0.01410830,0.01000,0.985
17,self_attn.out_proj,0.00029745,0.01000,0.998
17,fc1,0.05777301,0.01000,1.011
17,fc2,0.00218752,0.01000,4.182
18,self_attn.k_proj,0.01598491,0.01000,1.027
18,self_attn.v_proj,0.01118781,0.01000,0.995
18,self_attn.q_proj,0.01337853,0.01000,0.999
18,self_attn.out_proj,0.00052338,0.01000,0.985
18,fc1,0.05900865,0.01000,1.069
18,fc2,0.00268790,0.01000,4.194
19,self_attn.k_proj,0.01571657,0.01000,0.997
19,self_attn.v_proj,0.01393012,0.01000,1.016
19,self_attn.q_proj,0.01293182,0.01000,0.997
19,self_attn.out_proj,0.00089465,0.01000,1.000
19,fc1,0.06260797,0.01000,1.066
19,fc2,0.00281360,0.01000,4.196
20,self_attn.k_proj,0.01550068,0.01000,0.983
20,self_attn.v_proj,0.01531409,0.01000,0.990
20,self_attn.q_proj,0.01223863,0.01000,1.027
20,self_attn.out_proj,0.00108642,0.01000,1.043
20,fc1,0.06158617,0.01000,0.997
20,fc2,0.00320006,0.01000,4.245
21,self_attn.k_proj,0.01362426,0.01000,1.005
21,self_attn.v_proj,0.01469827,0.01000,0.990
21,self_attn.q_proj,0.01251260,0.01000,0.993
21,self_attn.out_proj,0.00081556,0.01000,0.997
21,fc1,0.05632990,0.01000,1.020
21,fc2,0.00376281,0.01000,4.198
22,self_attn.k_proj,0.01262085,0.01000,1.009
22,self_attn.v_proj,0.01517828,0.01000,1.001
22,self_attn.q_proj,0.01358408,0.01000,1.001
22,self_attn.out_proj,0.00131237,0.01000,1.007
22,fc1,0.04993823,0.01000,1.032
22,fc2,0.00548277,0.01000,4.281
23,self_attn.k_proj,0.01658067,0.01000,1.060
23,self_attn.v_proj,0.00926656,0.01000,0.979
23,self_attn.q_proj,0.02430908,0.01000,0.970
23,self_attn.out_proj,0.00185453,0.01000,1.000
23,fc1,0.03861813,0.01000,0.996
23,fc2,0.00391702,0.01000,4.238