File size: 6,025 Bytes
4341452
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00409379,0.01000,1.022
0,self_attn.v_proj,0.00072114,0.01000,1.006
0,self_attn.q_proj,0.00414090,0.01000,0.969
0,self_attn.out_proj,0.00000870,0.01000,0.986
0,fc1,0.00970921,0.01000,1.046
0,fc2,0.00010505,0.01000,4.252
1,self_attn.k_proj,0.00327041,0.01000,1.012
1,self_attn.v_proj,0.00041319,0.01000,1.001
1,self_attn.q_proj,0.00355976,0.01000,0.986
1,self_attn.out_proj,0.00000244,0.01000,1.018
1,fc1,0.01151395,0.01000,1.005
1,fc2,0.00014460,0.01000,4.327
2,self_attn.k_proj,0.00454492,0.01000,0.993
2,self_attn.v_proj,0.00071424,0.01000,0.980
2,self_attn.q_proj,0.00453008,0.01000,0.991
2,self_attn.out_proj,0.00000383,0.01000,1.002
2,fc1,0.01163073,0.01000,0.999
2,fc2,0.00006701,0.01000,4.270
3,self_attn.k_proj,0.00453221,0.01000,0.995
3,self_attn.v_proj,0.00088928,0.01000,1.014
3,self_attn.q_proj,0.00502093,0.01000,1.022
3,self_attn.out_proj,0.00000183,0.01000,1.003
3,fc1,0.01080185,0.01000,1.026
3,fc2,0.00006996,0.01000,4.321
4,self_attn.k_proj,0.00675831,0.01000,1.039
4,self_attn.v_proj,0.00108673,0.01000,0.992
4,self_attn.q_proj,0.00723823,0.01000,1.073
4,self_attn.out_proj,0.00000383,0.01000,1.058
4,fc1,0.01171546,0.01000,0.999
4,fc2,0.00007058,0.01000,4.253
5,self_attn.k_proj,0.00815600,0.01000,0.989
5,self_attn.v_proj,0.00138022,0.01000,1.066
5,self_attn.q_proj,0.00834911,0.01000,0.994
5,self_attn.out_proj,0.00000388,0.01000,1.050
5,fc1,0.01271201,0.01000,1.005
5,fc2,0.00009196,0.01000,4.272
6,self_attn.k_proj,0.01265277,0.01000,0.989
6,self_attn.v_proj,0.00174527,0.01000,0.975
6,self_attn.q_proj,0.01124555,0.01000,1.008
6,self_attn.out_proj,0.00000933,0.01000,1.001
6,fc1,0.01568377,0.01000,1.001
6,fc2,0.00009791,0.01000,4.231
7,self_attn.k_proj,0.01346123,0.01000,0.994
7,self_attn.v_proj,0.00204103,0.01000,0.989
7,self_attn.q_proj,0.01190130,0.01000,0.990
7,self_attn.out_proj,0.00001416,0.01000,1.009
7,fc1,0.01938798,0.01000,1.004
7,fc2,0.00014014,0.01000,4.244
8,self_attn.k_proj,0.01525222,0.01000,1.020
8,self_attn.v_proj,0.00235129,0.01000,0.988
8,self_attn.q_proj,0.01232455,0.01000,0.991
8,self_attn.out_proj,0.00001867,0.01000,1.001
8,fc1,0.02317689,0.01000,1.018
8,fc2,0.00017385,0.01000,4.215
9,self_attn.k_proj,0.01641444,0.01000,0.995
9,self_attn.v_proj,0.00270767,0.01000,1.023
9,self_attn.q_proj,0.01364542,0.01000,1.007
9,self_attn.out_proj,0.00002797,0.01000,0.987
9,fc1,0.02664278,0.01000,0.999
9,fc2,2.56742547,0.01250,4.445
10,self_attn.k_proj,0.01577057,0.01000,0.994
10,self_attn.v_proj,0.00330441,0.01000,0.999
10,self_attn.q_proj,0.01304028,0.01000,0.992
10,self_attn.out_proj,0.00005218,0.01000,0.996
10,fc1,0.02900651,0.01000,0.998
10,fc2,0.00040414,0.01000,4.289
11,self_attn.k_proj,0.01669788,0.01000,1.005
11,self_attn.v_proj,0.00428681,0.01000,0.985
11,self_attn.q_proj,0.01389177,0.01000,0.979
11,self_attn.out_proj,0.00003902,0.01000,0.997
11,fc1,0.03293292,0.01000,0.999
11,fc2,0.00036001,0.01000,4.255
12,self_attn.k_proj,0.01809878,0.01000,0.997
12,self_attn.v_proj,0.00461741,0.01000,0.969
12,self_attn.q_proj,0.01426543,0.01000,0.993
12,self_attn.out_proj,0.00008923,0.01000,1.003
12,fc1,0.03490859,0.01000,0.999
12,fc2,0.00053366,0.01000,4.238
13,self_attn.k_proj,0.02024559,0.01000,1.000
13,self_attn.v_proj,0.00529331,0.01000,1.002
13,self_attn.q_proj,0.01510829,0.01000,0.994
13,self_attn.out_proj,0.00011232,0.01000,1.021
13,fc1,0.04002735,0.01000,1.002
13,fc2,0.00079521,0.01000,4.285
14,self_attn.k_proj,0.02019605,0.01000,0.993
14,self_attn.v_proj,0.00715139,0.01000,0.986
14,self_attn.q_proj,0.01556215,0.01000,0.982
14,self_attn.out_proj,0.00013239,0.01000,0.988
14,fc1,0.04567505,0.01000,1.026
14,fc2,0.00109855,0.01000,4.247
15,self_attn.k_proj,0.01876904,0.01000,1.011
15,self_attn.v_proj,0.00927897,0.01000,1.025
15,self_attn.q_proj,0.01618721,0.01000,1.082
15,self_attn.out_proj,0.00013910,0.01000,1.037
15,fc1,0.04992504,0.01000,0.998
15,fc2,0.00144680,0.01000,4.283
16,self_attn.k_proj,0.01909367,0.01000,0.997
16,self_attn.v_proj,0.01037889,0.01000,0.986
16,self_attn.q_proj,0.01454423,0.01000,0.998
16,self_attn.out_proj,0.00020494,0.01000,0.990
16,fc1,0.05550109,0.01000,0.997
16,fc2,0.00181646,0.01000,4.268
17,self_attn.k_proj,0.01868965,0.01000,1.021
17,self_attn.v_proj,0.01156883,0.01000,0.980
17,self_attn.q_proj,0.01493619,0.01000,0.997
17,self_attn.out_proj,0.00022462,0.01000,0.999
17,fc1,0.06165383,0.01000,1.022
17,fc2,0.00235090,0.01000,4.320
18,self_attn.k_proj,0.01697141,0.01000,0.998
18,self_attn.v_proj,0.01306967,0.01000,0.993
18,self_attn.q_proj,0.01436241,0.01000,1.007
18,self_attn.out_proj,0.00025583,0.01000,0.994
18,fc1,0.06307104,0.01000,1.001
18,fc2,0.00259235,0.01000,4.204
19,self_attn.k_proj,0.01683915,0.01000,1.004
19,self_attn.v_proj,0.01634647,0.01000,0.989
19,self_attn.q_proj,0.01405389,0.01000,0.988
19,self_attn.out_proj,0.00030797,0.01000,1.010
19,fc1,0.06668582,0.01000,1.014
19,fc2,0.00294858,0.01000,4.217
20,self_attn.k_proj,0.01660586,0.01000,0.997
20,self_attn.v_proj,0.01790955,0.01000,1.003
20,self_attn.q_proj,0.01307197,0.01000,0.983
20,self_attn.out_proj,0.00048068,0.01000,0.998
20,fc1,0.06591332,0.01000,1.005
20,fc2,0.00350037,0.01000,4.249
21,self_attn.k_proj,0.01451043,0.01000,0.992
21,self_attn.v_proj,0.01692051,0.01000,0.982
21,self_attn.q_proj,0.01337012,0.01000,1.004
21,self_attn.out_proj,0.00033322,0.01000,1.010
21,fc1,0.06099212,0.01000,1.001
21,fc2,0.00390600,0.01000,4.357
22,self_attn.k_proj,0.01366263,0.01000,0.984
22,self_attn.v_proj,0.01748320,0.01000,0.997
22,self_attn.q_proj,0.01474320,0.01000,0.996
22,self_attn.out_proj,0.00038908,0.01000,1.004
22,fc1,0.05703627,0.01000,1.007
22,fc2,0.00426069,0.01000,4.242
23,self_attn.k_proj,0.01776943,0.01000,0.998
23,self_attn.v_proj,0.01178338,0.01000,1.004
23,self_attn.q_proj,0.03046774,0.01000,1.023
23,self_attn.out_proj,0.00090270,0.01000,1.002
23,fc1,0.05197454,0.01000,1.012
23,fc2,0.00358283,0.01000,4.266