File size: 7,490 Bytes
fb8ba82
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
layer,module,loss,damp,time
0,self_attn.k_proj,0.77682245,0.01000,1.285
0,self_attn.v_proj,0.03500944,0.01000,0.555
0,self_attn.q_proj,0.99208140,0.01000,0.586
0,self_attn.o_proj,0.02151467,0.01000,0.622
0,mlp.up_proj,0.48560226,0.01000,0.688
0,mlp.gate_proj,0.51454079,0.01000,0.684
0,mlp.down_proj,0.50206679,0.01000,2.690
1,self_attn.k_proj,1.51786375,0.01000,0.619
1,self_attn.v_proj,0.34056193,0.01000,0.603
1,self_attn.q_proj,1.77233434,0.01000,0.599
1,self_attn.o_proj,0.13850473,0.01000,0.699
1,mlp.up_proj,1.10941112,0.01000,0.641
1,mlp.gate_proj,1.28043342,0.01000,0.611
1,mlp.down_proj,14.51999855,0.01000,2.696
2,self_attn.k_proj,2.82318068,0.01000,0.617
2,self_attn.v_proj,1.09324777,0.01000,0.582
2,self_attn.q_proj,3.20169973,0.01000,0.566
2,self_attn.o_proj,0.28864872,0.01000,0.662
2,mlp.up_proj,1.84167004,0.01000,0.590
2,mlp.gate_proj,2.07128930,0.01000,0.559
2,mlp.down_proj,1.27372789,0.01000,2.587
3,self_attn.k_proj,3.76621532,0.01000,0.643
3,self_attn.v_proj,1.56358862,0.01000,0.610
3,self_attn.q_proj,3.76481605,0.01000,0.616
3,self_attn.o_proj,0.44352189,0.01000,0.647
3,mlp.up_proj,2.52457261,0.01000,0.603
3,mlp.gate_proj,2.64974737,0.01000,0.623
3,mlp.down_proj,2.54826880,0.01000,2.554
4,self_attn.k_proj,4.20260096,0.01000,0.540
4,self_attn.v_proj,1.82544005,0.01000,0.488
4,self_attn.q_proj,4.33011675,0.01000,0.489
4,self_attn.o_proj,0.81763673,0.01000,0.535
4,mlp.up_proj,3.34401894,0.01000,0.512
4,mlp.gate_proj,3.44722080,0.01000,0.494
4,mlp.down_proj,3.73280597,0.01000,2.436
5,self_attn.k_proj,4.16551399,0.01000,0.610
5,self_attn.v_proj,1.92370594,0.01000,0.588
5,self_attn.q_proj,4.34254456,0.01000,0.635
5,self_attn.o_proj,0.96646106,0.01000,0.586
5,mlp.up_proj,4.14636469,0.01000,0.603
5,mlp.gate_proj,4.12169456,0.01000,0.585
5,mlp.down_proj,4.96067905,0.01000,2.481
6,self_attn.k_proj,4.64315891,0.01000,0.489
6,self_attn.v_proj,2.31881714,0.01000,0.467
6,self_attn.q_proj,4.96351624,0.01000,0.477
6,self_attn.o_proj,1.36653817,0.01000,0.526
6,mlp.up_proj,4.88970184,0.01000,0.503
6,mlp.gate_proj,4.76923084,0.01000,0.486
6,mlp.down_proj,6.02524185,0.01000,2.185
7,self_attn.k_proj,4.66848373,0.01000,0.489
7,self_attn.v_proj,2.31519604,0.01000,0.464
7,self_attn.q_proj,5.79233074,0.01000,0.480
7,self_attn.o_proj,2.15676284,0.01000,0.488
7,mlp.up_proj,6.20312214,0.01000,0.497
7,mlp.gate_proj,5.80423927,0.01000,0.483
7,mlp.down_proj,39.07165527,0.01000,2.213
8,self_attn.k_proj,4.63509369,0.01000,0.484
8,self_attn.v_proj,3.28440690,0.01000,0.523
8,self_attn.q_proj,4.71225929,0.01000,0.500
8,self_attn.o_proj,3.75382185,0.01000,0.488
8,mlp.up_proj,7.29536915,0.01000,0.504
8,mlp.gate_proj,6.96828270,0.01000,0.483
8,mlp.down_proj,11.49938583,0.01000,2.198
9,self_attn.k_proj,4.39791918,0.01000,0.498
9,self_attn.v_proj,2.88585830,0.01000,0.475
9,self_attn.q_proj,4.44140625,0.01000,0.489
9,self_attn.o_proj,4.38107252,0.01000,0.494
9,mlp.up_proj,7.57919312,0.01000,0.538
9,mlp.gate_proj,6.68407631,0.01000,0.484
9,mlp.down_proj,12.43455696,0.01000,2.212
10,self_attn.k_proj,4.90410137,0.01000,0.495
10,self_attn.v_proj,3.14827299,0.01000,0.476
10,self_attn.q_proj,5.09773064,0.01000,0.483
10,self_attn.o_proj,5.91220951,0.01000,0.493
10,mlp.up_proj,7.54940319,0.01000,0.522
10,mlp.gate_proj,6.77607632,0.01000,0.526
10,mlp.down_proj,14.59228039,0.01000,2.282
11,self_attn.k_proj,4.83724689,0.01000,0.495
11,self_attn.v_proj,3.04819179,0.01000,0.472
11,self_attn.q_proj,5.13493776,0.01000,0.481
11,self_attn.o_proj,6.75608921,0.01000,0.494
11,mlp.up_proj,7.71922398,0.01000,0.582
11,mlp.gate_proj,6.97108126,0.01000,0.491
11,mlp.down_proj,15.99707985,0.01000,2.207
12,self_attn.k_proj,5.48999071,0.01000,0.492
12,self_attn.v_proj,4.52012539,0.01000,0.469
12,self_attn.q_proj,5.99069595,0.01000,0.477
12,self_attn.o_proj,9.85486317,0.01000,0.488
12,mlp.up_proj,8.40734291,0.01000,0.503
12,mlp.gate_proj,7.56645966,0.01000,0.485
12,mlp.down_proj,21.01655579,0.01000,2.215
13,self_attn.k_proj,5.33678246,0.01000,0.491
13,self_attn.v_proj,3.92936134,0.01000,0.472
13,self_attn.q_proj,5.71902800,0.01000,0.480
13,self_attn.o_proj,8.64190197,0.01000,0.539
13,mlp.up_proj,8.67692661,0.01000,0.501
13,mlp.gate_proj,7.80695248,0.01000,0.502
13,mlp.down_proj,24.07814026,0.01000,2.222
14,self_attn.k_proj,5.57279205,0.01000,0.483
14,self_attn.v_proj,4.35658169,0.01000,0.476
14,self_attn.q_proj,5.51688099,0.01000,0.486
14,self_attn.o_proj,10.84986401,0.01000,0.490
14,mlp.up_proj,9.46220016,0.01000,0.509
14,mlp.gate_proj,8.29815006,0.01000,0.486
14,mlp.down_proj,33.66066742,0.01000,2.208
15,self_attn.k_proj,5.96792984,0.01000,0.489
15,self_attn.v_proj,6.85978556,0.01000,0.534
15,self_attn.q_proj,6.19756794,0.01000,0.491
15,self_attn.o_proj,15.63127327,0.01000,0.486
15,mlp.up_proj,10.45367622,0.01000,0.501
15,mlp.gate_proj,8.97001839,0.01000,0.478
15,mlp.down_proj,44.43462753,0.01000,2.187
16,self_attn.k_proj,6.45448399,0.01000,0.488
16,self_attn.v_proj,6.49105835,0.01000,0.468
16,self_attn.q_proj,6.57531500,0.01000,0.476
16,self_attn.o_proj,17.50428772,0.01000,0.486
16,mlp.up_proj,13.01940155,0.01000,0.512
16,mlp.gate_proj,10.95333672,0.01000,0.483
16,mlp.down_proj,66.79670715,0.01000,2.182
17,self_attn.k_proj,6.14941597,0.01000,0.485
17,self_attn.v_proj,8.96719837,0.01000,0.521
17,self_attn.q_proj,6.27163982,0.01000,0.532
17,self_attn.o_proj,30.05414200,0.01000,0.483
17,mlp.up_proj,15.46764755,0.01000,0.499
17,mlp.gate_proj,13.17247581,0.01000,0.478
17,mlp.down_proj,95.98254395,0.01000,2.191
18,self_attn.k_proj,5.98577356,0.01000,0.488
18,self_attn.v_proj,10.22346210,0.01000,0.468
18,self_attn.q_proj,6.29689360,0.01000,0.474
18,self_attn.o_proj,32.41912842,0.01000,0.481
18,mlp.up_proj,19.32838058,0.01000,0.565
18,mlp.gate_proj,15.88508987,0.01000,0.480
18,mlp.down_proj,148.66180420,0.01000,2.194
19,self_attn.k_proj,6.26510525,0.01000,0.487
19,self_attn.v_proj,13.85520744,0.01000,0.474
19,self_attn.q_proj,6.57017851,0.01000,0.473
19,self_attn.o_proj,35.20966721,0.01000,0.480
19,mlp.up_proj,22.48669624,0.01000,0.497
19,mlp.gate_proj,17.89473343,0.01000,0.481
19,mlp.down_proj,204.57714844,0.01000,2.171
20,self_attn.k_proj,6.23155594,0.01000,0.495
20,self_attn.v_proj,16.45906067,0.01000,0.476
20,self_attn.q_proj,6.64905834,0.01000,0.482
20,self_attn.o_proj,37.22135925,0.01000,0.502
20,mlp.up_proj,24.94277191,0.01000,0.501
20,mlp.gate_proj,19.56863976,0.01000,0.479
20,mlp.down_proj,253.60627747,0.01000,2.163
21,self_attn.k_proj,7.11655140,0.01000,0.485
21,self_attn.v_proj,21.37878990,0.01000,0.468
21,self_attn.q_proj,7.32550526,0.01000,0.471
21,self_attn.o_proj,64.90080261,0.01000,0.486
21,mlp.up_proj,28.40076065,0.01000,0.499
21,mlp.gate_proj,21.86407471,0.01000,0.476
21,mlp.down_proj,320.12417603,0.01000,2.247
22,self_attn.k_proj,7.32285166,0.01000,0.497
22,self_attn.v_proj,22.15027618,0.01000,0.473
22,self_attn.q_proj,8.15643311,0.01000,0.481
22,self_attn.o_proj,102.47914124,0.01000,0.485
22,mlp.up_proj,30.92877579,0.01000,0.504
22,mlp.gate_proj,24.13090897,0.01000,0.485
22,mlp.down_proj,418.65206909,0.01000,2.209
23,self_attn.k_proj,6.63460350,0.01000,0.489
23,self_attn.v_proj,26.71226501,0.01000,0.472
23,self_attn.q_proj,6.39267826,0.01000,0.481
23,self_attn.o_proj,234.22763062,0.01000,0.486
23,mlp.up_proj,31.12707901,0.01000,0.500
23,mlp.gate_proj,25.93458557,0.01000,0.479
23,mlp.down_proj,868.38049316,0.01000,2.240