File size: 9,330 Bytes
e9117d8 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 | layer,module,loss,damp,time
0,self_attn.k_proj,1.67455,0.01000,1.374
0,self_attn.v_proj,0.01563,0.01000,0.857
0,self_attn.q_proj,2.44210,0.01000,0.843
0,self_attn.o_proj,0.00120,0.01000,1.084
0,mlp.up_proj,1.12059,0.01000,1.182
0,mlp.gate_proj,1.35096,0.01000,1.257
0,mlp.down_proj,0.00533,0.01000,3.678
1,self_attn.k_proj,1.18099,0.01000,1.487
1,self_attn.v_proj,0.04712,0.01000,1.030
1,self_attn.q_proj,2.11007,0.01000,0.790
1,self_attn.o_proj,0.00340,0.01000,0.944
1,mlp.up_proj,2.02044,0.01000,1.102
1,mlp.gate_proj,2.38063,0.01000,0.839
1,mlp.down_proj,0.27413,0.01000,4.828
2,self_attn.k_proj,5.75050,0.01000,1.325
2,self_attn.v_proj,0.24798,0.01000,1.087
2,self_attn.q_proj,8.70779,0.01000,0.789
2,self_attn.o_proj,0.00482,0.01000,0.900
2,mlp.up_proj,3.30517,0.01000,0.953
2,mlp.gate_proj,4.11650,0.01000,0.793
2,mlp.down_proj,0.02226,0.01000,3.532
3,self_attn.k_proj,4.70262,0.01000,0.979
3,self_attn.v_proj,0.42861,0.01000,0.764
3,self_attn.q_proj,8.32949,0.01000,0.773
3,self_attn.o_proj,0.00949,0.01000,0.897
3,mlp.up_proj,4.45794,0.01000,0.961
3,mlp.gate_proj,6.36765,0.01000,0.791
3,mlp.down_proj,0.04013,0.01000,3.529
4,self_attn.k_proj,4.32369,0.01000,0.994
4,self_attn.v_proj,0.41342,0.01000,0.783
4,self_attn.q_proj,7.49417,0.01000,0.784
4,self_attn.o_proj,0.02278,0.01000,0.903
4,mlp.up_proj,5.73665,0.01000,0.956
4,mlp.gate_proj,9.29301,0.01000,0.788
4,mlp.down_proj,0.07160,0.01000,3.531
5,self_attn.k_proj,7.16464,0.01000,0.988
5,self_attn.v_proj,0.41958,0.01000,0.777
5,self_attn.q_proj,11.18455,0.01000,0.782
5,self_attn.o_proj,0.02738,0.01000,0.892
5,mlp.up_proj,7.10653,0.01000,0.946
5,mlp.gate_proj,11.38163,0.01000,0.790
5,mlp.down_proj,0.10580,0.01000,3.530
6,self_attn.k_proj,5.86325,0.01000,0.985
6,self_attn.v_proj,0.47806,0.01000,0.777
6,self_attn.q_proj,10.40880,0.01000,0.787
6,self_attn.o_proj,0.04742,0.01000,0.893
6,mlp.up_proj,7.93777,0.01000,0.941
6,mlp.gate_proj,12.87985,0.01000,0.789
6,mlp.down_proj,0.13405,0.01000,3.518
7,self_attn.k_proj,6.00274,0.01000,0.992
7,self_attn.v_proj,0.51351,0.01000,0.782
7,self_attn.q_proj,9.99979,0.01000,0.789
7,self_attn.o_proj,0.07018,0.01000,0.904
7,mlp.up_proj,8.87538,0.01000,0.950
7,mlp.gate_proj,13.46894,0.01000,0.804
7,mlp.down_proj,0.16375,0.01000,3.536
8,self_attn.k_proj,7.93341,0.01000,0.990
8,self_attn.v_proj,0.70737,0.01000,0.784
8,self_attn.q_proj,12.85989,0.01000,0.783
8,self_attn.o_proj,0.09924,0.01000,0.894
8,mlp.up_proj,9.40879,0.01000,0.946
8,mlp.gate_proj,14.48714,0.01000,0.788
8,mlp.down_proj,0.17780,0.01000,3.531
9,self_attn.k_proj,7.62591,0.01000,0.983
9,self_attn.v_proj,0.98705,0.01000,0.781
9,self_attn.q_proj,12.78982,0.01000,0.774
9,self_attn.o_proj,0.12301,0.01000,0.894
9,mlp.up_proj,9.83696,0.01000,0.947
9,mlp.gate_proj,15.24170,0.01000,0.782
9,mlp.down_proj,0.19016,0.01000,3.520
10,self_attn.k_proj,9.20124,0.01000,0.991
10,self_attn.v_proj,0.76641,0.01000,0.780
10,self_attn.q_proj,14.94425,0.01000,0.781
10,self_attn.o_proj,0.11261,0.01000,0.932
10,mlp.up_proj,10.17253,0.01000,0.965
10,mlp.gate_proj,14.70482,0.01000,0.800
10,mlp.down_proj,0.19970,0.01000,3.538
11,self_attn.k_proj,8.29908,0.01000,0.985
11,self_attn.v_proj,0.77584,0.01000,0.788
11,self_attn.q_proj,12.99333,0.01000,0.808
11,self_attn.o_proj,0.11676,0.01000,0.944
11,mlp.up_proj,10.72510,0.01000,0.978
11,mlp.gate_proj,15.03487,0.01000,0.821
11,mlp.down_proj,0.21327,0.01000,3.583
12,self_attn.k_proj,6.44645,0.01000,1.021
12,self_attn.v_proj,0.91089,0.01000,0.796
12,self_attn.q_proj,11.28430,0.01000,0.779
12,self_attn.o_proj,0.13829,0.01000,0.936
12,mlp.up_proj,11.09363,0.01000,0.978
12,mlp.gate_proj,14.70452,0.01000,0.805
12,mlp.down_proj,0.24356,0.01000,4.140
13,self_attn.k_proj,9.63378,0.01000,1.097
13,self_attn.v_proj,0.99925,0.01000,0.881
13,self_attn.q_proj,14.75355,0.01000,0.894
13,self_attn.o_proj,0.16912,0.01000,1.016
13,mlp.up_proj,11.90938,0.01000,1.172
13,mlp.gate_proj,15.78435,0.01000,0.916
13,mlp.down_proj,0.27893,0.01000,4.015
14,self_attn.k_proj,10.38642,0.01000,1.284
14,self_attn.v_proj,1.07203,0.01000,1.051
14,self_attn.q_proj,15.21779,0.01000,0.881
14,self_attn.o_proj,0.19986,0.01000,1.216
14,mlp.up_proj,13.33181,0.01000,1.147
14,mlp.gate_proj,18.61642,0.01000,1.023
14,mlp.down_proj,0.35034,0.01000,4.122
15,self_attn.k_proj,9.63450,0.01000,1.434
15,self_attn.v_proj,1.32576,0.01000,0.933
15,self_attn.q_proj,18.02941,0.01000,0.930
15,self_attn.o_proj,0.21734,0.01000,1.394
15,mlp.up_proj,14.15202,0.01000,1.456
15,mlp.gate_proj,20.87254,0.01000,1.301
15,mlp.down_proj,0.41982,0.01000,5.002
16,self_attn.k_proj,10.17006,0.01000,1.537
16,self_attn.v_proj,1.19822,0.01000,1.368
16,self_attn.q_proj,16.77322,0.01000,1.332
16,self_attn.o_proj,0.17319,0.01000,1.437
16,mlp.up_proj,15.03896,0.01000,1.548
16,mlp.gate_proj,23.45555,0.01000,1.320
16,mlp.down_proj,0.44929,0.01000,4.138
17,self_attn.k_proj,10.98778,0.01000,1.230
17,self_attn.v_proj,1.32671,0.01000,1.160
17,self_attn.q_proj,17.59847,0.01000,1.167
17,self_attn.o_proj,0.14944,0.01000,1.362
17,mlp.up_proj,15.58763,0.01000,1.431
17,mlp.gate_proj,24.89798,0.01000,1.265
17,mlp.down_proj,0.50724,0.01000,5.410
18,self_attn.k_proj,12.20277,0.01000,1.061
18,self_attn.v_proj,1.34966,0.01000,0.860
18,self_attn.q_proj,17.89468,0.01000,0.859
18,self_attn.o_proj,0.09903,0.01000,0.969
18,mlp.up_proj,16.20828,0.01000,1.016
18,mlp.gate_proj,26.16949,0.01000,1.014
18,mlp.down_proj,0.49752,0.01000,3.768
19,self_attn.k_proj,10.93621,0.01000,1.069
19,self_attn.v_proj,1.46302,0.01000,0.864
19,self_attn.q_proj,18.15470,0.01000,0.892
19,self_attn.o_proj,0.09105,0.01000,0.966
19,mlp.up_proj,16.72400,0.01000,1.025
19,mlp.gate_proj,27.49463,0.01000,0.859
19,mlp.down_proj,0.52641,0.01000,3.792
20,self_attn.k_proj,12.09173,0.01000,1.080
20,self_attn.v_proj,1.61016,0.01000,0.849
20,self_attn.q_proj,18.90335,0.01000,0.848
20,self_attn.o_proj,0.11517,0.01000,0.975
20,mlp.up_proj,18.19626,0.01000,1.018
20,mlp.gate_proj,29.64920,0.01000,0.863
20,mlp.down_proj,0.58271,0.01000,3.782
21,self_attn.k_proj,12.01518,0.01000,1.055
21,self_attn.v_proj,1.76573,0.01000,0.847
21,self_attn.q_proj,18.27858,0.01000,0.852
21,self_attn.o_proj,0.13262,0.01000,0.967
21,mlp.up_proj,19.45468,0.01000,1.116
21,mlp.gate_proj,31.98465,0.01000,0.862
21,mlp.down_proj,0.67858,0.01000,3.763
22,self_attn.k_proj,12.72928,0.01000,1.063
22,self_attn.v_proj,2.06985,0.01000,0.857
22,self_attn.q_proj,18.57751,0.01000,0.860
22,self_attn.o_proj,0.13445,0.01000,1.005
22,mlp.up_proj,20.37171,0.01000,1.036
22,mlp.gate_proj,33.14872,0.01000,0.859
22,mlp.down_proj,0.69553,0.01000,3.849
23,self_attn.k_proj,12.33203,0.01000,1.063
23,self_attn.v_proj,2.26092,0.01000,0.848
23,self_attn.q_proj,19.39859,0.01000,0.839
23,self_attn.o_proj,0.10357,0.01000,0.974
23,mlp.up_proj,21.54764,0.01000,1.021
23,mlp.gate_proj,34.85669,0.01000,0.880
23,mlp.down_proj,0.73572,0.01000,3.760
24,self_attn.k_proj,12.36280,0.01000,1.060
24,self_attn.v_proj,2.82739,0.01000,0.858
24,self_attn.q_proj,19.50312,0.01000,0.853
24,self_attn.o_proj,0.12827,0.01000,0.973
24,mlp.up_proj,22.87259,0.01000,1.019
24,mlp.gate_proj,37.01811,0.01000,0.854
24,mlp.down_proj,0.78521,0.01000,3.805
25,self_attn.k_proj,11.61044,0.01000,1.061
25,self_attn.v_proj,2.95012,0.01000,0.875
25,self_attn.q_proj,19.60500,0.01000,0.886
25,self_attn.o_proj,0.13309,0.01000,1.018
25,mlp.up_proj,24.36775,0.01000,1.044
25,mlp.gate_proj,39.39181,0.01000,0.863
25,mlp.down_proj,0.86602,0.01000,3.757
26,self_attn.k_proj,12.30509,0.01000,1.084
26,self_attn.v_proj,2.74246,0.01000,0.853
26,self_attn.q_proj,18.88729,0.01000,0.847
26,self_attn.o_proj,0.19489,0.01000,0.997
26,mlp.up_proj,25.92906,0.01000,1.036
26,mlp.gate_proj,42.05636,0.01000,0.878
26,mlp.down_proj,0.97078,0.01000,3.787
27,self_attn.k_proj,13.45363,0.01000,1.077
27,self_attn.v_proj,3.96388,0.01000,0.875
27,self_attn.q_proj,19.69077,0.01000,0.855
27,self_attn.o_proj,0.23587,0.01000,0.994
27,mlp.up_proj,28.29988,0.01000,1.044
27,mlp.gate_proj,45.52046,0.01000,0.866
27,mlp.down_proj,1.14506,0.01000,3.800
28,self_attn.k_proj,10.64583,0.01000,1.074
28,self_attn.v_proj,3.52820,0.01000,0.853
28,self_attn.q_proj,18.24191,0.01000,0.848
28,self_attn.o_proj,0.43366,0.01000,0.962
28,mlp.up_proj,31.36622,0.01000,1.023
28,mlp.gate_proj,48.24959,0.01000,0.859
28,mlp.down_proj,1.47378,0.01000,3.777
29,self_attn.k_proj,11.08085,0.01000,1.051
29,self_attn.v_proj,4.26497,0.01000,1.238
29,self_attn.q_proj,19.39488,0.01000,0.862
29,self_attn.o_proj,0.35388,0.01000,1.016
29,mlp.up_proj,33.49432,0.01000,1.029
29,mlp.gate_proj,49.36393,0.01000,0.887
29,mlp.down_proj,1.94291,0.01000,3.813
30,self_attn.k_proj,11.22392,0.01000,1.064
30,self_attn.v_proj,5.82378,0.01000,0.860
30,self_attn.q_proj,17.92860,0.01000,0.885
30,self_attn.o_proj,0.66760,0.01000,0.974
30,mlp.up_proj,35.52309,0.01000,1.037
30,mlp.gate_proj,53.53950,0.01000,0.871
30,mlp.down_proj,3.13855,0.01000,3.752
31,self_attn.k_proj,8.07040,0.01000,1.064
31,self_attn.v_proj,3.51582,0.01000,0.857
31,self_attn.q_proj,15.25764,0.01000,0.857
31,self_attn.o_proj,1.23350,0.01000,0.969
31,mlp.up_proj,33.48654,0.01000,1.024
31,mlp.gate_proj,48.67476,0.01000,0.865
31,mlp.down_proj,8.08488,0.01000,3.776
|