File size: 10,367 Bytes
c2bfc8a | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.0000000099,0.05000,4.817
0,self_attn.q_proj,0.0000000326,0.05000,4.873
0,self_attn.v_proj,0.0000000008,0.05000,4.883
0,self_attn.o_proj,0.0000000000,0.05000,1.506
0,mlp.gate_proj,0.0000000322,0.05000,2.852
0,mlp.up_proj,0.0000000279,0.05000,2.861
0,mlp.down_proj,0.0000000000,0.05000,5.854
1,self_attn.v_proj,0.0000000075,0.05000,5.948
1,self_attn.q_proj,0.0000000986,0.05000,5.967
1,self_attn.k_proj,0.0000000453,0.05000,5.986
1,self_attn.o_proj,0.0000000000,0.05000,1.513
1,mlp.gate_proj,0.0000001107,0.05000,2.723
1,mlp.up_proj,0.0000000970,0.05000,2.728
1,mlp.down_proj,0.0000000181,0.05000,5.748
2,self_attn.v_proj,0.0000000473,0.05000,5.806
2,self_attn.k_proj,0.0000003621,0.05000,5.825
2,self_attn.q_proj,0.0000007457,0.05000,5.841
2,self_attn.o_proj,0.0000000000,0.05000,1.545
2,mlp.gate_proj,0.0000002318,0.05000,2.761
2,mlp.up_proj,0.0000002023,0.05000,2.779
2,mlp.down_proj,0.0000000001,0.05000,5.801
3,self_attn.q_proj,0.0000004040,0.05000,5.748
3,self_attn.k_proj,0.0000001964,0.05000,5.757
3,self_attn.v_proj,0.0000000324,0.05000,5.836
3,self_attn.o_proj,0.0000000000,0.05000,1.507
3,mlp.up_proj,0.0000003335,0.05000,2.726
3,mlp.gate_proj,0.0000003861,0.05000,2.737
3,mlp.down_proj,0.0000000001,0.05000,5.850
4,self_attn.k_proj,0.0000002752,0.05000,5.885
4,self_attn.q_proj,0.0000006219,0.05000,5.899
4,self_attn.v_proj,0.0000000542,0.05000,5.920
4,self_attn.o_proj,0.0000000000,0.05000,1.511
4,mlp.gate_proj,0.0000005583,0.05000,2.707
4,mlp.up_proj,0.0000004521,0.05000,2.712
4,mlp.down_proj,0.0000000003,0.05000,5.795
5,self_attn.v_proj,0.0000000601,0.05000,5.651
5,self_attn.k_proj,0.0000003567,0.05000,5.685
5,self_attn.q_proj,0.0000008041,0.05000,5.708
5,self_attn.o_proj,0.0000000001,0.05000,1.530
5,mlp.gate_proj,0.0000007742,0.05000,2.754
5,mlp.up_proj,0.0000005881,0.05000,2.759
5,mlp.down_proj,0.0000000004,0.05000,5.792
6,self_attn.q_proj,0.0000007546,0.05000,5.715
6,self_attn.v_proj,0.0000000610,0.05000,5.753
6,self_attn.k_proj,0.0000003538,0.05000,5.763
6,self_attn.o_proj,0.0000000001,0.05000,1.491
6,mlp.up_proj,0.0000006991,0.05000,2.700
6,mlp.gate_proj,0.0000008995,0.05000,2.717
6,mlp.down_proj,0.0000000006,0.05000,5.790
7,self_attn.k_proj,0.0000004439,0.05000,5.755
7,self_attn.q_proj,0.0000009290,0.05000,5.785
7,self_attn.v_proj,0.0000000806,0.05000,5.807
7,self_attn.o_proj,0.0000000002,0.05000,1.512
7,mlp.up_proj,0.0000008049,0.05000,2.738
7,mlp.gate_proj,0.0000010599,0.05000,2.751
7,mlp.down_proj,0.0000000008,0.05000,5.833
8,self_attn.v_proj,0.0000000749,0.05000,5.644
8,self_attn.k_proj,0.0000003480,0.05000,5.679
8,self_attn.q_proj,0.0000007657,0.05000,5.711
8,self_attn.o_proj,0.0000000003,0.05000,1.486
8,mlp.gate_proj,0.0000011395,0.05000,2.710
8,mlp.up_proj,0.0000008825,0.05000,2.716
8,mlp.down_proj,0.0000000009,0.05000,5.785
9,self_attn.k_proj,0.0000004894,0.05000,5.779
9,self_attn.q_proj,0.0000010457,0.05000,5.846
9,self_attn.v_proj,0.0000000885,0.05000,5.857
9,self_attn.o_proj,0.0000000003,0.05000,1.521
9,mlp.gate_proj,0.0000011959,0.05000,2.735
9,mlp.up_proj,0.0000009581,0.05000,2.754
9,mlp.down_proj,0.0000000011,0.05000,5.800
10,self_attn.v_proj,0.0000000776,0.05000,5.689
10,self_attn.k_proj,0.0000004430,0.05000,5.697
10,self_attn.q_proj,0.0000009305,0.05000,5.710
10,self_attn.o_proj,0.0000000006,0.05000,1.482
10,mlp.gate_proj,0.0000012489,0.05000,2.718
10,mlp.up_proj,0.0000010243,0.05000,2.723
10,mlp.down_proj,0.0000000013,0.05000,5.783
11,self_attn.q_proj,0.0000011214,0.05000,5.811
11,self_attn.k_proj,0.0000005155,0.05000,5.824
11,self_attn.v_proj,0.0000001141,0.05000,5.853
11,self_attn.o_proj,0.0000000008,0.05000,1.511
11,mlp.gate_proj,0.0000013628,0.05000,2.734
11,mlp.up_proj,0.0000011338,0.05000,2.743
11,mlp.down_proj,0.0000000015,0.05000,5.785
12,self_attn.q_proj,0.0000014866,0.05000,5.701
12,self_attn.v_proj,0.0000001297,0.05000,5.702
12,self_attn.k_proj,0.0000006694,0.05000,5.701
12,self_attn.o_proj,0.0000000009,0.05000,1.521
12,mlp.up_proj,0.0000012766,0.05000,2.776
12,mlp.gate_proj,0.0000015000,0.05000,2.783
12,mlp.down_proj,0.0000000019,0.05000,5.699
13,self_attn.k_proj,0.0000005692,0.05000,5.850
13,self_attn.v_proj,0.0000001234,0.05000,5.908
13,self_attn.q_proj,0.0000011665,0.05000,5.942
13,self_attn.o_proj,0.0000000011,0.05000,1.479
13,mlp.up_proj,0.0000014674,0.05000,2.721
13,mlp.gate_proj,0.0000016768,0.05000,2.732
13,mlp.down_proj,0.0000000024,0.05000,5.763
14,self_attn.q_proj,0.0000013253,0.05000,5.565
14,self_attn.k_proj,0.0000005664,0.05000,5.643
14,self_attn.v_proj,0.0000001981,0.05000,5.653
14,self_attn.o_proj,0.0000000014,0.05000,1.508
14,mlp.gate_proj,0.0000018725,0.05000,2.713
14,mlp.up_proj,0.0000016302,0.05000,2.741
14,mlp.down_proj,0.0000000030,0.05000,5.708
15,self_attn.k_proj,0.0000007359,0.05000,5.857
15,self_attn.q_proj,0.0000016581,0.05000,5.863
15,self_attn.v_proj,0.0000002239,0.05000,5.899
15,self_attn.o_proj,0.0000000015,0.05000,1.513
15,mlp.up_proj,0.0000017916,0.05000,2.713
15,mlp.gate_proj,0.0000021294,0.05000,2.719
15,mlp.down_proj,0.0000000038,0.05000,5.826
16,self_attn.v_proj,0.0000002110,0.05000,5.704
16,self_attn.k_proj,0.0000006766,0.05000,5.723
16,self_attn.q_proj,0.0000014709,0.05000,5.736
16,self_attn.o_proj,0.0000000017,0.05000,1.504
16,mlp.up_proj,0.0000020874,0.05000,2.717
16,mlp.gate_proj,0.0000026221,0.05000,2.732
16,mlp.down_proj,0.0000000054,0.05000,5.778
17,self_attn.v_proj,0.0000002017,0.05000,5.752
17,self_attn.q_proj,0.0000013624,0.05000,5.840
17,self_attn.k_proj,0.0000005692,0.05000,5.847
17,self_attn.o_proj,0.0000000022,0.05000,1.490
17,mlp.gate_proj,0.0000030491,0.05000,2.742
17,mlp.up_proj,0.0000024313,0.05000,2.746
17,mlp.down_proj,0.0000000074,0.05000,5.748
18,self_attn.k_proj,0.0000006751,0.05000,5.822
18,self_attn.v_proj,0.0000002480,0.05000,5.845
18,self_attn.q_proj,0.0000017297,0.05000,5.888
18,self_attn.o_proj,0.0000000020,0.05000,1.496
18,mlp.gate_proj,0.0000034365,0.05000,2.732
18,mlp.up_proj,0.0000027417,0.05000,2.739
18,mlp.down_proj,0.0000000107,0.05000,5.821
19,self_attn.v_proj,0.0000002874,0.05000,5.735
19,self_attn.q_proj,0.0000015817,0.05000,5.766
19,self_attn.k_proj,0.0000006702,0.05000,5.773
19,self_attn.o_proj,0.0000000025,0.05000,1.524
19,mlp.up_proj,0.0000030297,0.05000,2.756
19,mlp.gate_proj,0.0000038671,0.05000,2.773
19,mlp.down_proj,0.0000000143,0.05000,5.762
20,self_attn.q_proj,0.0000016975,0.05000,5.790
20,self_attn.k_proj,0.0000006890,0.05000,5.835
20,self_attn.v_proj,0.0000003146,0.05000,5.849
20,self_attn.o_proj,0.0000000023,0.05000,1.505
20,mlp.up_proj,0.0000033502,0.05000,2.737
20,mlp.gate_proj,0.0000043862,0.05000,2.745
20,mlp.down_proj,0.0000000149,0.05000,5.762
21,self_attn.q_proj,0.0000016742,0.05000,5.741
21,self_attn.v_proj,0.0000003297,0.05000,5.744
21,self_attn.k_proj,0.0000006758,0.05000,5.762
21,self_attn.o_proj,0.0000000024,0.05000,1.527
21,mlp.up_proj,0.0000036733,0.05000,2.724
21,mlp.gate_proj,0.0000051593,0.05000,2.730
21,mlp.down_proj,0.0000000152,0.05000,5.811
22,self_attn.k_proj,0.0000006403,0.05000,5.796
22,self_attn.v_proj,0.0000003419,0.05000,5.830
22,self_attn.q_proj,0.0000016118,0.05000,5.901
22,self_attn.o_proj,0.0000000014,0.05000,1.528
22,mlp.up_proj,0.0000039479,0.05000,2.729
22,mlp.gate_proj,0.0000054861,0.05000,2.733
22,mlp.down_proj,0.0000000157,0.05000,5.797
23,self_attn.v_proj,0.0000003579,0.05000,5.894
23,self_attn.k_proj,0.0000006380,0.05000,5.895
23,self_attn.q_proj,0.0000016239,0.05000,5.922
23,self_attn.o_proj,0.0000000023,0.05000,1.531
23,mlp.gate_proj,0.0000060618,0.05000,2.698
23,mlp.up_proj,0.0000043452,0.05000,2.699
23,mlp.down_proj,0.0000000177,0.05000,5.782
24,self_attn.k_proj,0.0000007371,0.05000,5.596
24,self_attn.q_proj,0.0000018533,0.05000,5.663
24,self_attn.v_proj,0.0000004165,0.05000,5.676
24,self_attn.o_proj,0.0000000021,0.05000,1.492
24,mlp.gate_proj,0.0000068435,0.05000,2.771
24,mlp.up_proj,0.0000048163,0.05000,2.777
24,mlp.down_proj,0.0000000192,0.05000,5.771
25,self_attn.k_proj,0.0000007104,0.05000,5.831
25,self_attn.v_proj,0.0000004764,0.05000,5.842
25,self_attn.q_proj,0.0000018583,0.05000,5.841
25,self_attn.o_proj,0.0000000024,0.05000,1.509
25,mlp.up_proj,0.0000052669,0.05000,2.721
25,mlp.gate_proj,0.0000074224,0.05000,2.730
25,mlp.down_proj,0.0000000218,0.05000,5.820
26,self_attn.v_proj,0.0000005038,0.05000,5.621
26,self_attn.k_proj,0.0000006691,0.05000,5.630
26,self_attn.q_proj,0.0000017644,0.05000,5.648
26,self_attn.o_proj,0.0000000033,0.05000,1.515
26,mlp.up_proj,0.0000057272,0.05000,2.755
26,mlp.gate_proj,0.0000077866,0.05000,2.775
26,mlp.down_proj,0.0000000250,0.05000,5.808
27,self_attn.q_proj,0.0000018230,0.05000,5.916
27,self_attn.v_proj,0.0000004564,0.05000,5.989
27,self_attn.k_proj,0.0000006762,0.05000,6.016
27,self_attn.o_proj,0.0000000037,0.05000,1.485
27,mlp.up_proj,0.0000063079,0.05000,2.725
27,mlp.gate_proj,0.0000085269,0.05000,2.739
27,mlp.down_proj,0.0000000300,0.05000,5.801
28,self_attn.v_proj,0.0000006713,0.05000,5.844
28,self_attn.k_proj,0.0000006783,0.05000,5.868
28,self_attn.q_proj,0.0000017780,0.05000,5.884
28,self_attn.o_proj,0.0000000056,0.05000,1.507
28,mlp.up_proj,0.0000070183,0.05000,2.716
28,mlp.gate_proj,0.0000091368,0.05000,2.723
28,mlp.down_proj,0.0000000409,0.05000,5.721
29,self_attn.v_proj,0.0000009821,0.05000,5.830
29,self_attn.k_proj,0.0000006843,0.05000,5.854
29,self_attn.q_proj,0.0000020354,0.05000,5.860
29,self_attn.o_proj,0.0000000119,0.05000,1.516
29,mlp.gate_proj,0.0000088944,0.05000,2.812
29,mlp.up_proj,0.0000071220,0.05000,2.825
29,mlp.down_proj,0.0000000519,0.05000,5.835
30,self_attn.q_proj,0.0000018947,0.05000,5.718
30,self_attn.k_proj,0.0000006325,0.05000,5.845
30,self_attn.v_proj,0.0000010680,0.05000,5.874
30,self_attn.o_proj,0.0000000106,0.05000,1.507
30,mlp.gate_proj,0.0000089889,0.05000,2.782
30,mlp.up_proj,0.0000073173,0.05000,2.796
30,mlp.down_proj,0.0000000681,0.05000,5.731
31,self_attn.v_proj,0.0000010866,0.05000,5.793
31,self_attn.k_proj,0.0000006014,0.05000,5.846
31,self_attn.q_proj,0.0000017606,0.05000,5.861
31,self_attn.o_proj,0.0000000142,0.05000,1.512
31,mlp.gate_proj,0.0000075029,0.05000,2.765
31,mlp.up_proj,0.0000059300,0.05000,2.774
31,mlp.down_proj,0.0000001083,0.05000,5.806
|