File size: 9,067 Bytes
441d865 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 |
layer,module,loss,damp,time
0,self_attn.k_proj,0.0000472167,0.10000,1.635
0,self_attn.v_proj,0.0000078736,0.10000,0.761
0,self_attn.q_proj,0.0002322893,0.10000,0.775
0,self_attn.o_proj,0.0000110702,0.10000,0.771
0,mlp.up_proj,0.0004552265,0.10000,0.827
0,mlp.gate_proj,0.0008605841,0.10000,0.821
0,mlp.down_proj,0.0000372180,0.10000,5.562
1,self_attn.k_proj,0.0000501259,0.10000,0.757
1,self_attn.v_proj,0.0000165444,0.10000,0.743
1,self_attn.q_proj,0.0001916083,0.10000,0.751
1,self_attn.o_proj,0.0000040245,0.10000,0.765
1,mlp.up_proj,0.0092325296,0.10000,0.840
1,mlp.gate_proj,0.0138325553,0.10000,0.819
1,mlp.down_proj,0.0000251277,0.10000,5.547
2,self_attn.k_proj,0.0001338489,0.10000,0.768
2,self_attn.v_proj,0.0000271386,0.10000,0.753
2,self_attn.q_proj,0.0005077048,0.10000,0.756
2,self_attn.o_proj,0.0000081085,0.10000,0.756
2,mlp.up_proj,0.0088262850,0.10000,0.830
2,mlp.gate_proj,0.0135353442,0.10000,0.822
2,mlp.down_proj,0.0000469443,0.10000,5.641
3,self_attn.k_proj,0.0001345897,0.10000,0.772
3,self_attn.v_proj,0.0000399959,0.10000,0.760
3,self_attn.q_proj,0.0005372458,0.10000,0.763
3,self_attn.o_proj,0.0000187831,0.10000,0.762
3,mlp.up_proj,0.0167387179,0.10000,0.836
3,mlp.gate_proj,0.0207291428,0.10000,0.825
3,mlp.down_proj,0.0006986494,0.10000,5.543
4,self_attn.k_proj,0.0002373652,0.10000,0.760
4,self_attn.v_proj,0.0001024738,0.10000,0.747
4,self_attn.q_proj,0.0010985888,0.10000,0.749
4,self_attn.o_proj,0.0000181369,0.10000,0.761
4,mlp.up_proj,0.0122986446,0.10000,0.838
4,mlp.gate_proj,0.0167416077,0.10000,0.831
4,mlp.down_proj,0.0001518217,0.10000,5.565
5,self_attn.k_proj,0.0002180186,0.10000,0.763
5,self_attn.v_proj,0.0001001975,0.10000,0.768
5,self_attn.q_proj,0.0010695679,0.10000,0.756
5,self_attn.o_proj,0.0000169917,0.10000,0.769
5,mlp.up_proj,0.0181349126,0.10000,0.842
5,mlp.gate_proj,0.0210626856,0.10000,0.832
5,mlp.down_proj,0.0000545735,0.10000,5.585
6,self_attn.k_proj,0.0001318691,0.10000,0.759
6,self_attn.v_proj,0.0000696637,0.10000,0.750
6,self_attn.q_proj,0.0006738798,0.10000,0.748
6,self_attn.o_proj,0.0000257538,0.10000,0.761
6,mlp.up_proj,0.0029716475,0.10000,0.837
6,mlp.gate_proj,0.0042372570,0.10000,0.827
6,mlp.down_proj,0.0001331812,0.10000,5.695
7,self_attn.k_proj,0.0001290255,0.10000,0.759
7,self_attn.v_proj,0.0001260896,0.10000,0.745
7,self_attn.q_proj,0.0007587422,0.10000,0.747
7,self_attn.o_proj,0.0000583953,0.10000,0.754
7,mlp.up_proj,0.0023285143,0.10000,0.835
7,mlp.gate_proj,0.0025514315,0.10000,0.818
7,mlp.down_proj,0.0002113085,0.10000,5.588
8,self_attn.k_proj,0.0002543362,0.10000,0.760
8,self_attn.v_proj,0.0001154977,0.10000,0.749
8,self_attn.q_proj,0.0011885152,0.10000,0.752
8,self_attn.o_proj,0.0000742859,0.10000,0.761
8,mlp.up_proj,0.0026835205,0.10000,0.836
8,mlp.gate_proj,0.0027838197,0.10000,0.836
8,mlp.down_proj,0.0002283458,0.10000,5.535
9,self_attn.k_proj,0.0001838648,0.10000,0.759
9,self_attn.v_proj,0.0001650378,0.10000,0.744
9,self_attn.q_proj,0.0010429632,0.10000,0.751
9,self_attn.o_proj,0.0001184023,0.10000,0.758
9,mlp.up_proj,0.0057535404,0.10000,0.832
9,mlp.gate_proj,0.0091259328,0.10000,0.825
9,mlp.down_proj,0.0003028532,0.10000,5.987
10,self_attn.k_proj,0.0001916147,0.10000,0.773
10,self_attn.v_proj,0.0001171599,0.10000,0.743
10,self_attn.q_proj,0.0010033896,0.10000,0.750
10,self_attn.o_proj,0.0000735668,0.10000,0.770
10,mlp.up_proj,0.0029951623,0.10000,0.831
10,mlp.gate_proj,0.0032918856,0.10000,0.816
10,mlp.down_proj,0.0002347663,0.10000,5.543
11,self_attn.k_proj,0.0002426945,0.10000,0.754
11,self_attn.v_proj,0.0001072995,0.10000,0.844
11,self_attn.q_proj,0.0011513309,0.10000,0.899
11,self_attn.o_proj,0.0000928968,0.10000,0.912
11,mlp.up_proj,0.0028736497,0.10000,1.027
11,mlp.gate_proj,0.0029332547,0.10000,0.832
11,mlp.down_proj,0.0002235528,0.10000,5.550
12,self_attn.k_proj,0.0002664533,0.10000,0.766
12,self_attn.v_proj,0.0001384261,0.10000,0.748
12,self_attn.q_proj,0.0012836385,0.10000,0.755
12,self_attn.o_proj,0.0001158217,0.10000,0.800
12,mlp.up_proj,0.0030152578,0.10000,0.856
12,mlp.gate_proj,0.0029214713,0.10000,0.852
12,mlp.down_proj,0.0002485149,0.10000,5.819
13,self_attn.k_proj,0.0002370596,0.10000,0.751
13,self_attn.v_proj,0.0001593123,0.10000,0.751
13,self_attn.q_proj,0.0013060732,0.10000,0.753
13,self_attn.o_proj,0.0001333592,0.10000,0.761
13,mlp.up_proj,0.0030158192,0.10000,0.844
13,mlp.gate_proj,0.0031320744,0.10000,0.832
13,mlp.down_proj,0.0002281524,0.10000,5.580
14,self_attn.k_proj,0.0003049479,0.10000,0.756
14,self_attn.v_proj,0.0001570591,0.10000,0.736
14,self_attn.q_proj,0.0016287128,0.10000,0.747
14,self_attn.o_proj,0.0001430852,0.10000,0.768
14,mlp.up_proj,0.0032785469,0.10000,0.844
14,mlp.gate_proj,0.0031912735,0.10000,0.828
14,mlp.down_proj,0.0002534288,0.10000,5.665
15,self_attn.k_proj,0.0002922762,0.10000,0.747
15,self_attn.v_proj,0.0001391043,0.10000,0.745
15,self_attn.q_proj,0.0013987548,0.10000,0.754
15,self_attn.o_proj,0.0001067492,0.10000,0.759
15,mlp.up_proj,0.0032067114,0.10000,0.831
15,mlp.gate_proj,0.0030483367,0.10000,0.821
15,mlp.down_proj,0.0002609062,0.10000,5.764
16,self_attn.k_proj,0.0002632407,0.10000,0.754
16,self_attn.v_proj,0.0001856220,0.10000,0.744
16,self_attn.q_proj,0.0014148347,0.10000,0.748
16,self_attn.o_proj,0.0001408646,0.10000,0.762
16,mlp.up_proj,0.0033665611,0.10000,0.843
16,mlp.gate_proj,0.0032078180,0.10000,0.823
16,mlp.down_proj,0.0002613587,0.10000,5.541
17,self_attn.k_proj,0.0002712536,0.10000,0.752
17,self_attn.v_proj,0.0002099971,0.10000,0.748
17,self_attn.q_proj,0.0016259497,0.10000,0.749
17,self_attn.o_proj,0.0001131741,0.10000,0.758
17,mlp.up_proj,0.0039933213,0.10000,0.833
17,mlp.gate_proj,0.0037328810,0.10000,0.824
17,mlp.down_proj,0.0003456270,0.10000,5.574
18,self_attn.k_proj,0.0002159712,0.10000,0.754
18,self_attn.v_proj,0.0002325307,0.10000,0.743
18,self_attn.q_proj,0.0013481819,0.10000,0.761
18,self_attn.o_proj,0.0001833125,0.10000,0.759
18,mlp.up_proj,0.0043035444,0.10000,0.836
18,mlp.gate_proj,0.0040026095,0.10000,0.828
18,mlp.down_proj,0.0004392644,0.10000,5.576
19,self_attn.k_proj,0.0002050852,0.10000,0.763
19,self_attn.v_proj,0.0002661283,0.10000,0.746
19,self_attn.q_proj,0.0014559043,0.10000,0.756
19,self_attn.o_proj,0.0002159337,0.10000,0.758
19,mlp.up_proj,0.0047093964,0.10000,0.832
19,mlp.gate_proj,0.0046096435,0.10000,0.822
19,mlp.down_proj,0.0005018536,0.10000,5.554
20,self_attn.k_proj,0.0002232794,0.10000,0.761
20,self_attn.v_proj,0.0003003416,0.10000,0.750
20,self_attn.q_proj,0.0014417838,0.10000,0.748
20,self_attn.o_proj,0.0001322579,0.10000,0.758
20,mlp.up_proj,0.0060516974,0.10000,0.834
20,mlp.gate_proj,0.0059635491,0.10000,0.820
20,mlp.down_proj,0.0009318391,0.10000,5.566
21,self_attn.k_proj,0.0002299286,0.10000,0.755
21,self_attn.v_proj,0.0004667530,0.10000,0.763
21,self_attn.q_proj,0.0017117155,0.10000,0.756
21,self_attn.o_proj,0.0003423200,0.10000,0.765
21,mlp.up_proj,0.0080906422,0.10000,0.843
21,mlp.gate_proj,0.0084336273,0.10000,0.825
21,mlp.down_proj,0.0014748711,0.10000,5.943
22,self_attn.k_proj,0.0003220915,0.10000,1.087
22,self_attn.v_proj,0.0008169382,0.10000,0.802
22,self_attn.q_proj,0.0025697731,0.10000,0.770
22,self_attn.o_proj,0.0002277115,0.10000,0.778
22,mlp.up_proj,0.0119962620,0.10000,0.844
22,mlp.gate_proj,0.0124196528,0.10000,0.831
22,mlp.down_proj,0.0026358763,0.10000,5.724
23,self_attn.k_proj,0.0004014596,0.10000,0.764
23,self_attn.v_proj,0.0011422982,0.10000,0.754
23,self_attn.q_proj,0.0030751132,0.10000,0.769
23,self_attn.o_proj,0.0006334905,0.10000,0.921
23,mlp.up_proj,0.0183306920,0.10000,0.976
23,mlp.gate_proj,0.0189817467,0.10000,0.960
23,mlp.down_proj,0.0041346475,0.10000,5.643
24,self_attn.k_proj,0.0003703904,0.10000,0.762
24,self_attn.v_proj,0.0011029526,0.10000,0.750
24,self_attn.q_proj,0.0028345045,0.10000,0.770
24,self_attn.o_proj,0.0005504099,0.10000,0.909
24,mlp.up_proj,0.0217335806,0.10000,0.969
24,mlp.gate_proj,0.0206995038,0.10000,0.960
24,mlp.down_proj,0.0059107753,0.10000,5.554
25,self_attn.k_proj,0.0004121669,0.10000,0.757
25,self_attn.v_proj,0.0018403888,0.10000,0.748
25,self_attn.q_proj,0.0034511876,0.10000,0.761
25,self_attn.o_proj,0.0008662717,0.10000,0.764
25,mlp.up_proj,0.0319784486,0.10000,0.838
25,mlp.gate_proj,0.0287693461,0.10000,0.826
25,mlp.down_proj,0.0109144369,0.10000,5.618
26,self_attn.k_proj,0.0005639863,0.10000,0.755
26,self_attn.v_proj,0.0034550298,0.10000,0.754
26,self_attn.q_proj,0.0046535053,0.10000,0.780
26,self_attn.o_proj,0.0017360485,0.10000,0.763
26,mlp.up_proj,0.0365648842,0.10000,0.832
26,mlp.gate_proj,0.0322582898,0.10000,0.820
26,mlp.down_proj,0.0291283776,0.10000,5.539
27,self_attn.k_proj,0.0007934201,0.10000,0.758
27,self_attn.v_proj,0.0045992423,0.10000,0.746
27,self_attn.q_proj,0.0079554333,0.10000,0.945
27,self_attn.o_proj,0.0039928038,0.10000,0.907
27,mlp.up_proj,0.0661130137,0.10000,0.876
27,mlp.gate_proj,0.0631849785,0.10000,0.850
27,mlp.down_proj,0.0570357308,0.10000,5.818
|