| layer,module,loss,samples,damp,time | |
| 0,self_attn.q_proj,0.0000000324,0.05000,4.436 | |
| 0,self_attn.v_proj,0.0000000035,0.05000,4.455 | |
| 0,self_attn.k_proj,0.0000000111,0.05000,4.459 | |
| 0,self_attn.o_proj,0.0000000759,0.05000,1.211 | |
| 0,mlp.gate_proj,0.0000000274,0.05000,2.813 | |
| 0,mlp.up_proj,0.0000000245,0.05000,2.824 | |
| 0,mlp.down_proj,0.0000000294,0.05000,10.000 | |
| 1,self_attn.q_proj,0.0000000009,0.05000,4.127 | |
| 1,self_attn.v_proj,0.0000000002,0.05000,4.230 | |
| 1,self_attn.k_proj,0.0000000003,0.05000,4.249 | |
| 1,self_attn.o_proj,0.0000000006,0.05000,1.204 | |
| 1,mlp.gate_proj,0.0000003582,0.05000,2.661 | |
| 1,mlp.up_proj,0.0000001132,0.05000,2.667 | |
| 1,mlp.down_proj,0.0000000022,0.05000,10.466 | |
| 2,self_attn.q_proj,0.0000000043,0.05000,3.938 | |
| 2,self_attn.v_proj,0.0000000008,0.05000,4.050 | |
| 2,self_attn.k_proj,0.0000000016,0.05000,4.061 | |
| 2,self_attn.o_proj,0.0000000039,0.05000,1.220 | |
| 2,mlp.up_proj,0.0000002441,0.05000,2.791 | |
| 2,mlp.gate_proj,0.0000005469,0.05000,2.802 | |
| 2,mlp.down_proj,0.0000000187,0.05000,10.187 | |
| 3,self_attn.q_proj,0.0000000301,0.05000,3.879 | |
| 3,self_attn.v_proj,0.0000000048,0.05000,3.900 | |
| 3,self_attn.k_proj,0.0000000102,0.05000,3.948 | |
| 3,self_attn.o_proj,0.0000000171,0.05000,1.212 | |
| 3,mlp.gate_proj,0.0000007210,0.05000,2.708 | |
| 3,mlp.up_proj,0.0000002926,0.05000,2.718 | |
| 3,mlp.down_proj,0.0000000532,0.05000,10.084 | |
| 4,self_attn.q_proj,0.0000000334,0.05000,4.845 | |
| 4,self_attn.v_proj,0.0000000064,0.05000,4.913 | |
| 4,self_attn.k_proj,0.0000000108,0.05000,4.953 | |
| 4,self_attn.o_proj,0.0000000321,0.05000,1.210 | |
| 4,mlp.gate_proj,0.0000013479,0.05000,3.096 | |
| 4,mlp.up_proj,0.0000007025,0.05000,3.113 | |
| 4,mlp.down_proj,0.0000259130,0.05000,10.195 | |
| 5,self_attn.q_proj,0.0000001416,0.05000,5.425 | |
| 5,self_attn.v_proj,0.0000000291,0.05000,5.547 | |
| 5,self_attn.k_proj,0.0000000431,0.05000,5.627 | |
| 5,self_attn.o_proj,0.0000000541,0.05000,1.249 | |
| 5,mlp.up_proj,0.0000012457,0.05000,2.783 | |
| 5,mlp.gate_proj,0.0000022161,0.05000,2.793 | |
| 5,mlp.down_proj,0.0000287616,0.05000,10.440 | |
| 6,self_attn.q_proj,0.0000001439,0.05000,4.196 | |
| 6,self_attn.k_proj,0.0000000409,0.05000,4.206 | |
| 6,self_attn.v_proj,0.0000000335,0.05000,4.227 | |
| 6,self_attn.o_proj,0.0000000399,0.05000,1.195 | |
| 6,mlp.up_proj,0.0000021073,0.05000,2.691 | |
| 6,mlp.gate_proj,0.0000034542,0.05000,2.697 | |
| 6,mlp.down_proj,0.0000011519,0.05000,10.137 | |
| 7,self_attn.q_proj,0.0000002029,0.05000,4.391 | |
| 7,self_attn.v_proj,0.0000000490,0.05000,4.433 | |
| 7,self_attn.k_proj,0.0000000571,0.05000,4.463 | |
| 7,self_attn.o_proj,0.0000000491,0.05000,1.220 | |
| 7,mlp.gate_proj,0.0000044998,0.05000,2.703 | |
| 7,mlp.up_proj,0.0000027890,0.05000,2.715 | |
| 7,mlp.down_proj,0.0000001909,0.05000,10.121 | |
| 8,self_attn.q_proj,0.0000002344,0.05000,4.085 | |
| 8,self_attn.k_proj,0.0000000704,0.05000,4.127 | |
| 8,self_attn.v_proj,0.0000000546,0.05000,4.155 | |
| 8,self_attn.o_proj,0.0000000372,0.05000,1.215 | |
| 8,mlp.gate_proj,0.0000030072,0.05000,2.711 | |
| 8,mlp.up_proj,0.0000019047,0.05000,2.723 | |
| 8,mlp.down_proj,0.0000002122,0.05000,10.096 | |
| 9,self_attn.q_proj,0.0000002134,0.05000,4.216 | |
| 9,self_attn.v_proj,0.0000000544,0.05000,4.328 | |
| 9,self_attn.k_proj,0.0000000608,0.05000,4.347 | |
| 9,self_attn.o_proj,0.0000000745,0.05000,1.223 | |
| 9,mlp.gate_proj,0.0000010763,0.05000,2.700 | |
| 9,mlp.up_proj,0.0000009586,0.05000,2.706 | |
| 9,mlp.down_proj,0.0000002252,0.05000,10.224 | |
| 10,self_attn.q_proj,0.0000003315,0.05000,4.369 | |
| 10,self_attn.k_proj,0.0000000905,0.05000,4.403 | |
| 10,self_attn.v_proj,0.0000000744,0.05000,4.459 | |
| 10,self_attn.o_proj,0.0000000645,0.05000,1.223 | |
| 10,mlp.gate_proj,0.0000012525,0.05000,2.651 | |
| 10,mlp.up_proj,0.0000011368,0.05000,2.662 | |
| 10,mlp.down_proj,0.0000003049,0.05000,10.193 | |
| 11,self_attn.q_proj,0.0000002354,0.05000,4.125 | |
| 11,self_attn.v_proj,0.0000000549,0.05000,4.173 | |
| 11,self_attn.k_proj,0.0000000649,0.05000,4.225 | |
| 11,self_attn.o_proj,0.0000001205,0.05000,1.222 | |
| 11,mlp.up_proj,0.0000013557,0.05000,2.724 | |
| 11,mlp.gate_proj,0.0000016419,0.05000,2.729 | |
| 11,mlp.down_proj,0.0000002738,0.05000,10.202 | |
| 12,self_attn.q_proj,0.0000002923,0.05000,4.096 | |
| 12,self_attn.k_proj,0.0000000794,0.05000,4.143 | |
| 12,self_attn.v_proj,0.0000000662,0.05000,4.193 | |
| 12,self_attn.o_proj,0.0000001310,0.05000,1.194 | |
| 12,mlp.gate_proj,0.0000014627,0.05000,2.731 | |
| 12,mlp.up_proj,0.0000013635,0.05000,2.741 | |
| 12,mlp.down_proj,0.0000003253,0.05000,10.116 | |
| 13,self_attn.q_proj,0.0000003143,0.05000,3.821 | |
| 13,self_attn.k_proj,0.0000000899,0.05000,3.880 | |
| 13,self_attn.v_proj,0.0000000788,0.05000,3.931 | |
| 13,self_attn.o_proj,0.0000001147,0.05000,1.228 | |
| 13,mlp.gate_proj,0.0000016954,0.05000,2.748 | |
| 13,mlp.up_proj,0.0000015649,0.05000,2.748 | |
| 13,mlp.down_proj,0.0000003720,0.05000,10.206 | |
| 14,self_attn.k_proj,0.0000001135,0.05000,4.393 | |
| 14,self_attn.v_proj,0.0000000852,0.05000,4.438 | |
| 14,self_attn.q_proj,0.0000004012,0.05000,4.449 | |
| 14,self_attn.o_proj,0.0000001137,0.05000,1.240 | |
| 14,mlp.up_proj,0.0000016302,0.05000,2.790 | |
| 14,mlp.gate_proj,0.0000017848,0.05000,2.790 | |
| 14,mlp.down_proj,0.0000003895,0.05000,10.124 | |
| 15,self_attn.v_proj,0.0000000835,0.05000,4.047 | |
| 15,self_attn.q_proj,0.0000003443,0.05000,4.055 | |
| 15,self_attn.k_proj,0.0000000982,0.05000,4.089 | |
| 15,self_attn.o_proj,0.0000001418,0.05000,1.205 | |
| 15,mlp.up_proj,0.0000017047,0.05000,2.747 | |
| 15,mlp.gate_proj,0.0000019363,0.05000,2.747 | |
| 15,mlp.down_proj,0.0000004060,0.05000,10.131 | |
| 16,self_attn.q_proj,0.0000002841,0.05000,3.986 | |
| 16,self_attn.v_proj,0.0000000640,0.05000,4.085 | |
| 16,self_attn.k_proj,0.0000000856,0.05000,4.094 | |
| 16,self_attn.o_proj,0.0000001066,0.05000,1.210 | |
| 16,mlp.gate_proj,0.0000017007,0.05000,2.742 | |
| 16,mlp.up_proj,0.0000015746,0.05000,2.741 | |
| 16,mlp.down_proj,0.0000003646,0.05000,10.223 | |
| 17,self_attn.v_proj,0.0000000767,0.05000,4.194 | |
| 17,self_attn.q_proj,0.0000003798,0.05000,4.202 | |
| 17,self_attn.k_proj,0.0000001117,0.05000,4.211 | |
| 17,self_attn.o_proj,0.0000000858,0.05000,1.205 | |
| 17,mlp.gate_proj,0.0000016459,0.05000,2.756 | |
| 17,mlp.up_proj,0.0000015492,0.05000,2.756 | |
| 17,mlp.down_proj,0.0000003436,0.05000,10.194 | |
| 18,self_attn.q_proj,0.0000003655,0.05000,4.023 | |
| 18,self_attn.v_proj,0.0000000815,0.05000,4.067 | |
| 18,self_attn.k_proj,0.0000001092,0.05000,4.075 | |
| 18,self_attn.o_proj,0.0000000890,0.05000,1.210 | |
| 18,mlp.gate_proj,0.0000015888,0.05000,2.762 | |
| 18,mlp.up_proj,0.0000015035,0.05000,2.762 | |
| 18,mlp.down_proj,0.0000003304,0.05000,10.181 | |
| 19,self_attn.q_proj,0.0000003485,0.05000,3.986 | |
| 19,self_attn.v_proj,0.0000000731,0.05000,4.113 | |
| 19,self_attn.k_proj,0.0000000987,0.05000,4.126 | |
| 19,self_attn.o_proj,0.0000000734,0.05000,1.184 | |
| 19,mlp.gate_proj,0.0000015835,0.05000,2.742 | |
| 19,mlp.up_proj,0.0000015013,0.05000,2.753 | |
| 19,mlp.down_proj,0.0000003303,0.05000,10.054 | |
| 20,self_attn.q_proj,0.0000003767,0.05000,3.847 | |
| 20,self_attn.v_proj,0.0000000803,0.05000,3.858 | |
| 20,self_attn.k_proj,0.0000001126,0.05000,3.914 | |
| 20,self_attn.o_proj,0.0000001024,0.05000,1.228 | |
| 20,mlp.gate_proj,0.0000014873,0.05000,2.219 | |
| 20,mlp.up_proj,0.0000014336,0.05000,2.219 | |
| 20,mlp.down_proj,0.0000003261,0.05000,10.260 | |
| 21,self_attn.q_proj,0.0000003187,0.05000,3.842 | |
| 21,self_attn.k_proj,0.0000000929,0.05000,3.909 | |
| 21,self_attn.v_proj,0.0000000607,0.05000,3.916 | |
| 21,self_attn.o_proj,0.0000001203,0.05000,1.226 | |
| 21,mlp.gate_proj,0.0000014625,0.05000,2.236 | |
| 21,mlp.up_proj,0.0000014037,0.05000,2.236 | |
| 21,mlp.down_proj,0.0000003176,0.05000,10.220 | |
| 22,self_attn.q_proj,0.0000003521,0.05000,4.241 | |
| 22,self_attn.k_proj,0.0000000992,0.05000,4.316 | |
| 22,self_attn.v_proj,0.0000000847,0.05000,4.420 | |
| 22,self_attn.o_proj,0.0000001443,0.05000,1.248 | |
| 22,mlp.gate_proj,0.0000015310,0.05000,2.211 | |
| 22,mlp.up_proj,0.0000014704,0.05000,2.211 | |
| 22,mlp.down_proj,0.0000003498,0.05000,10.147 | |
| 23,self_attn.q_proj,0.0000003513,0.05000,4.031 | |
| 23,self_attn.v_proj,0.0000000866,0.05000,4.151 | |
| 23,self_attn.k_proj,0.0000000968,0.05000,4.175 | |
| 23,self_attn.o_proj,0.0000001508,0.05000,1.231 | |
| 23,mlp.up_proj,0.0000015408,0.05000,2.238 | |
| 23,mlp.gate_proj,0.0000016314,0.05000,2.238 | |
| 23,mlp.down_proj,0.0000003758,0.05000,10.225 | |
| 24,self_attn.k_proj,0.0000001262,0.05000,4.002 | |
| 24,self_attn.v_proj,0.0000000947,0.05000,4.090 | |
| 24,self_attn.q_proj,0.0000004348,0.05000,4.094 | |
| 24,self_attn.o_proj,0.0000001277,0.05000,1.246 | |
| 24,mlp.up_proj,0.0000015618,0.05000,2.258 | |
| 24,mlp.gate_proj,0.0000016283,0.05000,2.259 | |
| 24,mlp.down_proj,0.0000003730,0.05000,10.252 | |
| 25,self_attn.q_proj,0.0000004887,0.05000,4.635 | |
| 25,self_attn.v_proj,0.0000001125,0.05000,4.715 | |
| 25,self_attn.k_proj,0.0000001366,0.05000,4.722 | |
| 25,self_attn.o_proj,0.0000000967,0.05000,1.244 | |
| 25,mlp.up_proj,0.0000015764,0.05000,3.467 | |
| 25,mlp.gate_proj,0.0000016196,0.05000,3.473 | |
| 25,mlp.down_proj,0.0000003874,0.05000,10.163 | |
| 26,self_attn.q_proj,0.0000004309,0.05000,4.149 | |
| 26,self_attn.v_proj,0.0000000726,0.05000,4.203 | |
| 26,self_attn.k_proj,0.0000001209,0.05000,4.280 | |
| 26,self_attn.o_proj,0.0000001364,0.05000,1.219 | |
| 26,mlp.gate_proj,0.0000016653,0.05000,2.857 | |
| 26,mlp.up_proj,0.0000016355,0.05000,2.866 | |
| 26,mlp.down_proj,0.0000004174,0.05000,10.207 | |
| 27,self_attn.q_proj,0.0000003868,0.05000,4.468 | |
| 27,self_attn.k_proj,0.0000001159,0.05000,4.596 | |
| 27,self_attn.v_proj,0.0000000769,0.05000,4.613 | |
| 27,self_attn.o_proj,0.0000002341,0.05000,1.213 | |
| 27,mlp.up_proj,0.0000016877,0.05000,2.784 | |
| 27,mlp.gate_proj,0.0000017243,0.05000,2.796 | |
| 27,mlp.down_proj,0.0000004770,0.05000,10.177 | |
| 28,self_attn.q_proj,0.0000004039,0.05000,4.876 | |
| 28,self_attn.k_proj,0.0000001083,0.05000,4.974 | |
| 28,self_attn.v_proj,0.0000001101,0.05000,4.988 | |
| 28,self_attn.o_proj,0.0000002252,0.05000,1.244 | |
| 28,mlp.gate_proj,0.0000018486,0.05000,3.210 | |
| 28,mlp.up_proj,0.0000018237,0.05000,3.221 | |
| 28,mlp.down_proj,0.0000005318,0.05000,10.279 | |
| 29,self_attn.q_proj,0.0000005587,0.05000,3.988 | |
| 29,self_attn.v_proj,0.0000001449,0.05000,4.006 | |
| 29,self_attn.k_proj,0.0000001623,0.05000,4.035 | |
| 29,self_attn.o_proj,0.0000002199,0.05000,1.195 | |
| 29,mlp.up_proj,0.0000019346,0.05000,2.699 | |
| 29,mlp.gate_proj,0.0000019535,0.05000,2.699 | |
| 29,mlp.down_proj,0.0000005662,0.05000,10.096 | |
| 30,self_attn.q_proj,0.0000004907,0.05000,4.348 | |
| 30,self_attn.v_proj,0.0000001386,0.05000,4.377 | |
| 30,self_attn.k_proj,0.0000001323,0.05000,4.481 | |
| 30,self_attn.o_proj,0.0000003155,0.05000,1.211 | |
| 30,mlp.gate_proj,0.0000020732,0.05000,2.428 | |
| 30,mlp.up_proj,0.0000020535,0.05000,2.436 | |
| 30,mlp.down_proj,0.0000006065,0.05000,10.140 | |
| 31,self_attn.k_proj,0.0000001404,0.05000,4.519 | |
| 31,self_attn.q_proj,0.0000005059,0.05000,4.536 | |
| 31,self_attn.v_proj,0.0000001345,0.05000,4.547 | |
| 31,self_attn.o_proj,0.0000002848,0.05000,1.252 | |
| 31,mlp.up_proj,0.0000022315,0.05000,2.833 | |
| 31,mlp.gate_proj,0.0000022544,0.05000,2.842 | |
| 31,mlp.down_proj,0.0000006625,0.05000,10.037 | |
| 32,self_attn.q_proj,0.0000004777,0.05000,4.633 | |
| 32,self_attn.v_proj,0.0000001113,0.05000,4.658 | |
| 32,self_attn.k_proj,0.0000001374,0.05000,4.705 | |
| 32,self_attn.o_proj,0.0000002631,0.05000,1.271 | |
| 32,mlp.up_proj,0.0000025071,0.05000,3.905 | |
| 32,mlp.gate_proj,0.0000026300,0.05000,3.910 | |
| 32,mlp.down_proj,0.0000007179,0.05000,10.141 | |
| 33,self_attn.q_proj,0.0000005258,0.05000,4.372 | |
| 33,self_attn.v_proj,0.0000001103,0.05000,4.389 | |
| 33,self_attn.k_proj,0.0000001439,0.05000,4.400 | |
| 33,self_attn.o_proj,0.0000002456,0.05000,1.221 | |
| 33,mlp.up_proj,0.0000023659,0.05000,2.896 | |
| 33,mlp.gate_proj,0.0000024260,0.05000,2.911 | |
| 33,mlp.down_proj,0.0000006518,0.05000,10.165 | |
| 34,self_attn.q_proj,0.0000005065,0.05000,4.120 | |
| 34,self_attn.v_proj,0.0000001260,0.05000,4.171 | |
| 34,self_attn.k_proj,0.0000001377,0.05000,4.211 | |
| 34,self_attn.o_proj,0.0000002940,0.05000,1.205 | |
| 34,mlp.gate_proj,0.0000023332,0.05000,2.818 | |
| 34,mlp.up_proj,0.0000023197,0.05000,2.827 | |
| 34,mlp.down_proj,0.0000006274,0.05000,10.295 | |
| 35,self_attn.k_proj,0.0000001457,0.05000,4.742 | |
| 35,self_attn.v_proj,0.0000001265,0.05000,4.808 | |
| 35,self_attn.q_proj,0.0000005797,0.05000,4.860 | |
| 35,self_attn.o_proj,0.0000002040,0.05000,1.249 | |
| 35,mlp.up_proj,0.0000023275,0.05000,4.168 | |
| 35,mlp.gate_proj,0.0000023273,0.05000,4.187 | |
| 35,mlp.down_proj,0.0000006254,0.05000,10.052 | |
| 36,self_attn.k_proj,0.0000001522,0.05000,5.259 | |
| 36,self_attn.v_proj,0.0000001243,0.05000,5.288 | |
| 36,self_attn.q_proj,0.0000005616,0.05000,5.317 | |
| 36,self_attn.o_proj,0.0000002905,0.05000,1.204 | |
| 36,mlp.up_proj,0.0000021971,0.05000,3.434 | |
| 36,mlp.gate_proj,0.0000021111,0.05000,3.434 | |
| 36,mlp.down_proj,0.0000006072,0.05000,10.185 | |
| 37,self_attn.v_proj,0.0000001041,0.05000,5.204 | |
| 37,self_attn.k_proj,0.0000001296,0.05000,5.272 | |
| 37,self_attn.q_proj,0.0000004768,0.05000,5.281 | |
| 37,self_attn.o_proj,0.0000002766,0.05000,1.284 | |
| 37,mlp.gate_proj,0.0000020717,0.05000,4.166 | |
| 37,mlp.up_proj,0.0000021557,0.05000,4.190 | |
| 37,mlp.down_proj,0.0000005665,0.05000,10.365 | |
| 38,self_attn.q_proj,0.0000005129,0.05000,4.760 | |
| 38,self_attn.k_proj,0.0000001389,0.05000,4.773 | |
| 38,self_attn.v_proj,0.0000001542,0.05000,4.855 | |
| 38,self_attn.o_proj,0.0000002993,0.05000,1.251 | |
| 38,mlp.gate_proj,0.0000020834,0.05000,3.610 | |
| 38,mlp.up_proj,0.0000021530,0.05000,3.621 | |
| 38,mlp.down_proj,0.0000005768,0.05000,10.607 | |
| 39,self_attn.q_proj,0.0000005103,0.05000,4.553 | |
| 39,self_attn.v_proj,0.0000001502,0.05000,4.653 | |
| 39,self_attn.k_proj,0.0000001281,0.05000,4.786 | |
| 39,self_attn.o_proj,0.0000002914,0.05000,1.273 | |
| 39,mlp.up_proj,0.0000021633,0.05000,3.484 | |
| 39,mlp.gate_proj,0.0000021818,0.05000,3.494 | |
| 39,mlp.down_proj,0.0000005776,0.05000,10.279 | |
| 40,self_attn.q_proj,0.0000005716,0.05000,4.459 | |
| 40,self_attn.v_proj,0.0000001353,0.05000,4.543 | |
| 40,self_attn.k_proj,0.0000001658,0.05000,4.624 | |
| 40,self_attn.o_proj,0.0000003121,0.05000,1.261 | |
| 40,mlp.up_proj,0.0000020561,0.05000,3.387 | |
| 40,mlp.gate_proj,0.0000020347,0.05000,3.396 | |
| 40,mlp.down_proj,0.0000005213,0.05000,10.449 | |
| 41,self_attn.q_proj,0.0000005977,0.05000,4.511 | |
| 41,self_attn.v_proj,0.0000001723,0.05000,4.620 | |
| 41,self_attn.k_proj,0.0000001549,0.05000,4.671 | |
| 41,self_attn.o_proj,0.0000002078,0.05000,1.197 | |
| 41,mlp.up_proj,0.0000020584,0.05000,3.206 | |
| 41,mlp.gate_proj,0.0000019811,0.05000,3.211 | |
| 41,mlp.down_proj,0.0000005440,0.05000,10.192 | |
| 42,self_attn.q_proj,0.0000005447,0.05000,4.799 | |
| 42,self_attn.v_proj,0.0000001046,0.05000,4.869 | |
| 42,self_attn.k_proj,0.0000001418,0.05000,4.898 | |
| 42,self_attn.o_proj,0.0000002300,0.05000,1.202 | |
| 42,mlp.gate_proj,0.0000020579,0.05000,3.090 | |
| 42,mlp.up_proj,0.0000021793,0.05000,3.099 | |
| 42,mlp.down_proj,0.0000006287,0.05000,10.203 | |
| 43,self_attn.q_proj,0.0000005050,0.05000,4.882 | |
| 43,self_attn.v_proj,0.0000001233,0.05000,4.938 | |
| 43,self_attn.k_proj,0.0000001402,0.05000,4.942 | |
| 43,self_attn.o_proj,0.0000003650,0.05000,1.224 | |
| 43,mlp.up_proj,0.0000022805,0.05000,2.933 | |
| 43,mlp.gate_proj,0.0000021644,0.05000,2.941 | |
| 43,mlp.down_proj,0.0000007716,0.05000,10.269 | |
| 44,self_attn.q_proj,0.0000004853,0.05000,4.852 | |
| 44,self_attn.k_proj,0.0000001162,0.05000,4.984 | |
| 44,self_attn.v_proj,0.0000001711,0.05000,5.029 | |
| 44,self_attn.o_proj,0.0000003831,0.05000,1.223 | |
| 44,mlp.gate_proj,0.0000021933,0.05000,3.294 | |
| 44,mlp.up_proj,0.0000023132,0.05000,3.304 | |
| 44,mlp.down_proj,0.0000008341,0.05000,10.113 | |
| 45,self_attn.q_proj,0.0000005621,0.05000,5.854 | |
| 45,self_attn.v_proj,0.0000001808,0.05000,5.953 | |
| 45,self_attn.k_proj,0.0000001470,0.05000,5.965 | |
| 45,self_attn.o_proj,0.0000004248,0.05000,1.248 | |
| 45,mlp.gate_proj,0.0000022108,0.05000,4.233 | |
| 45,mlp.up_proj,0.0000023189,0.05000,4.260 | |
| 45,mlp.down_proj,0.0000008981,0.05000,10.290 | |
| 46,self_attn.v_proj,0.0000001954,0.05000,4.785 | |
| 46,self_attn.q_proj,0.0000005156,0.05000,4.826 | |
| 46,self_attn.k_proj,0.0000001268,0.05000,4.900 | |
| 46,self_attn.o_proj,0.0000005321,0.05000,1.249 | |
| 46,mlp.up_proj,0.0000024360,0.05000,3.471 | |
| 46,mlp.gate_proj,0.0000023494,0.05000,3.472 | |
| 46,mlp.down_proj,0.0000010055,0.05000,10.201 | |
| 47,self_attn.v_proj,0.0000001679,0.05000,4.691 | |
| 47,self_attn.q_proj,0.0000005223,0.05000,4.710 | |
| 47,self_attn.k_proj,0.0000001289,0.05000,4.719 | |
| 47,self_attn.o_proj,0.0000004607,0.05000,1.268 | |
| 47,mlp.gate_proj,0.0000026893,0.05000,3.858 | |
| 47,mlp.up_proj,0.0000027448,0.05000,3.864 | |
| 47,mlp.down_proj,0.0000012588,0.05000,10.172 | |
| 48,self_attn.q_proj,0.0000006327,0.05000,5.073 | |
| 48,self_attn.v_proj,0.0000002648,0.05000,5.203 | |
| 48,self_attn.k_proj,0.0000001448,0.05000,5.233 | |
| 48,self_attn.o_proj,0.0000004758,0.05000,1.231 | |
| 48,mlp.gate_proj,0.0000029461,0.05000,2.935 | |
| 48,mlp.up_proj,0.0000029765,0.05000,2.940 | |
| 48,mlp.down_proj,0.0000014690,0.05000,10.244 | |
| 49,self_attn.v_proj,0.0000002245,0.05000,4.624 | |
| 49,self_attn.k_proj,0.0000001446,0.05000,4.632 | |
| 49,self_attn.q_proj,0.0000006315,0.05000,4.658 | |
| 49,self_attn.o_proj,0.0000005271,0.05000,1.234 | |
| 49,mlp.gate_proj,0.0000036356,0.05000,3.329 | |
| 49,mlp.up_proj,0.0000036252,0.05000,3.334 | |
| 49,mlp.down_proj,0.0000021298,0.05000,10.279 | |
| 50,self_attn.k_proj,0.0000001516,0.05000,4.756 | |
| 50,self_attn.q_proj,0.0000007270,0.05000,4.776 | |
| 50,self_attn.v_proj,0.0000002842,0.05000,4.813 | |
| 50,self_attn.o_proj,0.0000004582,0.05000,1.252 | |
| 50,mlp.gate_proj,0.0000043000,0.05000,3.275 | |
| 50,mlp.up_proj,0.0000042078,0.05000,3.286 | |
| 50,mlp.down_proj,0.0000025875,0.05000,10.223 | |
| 51,self_attn.q_proj,0.0000006938,0.05000,4.371 | |
| 51,self_attn.v_proj,0.0000002596,0.05000,4.424 | |
| 51,self_attn.k_proj,0.0000001618,0.05000,4.483 | |
| 51,self_attn.o_proj,0.0000008299,0.05000,1.229 | |
| 51,mlp.gate_proj,0.0000049657,0.05000,2.427 | |
| 51,mlp.up_proj,0.0000048277,0.05000,2.438 | |
| 51,mlp.down_proj,0.0000031356,0.05000,9.978 | |
| 52,self_attn.q_proj,0.0000008375,0.05000,4.276 | |
| 52,self_attn.k_proj,0.0000001707,0.05000,4.316 | |
| 52,self_attn.v_proj,0.0000004551,0.05000,4.418 | |
| 52,self_attn.o_proj,0.0000006151,0.05000,1.184 | |
| 52,mlp.gate_proj,0.0000053379,0.05000,3.183 | |
| 52,mlp.up_proj,0.0000052264,0.05000,3.193 | |
| 52,mlp.down_proj,0.0000036994,0.05000,10.057 | |
| 53,self_attn.v_proj,0.0000004279,0.05000,4.637 | |
| 53,self_attn.q_proj,0.0000009236,0.05000,4.660 | |
| 53,self_attn.k_proj,0.0000001956,0.05000,4.687 | |
| 53,self_attn.o_proj,0.0000007764,0.05000,1.210 | |
| 53,mlp.gate_proj,0.0000058551,0.05000,3.038 | |
| 53,mlp.up_proj,0.0000057679,0.05000,3.049 | |
| 53,mlp.down_proj,0.0000040391,0.05000,10.019 | |
| 54,self_attn.q_proj,0.0000008725,0.05000,4.701 | |
| 54,self_attn.v_proj,0.0000003937,0.05000,4.768 | |
| 54,self_attn.k_proj,0.0000001916,0.05000,4.812 | |
| 54,self_attn.o_proj,0.0000007127,0.05000,1.175 | |
| 54,mlp.gate_proj,0.0000064098,0.05000,3.128 | |
| 54,mlp.up_proj,0.0000063912,0.05000,3.136 | |
| 54,mlp.down_proj,0.0000045518,0.05000,10.050 | |
| 55,self_attn.q_proj,0.0000008602,0.05000,4.418 | |
| 55,self_attn.k_proj,0.0000001819,0.05000,4.427 | |
| 55,self_attn.v_proj,0.0000004298,0.05000,4.438 | |
| 55,self_attn.o_proj,0.0000009435,0.05000,1.193 | |
| 55,mlp.gate_proj,0.0000069606,0.05000,3.039 | |
| 55,mlp.up_proj,0.0000070381,0.05000,3.044 | |
| 55,mlp.down_proj,0.0000053272,0.05000,9.995 | |
| 56,self_attn.q_proj,0.0000009497,0.05000,4.476 | |
| 56,self_attn.k_proj,0.0000001961,0.05000,4.625 | |
| 56,self_attn.v_proj,0.0000005621,0.05000,4.638 | |
| 56,self_attn.o_proj,0.0000008565,0.05000,1.178 | |
| 56,mlp.gate_proj,0.0000074443,0.05000,2.925 | |
| 56,mlp.up_proj,0.0000075807,0.05000,2.925 | |
| 56,mlp.down_proj,0.0000060127,0.05000,9.997 | |
| 57,self_attn.q_proj,0.0000009704,0.05000,4.552 | |
| 57,self_attn.v_proj,0.0000005494,0.05000,4.596 | |
| 57,self_attn.k_proj,0.0000001951,0.05000,4.629 | |
| 57,self_attn.o_proj,0.0000006838,0.05000,1.187 | |
| 57,mlp.gate_proj,0.0000078137,0.05000,3.010 | |
| 57,mlp.up_proj,0.0000081059,0.05000,3.023 | |
| 57,mlp.down_proj,0.0000066844,0.05000,10.025 | |
| 58,self_attn.k_proj,0.0000001917,0.05000,4.447 | |
| 58,self_attn.v_proj,0.0000005683,0.05000,4.470 | |
| 58,self_attn.q_proj,0.0000010161,0.05000,4.486 | |
| 58,self_attn.o_proj,0.0000007372,0.05000,1.170 | |
| 58,mlp.gate_proj,0.0000083187,0.05000,3.149 | |
| 58,mlp.up_proj,0.0000087371,0.05000,3.149 | |
| 58,mlp.down_proj,0.0000079389,0.05000,10.073 | |
| 59,self_attn.v_proj,0.0000008826,0.05000,4.021 | |
| 59,self_attn.k_proj,0.0000002084,0.05000,4.037 | |
| 59,self_attn.q_proj,0.0000010680,0.05000,4.068 | |
| 59,self_attn.o_proj,0.0000014713,0.05000,1.204 | |
| 59,mlp.gate_proj,0.0000090754,0.05000,3.040 | |
| 59,mlp.up_proj,0.0000097120,0.05000,3.053 | |
| 59,mlp.down_proj,0.0000100502,0.05000,10.089 | |
| 60,self_attn.q_proj,0.0000009944,0.05000,4.322 | |
| 60,self_attn.k_proj,0.0000001706,0.05000,4.379 | |
| 60,self_attn.v_proj,0.0000009851,0.05000,4.447 | |
| 60,self_attn.o_proj,0.0000019561,0.05000,1.221 | |
| 60,mlp.up_proj,0.0000104985,0.05000,3.135 | |
| 60,mlp.gate_proj,0.0000096193,0.05000,3.149 | |
| 60,mlp.down_proj,0.0000167195,0.05000,10.041 | |
| 61,self_attn.q_proj,0.0000010872,0.05000,4.283 | |
| 61,self_attn.k_proj,0.0000001805,0.05000,4.307 | |
| 61,self_attn.v_proj,0.0000012091,0.05000,4.324 | |
| 61,self_attn.o_proj,0.0000021933,0.05000,1.195 | |
| 61,mlp.up_proj,0.0000111990,0.05000,3.331 | |
| 61,mlp.gate_proj,0.0000103223,0.05000,3.331 | |
| 61,mlp.down_proj,0.0000168270,0.05000,10.114 | |
| 62,self_attn.v_proj,0.0000013395,0.05000,4.572 | |
| 62,self_attn.q_proj,0.0000010536,0.05000,4.683 | |
| 62,self_attn.k_proj,0.0000001778,0.05000,4.695 | |
| 62,self_attn.o_proj,0.0000037245,0.05000,1.225 | |
| 62,mlp.gate_proj,0.0000105226,0.05000,3.888 | |
| 62,mlp.up_proj,0.0000111446,0.05000,3.898 | |
| 62,mlp.down_proj,0.0000328190,0.05000,10.277 | |
| 63,self_attn.q_proj,0.0000008867,0.05000,4.402 | |
| 63,self_attn.k_proj,0.0000001444,0.05000,4.447 | |
| 63,self_attn.v_proj,0.0000006649,0.05000,4.507 | |
| 63,self_attn.o_proj,0.0000016701,0.05000,1.206 | |
| 63,mlp.gate_proj,0.0000111833,0.05000,2.759 | |
| 63,mlp.up_proj,0.0000115803,0.05000,2.759 | |
| 63,mlp.down_proj,0.0000507795,0.05000,10.147 | |