| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000000083,0.05000,2.801 | |
| 0,self_attn.v_proj,0.0000000015,0.05000,3.668 | |
| 0,self_attn.q_proj,0.0000000251,0.05000,3.745 | |
| 0,self_attn.o_proj,0.0000000110,0.05000,1.639 | |
| 0,mlp.up_proj,0.0000001725,0.05000,3.559 | |
| 0,mlp.gate_proj,0.0000001806,0.05000,3.618 | |
| 0,mlp.down_proj,0.0000002677,0.05000,10.839 | |
| 1,self_attn.k_proj,0.0000000149,0.05000,2.811 | |
| 1,self_attn.q_proj,0.0000000459,0.05000,3.997 | |
| 1,self_attn.v_proj,0.0000000011,0.05000,4.111 | |
| 1,self_attn.o_proj,0.0000000008,0.05000,1.864 | |
| 1,mlp.up_proj,0.0000005314,0.05000,2.267 | |
| 1,mlp.gate_proj,0.0000005708,0.05000,2.466 | |
| 1,mlp.down_proj,0.0008954810,0.05000,10.477 | |
| 2,self_attn.k_proj,0.0000017003,0.05000,2.652 | |
| 2,self_attn.v_proj,0.0000007950,0.05000,3.484 | |
| 2,self_attn.q_proj,0.0000059055,0.05000,3.614 | |
| 2,self_attn.o_proj,0.0000000424,0.05000,1.277 | |
| 2,mlp.gate_proj,0.0000011904,0.05000,2.334 | |
| 2,mlp.up_proj,0.0000011452,0.05000,2.412 | |
| 2,mlp.down_proj,0.0000004341,0.05000,10.311 | |
| 3,self_attn.k_proj,0.0000009851,0.05000,2.816 | |
| 3,self_attn.v_proj,0.0000006563,0.05000,3.597 | |
| 3,self_attn.q_proj,0.0000038229,0.05000,3.621 | |
| 3,self_attn.o_proj,0.0000000834,0.05000,1.285 | |
| 3,mlp.up_proj,0.0000022597,0.05000,2.520 | |
| 3,mlp.gate_proj,0.0000022850,0.05000,3.079 | |
| 3,mlp.down_proj,0.0000005211,0.05000,10.449 | |
| 4,self_attn.k_proj,0.0000018191,0.05000,2.985 | |
| 4,self_attn.v_proj,0.0000010711,0.05000,3.764 | |
| 4,self_attn.q_proj,0.0000081581,0.05000,3.782 | |
| 4,self_attn.o_proj,0.0000000304,0.05000,1.860 | |
| 4,mlp.up_proj,0.0000046734,0.05000,2.533 | |
| 4,mlp.gate_proj,0.0000047490,0.05000,2.683 | |
| 4,mlp.down_proj,0.0000006586,0.05000,10.609 | |
| 5,self_attn.k_proj,0.0000023617,0.05000,2.850 | |
| 5,self_attn.q_proj,0.0000099481,0.05000,3.971 | |
| 5,self_attn.v_proj,0.0000015744,0.05000,4.083 | |
| 5,self_attn.o_proj,0.0000000285,0.05000,1.372 | |
| 5,mlp.up_proj,0.0000073123,0.05000,2.438 | |
| 5,mlp.gate_proj,0.0000075287,0.05000,2.879 | |
| 5,mlp.down_proj,0.0000008138,0.05000,10.709 | |
| 6,self_attn.k_proj,0.0000017332,0.05000,4.147 | |
| 6,self_attn.v_proj,0.0000011686,0.05000,4.478 | |
| 6,self_attn.q_proj,0.0000073121,0.05000,4.581 | |
| 6,self_attn.o_proj,0.0000000446,0.05000,1.469 | |
| 6,mlp.gate_proj,0.0000097913,0.05000,2.368 | |
| 6,mlp.up_proj,0.0000095291,0.05000,2.919 | |
| 6,mlp.down_proj,0.0000009594,0.05000,10.571 | |
| 7,self_attn.k_proj,0.0000027421,0.05000,2.770 | |
| 7,self_attn.q_proj,0.0000113997,0.05000,3.784 | |
| 7,self_attn.v_proj,0.0000015898,0.05000,3.829 | |
| 7,self_attn.o_proj,0.0000000912,0.05000,1.297 | |
| 7,mlp.up_proj,0.0000124562,0.05000,3.032 | |
| 7,mlp.gate_proj,0.0000126258,0.05000,3.314 | |
| 7,mlp.down_proj,0.0000011960,0.05000,10.648 | |
| 8,self_attn.k_proj,0.0000023173,0.05000,3.331 | |
| 8,self_attn.v_proj,0.0000015135,0.05000,3.717 | |
| 8,self_attn.q_proj,0.0000095175,0.05000,3.746 | |
| 8,self_attn.o_proj,0.0000003093,0.05000,1.370 | |
| 8,mlp.up_proj,0.0000149982,0.05000,2.418 | |
| 8,mlp.gate_proj,0.0000154397,0.05000,2.432 | |
| 8,mlp.down_proj,0.0000014202,0.05000,10.242 | |
| 9,self_attn.k_proj,0.0000066278,0.05000,2.205 | |
| 9,self_attn.v_proj,0.0000042719,0.05000,3.611 | |
| 9,self_attn.q_proj,0.0000310723,0.05000,3.647 | |
| 9,self_attn.o_proj,0.0000003253,0.05000,1.521 | |
| 9,mlp.up_proj,0.0000164987,0.05000,2.277 | |
| 9,mlp.gate_proj,0.0000169119,0.05000,2.939 | |
| 9,mlp.down_proj,0.0000014821,0.05000,9.982 | |
| 10,self_attn.k_proj,0.0000041501,0.05000,4.286 | |
| 10,self_attn.v_proj,0.0000025467,0.05000,5.287 | |
| 10,self_attn.q_proj,0.0000184065,0.05000,5.428 | |
| 10,self_attn.o_proj,0.0000005432,0.05000,2.022 | |
| 10,mlp.up_proj,0.0000209421,0.05000,2.286 | |
| 10,mlp.gate_proj,0.0000215232,0.05000,2.288 | |
| 10,mlp.down_proj,0.0000019321,0.05000,9.870 | |
| 11,self_attn.k_proj,0.0000050158,0.05000,2.621 | |
| 11,self_attn.q_proj,0.0000225202,0.05000,4.319 | |
| 11,self_attn.v_proj,0.0000027536,0.05000,4.330 | |
| 11,self_attn.o_proj,0.0000005548,0.05000,1.415 | |
| 11,mlp.up_proj,0.0000250286,0.05000,2.988 | |
| 11,mlp.gate_proj,0.0000259055,0.05000,3.693 | |
| 11,mlp.down_proj,0.0000024918,0.05000,10.089 | |
| 12,self_attn.k_proj,0.0000068994,0.05000,3.237 | |
| 12,self_attn.v_proj,0.0000042734,0.05000,3.701 | |
| 12,self_attn.q_proj,0.0000326316,0.05000,3.724 | |
| 12,self_attn.o_proj,0.0000007876,0.05000,1.301 | |
| 12,mlp.gate_proj,0.0000298471,0.05000,3.191 | |
| 12,mlp.up_proj,0.0000289676,0.05000,3.479 | |
| 12,mlp.down_proj,0.0000029149,0.05000,10.114 | |
| 13,self_attn.k_proj,0.0000064426,0.05000,5.791 | |
| 13,self_attn.v_proj,0.0000039875,0.05000,5.964 | |
| 13,self_attn.q_proj,0.0000294749,0.05000,5.970 | |
| 13,self_attn.o_proj,0.0000007967,0.05000,1.514 | |
| 13,mlp.up_proj,0.0000338720,0.05000,2.458 | |
| 13,mlp.gate_proj,0.0000348873,0.05000,2.836 | |
| 13,mlp.down_proj,0.0000035293,0.05000,10.281 | |
| 14,self_attn.k_proj,0.0000058921,0.05000,3.164 | |
| 14,self_attn.q_proj,0.0000269218,0.05000,3.748 | |
| 14,self_attn.v_proj,0.0000036618,0.05000,3.829 | |
| 14,self_attn.o_proj,0.0000012175,0.05000,1.601 | |
| 14,mlp.gate_proj,0.0000368255,0.05000,2.808 | |
| 14,mlp.up_proj,0.0000357753,0.05000,3.098 | |
| 14,mlp.down_proj,0.0000040114,0.05000,10.563 | |
| 15,self_attn.k_proj,0.0000086019,0.05000,3.701 | |
| 15,self_attn.v_proj,0.0000053368,0.05000,5.146 | |
| 15,self_attn.q_proj,0.0000419557,0.05000,5.228 | |
| 15,self_attn.o_proj,0.0000008724,0.05000,1.579 | |
| 15,mlp.up_proj,0.0000460644,0.05000,2.887 | |
| 15,mlp.gate_proj,0.0000476075,0.05000,3.425 | |
| 15,mlp.down_proj,0.0000048976,0.05000,9.888 | |
| 16,self_attn.k_proj,0.0000082341,0.05000,5.013 | |
| 16,self_attn.v_proj,0.0000048371,0.05000,5.535 | |
| 16,self_attn.q_proj,0.0000386040,0.05000,5.702 | |
| 16,self_attn.o_proj,0.0000010662,0.05000,2.095 | |
| 16,mlp.gate_proj,0.0000521022,0.05000,2.975 | |
| 16,mlp.up_proj,0.0000503771,0.05000,3.305 | |
| 16,mlp.down_proj,0.0000054525,0.05000,10.122 | |
| 17,self_attn.k_proj,0.0000061613,0.05000,4.726 | |
| 17,self_attn.q_proj,0.0000277395,0.05000,5.913 | |
| 17,self_attn.v_proj,0.0000041849,0.05000,6.056 | |
| 17,self_attn.o_proj,0.0000012010,0.05000,1.321 | |
| 17,mlp.up_proj,0.0000482309,0.05000,3.047 | |
| 17,mlp.gate_proj,0.0000496327,0.05000,3.600 | |
| 17,mlp.down_proj,0.0000058314,0.05000,9.859 | |
| 18,self_attn.k_proj,0.0000118444,0.05000,4.966 | |
| 18,self_attn.v_proj,0.0000075373,0.05000,5.667 | |
| 18,self_attn.q_proj,0.0000540507,0.05000,5.745 | |
| 18,self_attn.o_proj,0.0000008202,0.05000,1.912 | |
| 18,mlp.gate_proj,0.0000609206,0.05000,2.793 | |
| 18,mlp.up_proj,0.0000588649,0.05000,3.529 | |
| 18,mlp.down_proj,0.0000070946,0.05000,10.016 | |
| 19,self_attn.k_proj,0.0000157993,0.05000,3.537 | |
| 19,self_attn.v_proj,0.0000108652,0.05000,4.267 | |
| 19,self_attn.q_proj,0.0000753431,0.05000,4.286 | |
| 19,self_attn.o_proj,0.0000013361,0.05000,1.404 | |
| 19,mlp.up_proj,0.0000660162,0.05000,2.908 | |
| 19,mlp.gate_proj,0.0000681782,0.05000,3.769 | |
| 19,mlp.down_proj,0.0000091892,0.05000,9.745 | |
| 20,self_attn.k_proj,0.0000056131,0.05000,3.304 | |
| 20,self_attn.q_proj,0.0000264988,0.05000,3.821 | |
| 20,self_attn.v_proj,0.0000038339,0.05000,3.839 | |
| 20,self_attn.o_proj,0.0000018202,0.05000,1.302 | |
| 20,mlp.gate_proj,0.0000797798,0.05000,3.315 | |
| 20,mlp.up_proj,0.0000766321,0.05000,4.039 | |
| 20,mlp.down_proj,0.0000116587,0.05000,10.135 | |
| 21,self_attn.k_proj,0.0000042461,0.05000,4.730 | |
| 21,self_attn.v_proj,0.0000033028,0.05000,5.579 | |
| 21,self_attn.q_proj,0.0000213052,0.05000,5.632 | |
| 21,self_attn.o_proj,0.0000021744,0.05000,1.345 | |
| 21,mlp.up_proj,0.0000685877,0.05000,2.487 | |
| 21,mlp.gate_proj,0.0000712155,0.05000,2.985 | |
| 21,mlp.down_proj,0.0000109436,0.05000,10.802 | |
| 22,self_attn.k_proj,0.0000133198,0.05000,3.967 | |
| 22,self_attn.q_proj,0.0000699285,0.05000,4.560 | |
| 22,self_attn.v_proj,0.0000091933,0.05000,4.602 | |
| 22,self_attn.o_proj,0.0000039613,0.05000,1.496 | |
| 22,mlp.gate_proj,0.0000963684,0.05000,3.037 | |
| 22,mlp.up_proj,0.0000934268,0.05000,3.375 | |
| 22,mlp.down_proj,0.0000168737,0.05000,10.091 | |
| 23,self_attn.k_proj,0.0000105332,0.05000,4.407 | |
| 23,self_attn.v_proj,0.0000078797,0.05000,5.499 | |
| 23,self_attn.q_proj,0.0000594658,0.05000,5.634 | |
| 23,self_attn.o_proj,0.0000044322,0.05000,1.477 | |
| 23,mlp.up_proj,0.0001014435,0.05000,2.413 | |
| 23,mlp.gate_proj,0.0001047793,0.05000,3.027 | |
| 23,mlp.down_proj,0.0000205954,0.05000,10.521 | |
| 24,self_attn.k_proj,0.0000087163,0.05000,4.241 | |
| 24,self_attn.v_proj,0.0000081206,0.05000,5.273 | |
| 24,self_attn.q_proj,0.0000487051,0.05000,5.349 | |
| 24,self_attn.o_proj,0.0000041695,0.05000,1.943 | |
| 24,mlp.gate_proj,0.0001185606,0.05000,2.247 | |
| 24,mlp.up_proj,0.0001142659,0.05000,2.634 | |
| 24,mlp.down_proj,0.0000222536,0.05000,9.938 | |
| 25,self_attn.k_proj,0.0000159422,0.05000,5.600 | |
| 25,self_attn.q_proj,0.0000910267,0.05000,6.226 | |
| 25,self_attn.v_proj,0.0000118083,0.05000,6.265 | |
| 25,self_attn.o_proj,0.0000043021,0.05000,1.467 | |
| 25,mlp.up_proj,0.0001309119,0.05000,2.772 | |
| 25,mlp.gate_proj,0.0001353980,0.05000,3.218 | |
| 25,mlp.down_proj,0.0000241417,0.05000,10.532 | |
| 26,self_attn.k_proj,0.0000108861,0.05000,4.942 | |
| 26,self_attn.v_proj,0.0000087073,0.05000,5.588 | |
| 26,self_attn.q_proj,0.0000611677,0.05000,5.713 | |
| 26,self_attn.o_proj,0.0000065317,0.05000,1.936 | |
| 26,mlp.gate_proj,0.0001480991,0.05000,3.145 | |
| 26,mlp.up_proj,0.0001433836,0.05000,3.778 | |
| 26,mlp.down_proj,0.0000240256,0.05000,10.395 | |
| 27,self_attn.k_proj,0.0000106976,0.05000,5.811 | |
| 27,self_attn.v_proj,0.0000089176,0.05000,7.266 | |
| 27,self_attn.q_proj,0.0000583077,0.05000,7.287 | |
| 27,self_attn.o_proj,0.0000055713,0.05000,1.422 | |
| 27,mlp.up_proj,0.0001546191,0.05000,3.105 | |
| 27,mlp.gate_proj,0.0001595489,0.05000,3.358 | |
| 27,mlp.down_proj,0.0000252766,0.05000,10.085 | |
| 28,self_attn.k_proj,0.0000106178,0.05000,3.588 | |
| 28,self_attn.v_proj,0.0000092871,0.05000,5.132 | |
| 28,self_attn.q_proj,0.0000590332,0.05000,5.250 | |
| 28,self_attn.o_proj,0.0000037944,0.05000,1.689 | |
| 28,mlp.gate_proj,0.0001684963,0.05000,2.882 | |
| 28,mlp.up_proj,0.0001638806,0.05000,3.409 | |
| 28,mlp.down_proj,0.0000282866,0.05000,10.498 | |
| 29,self_attn.k_proj,0.0000135726,0.05000,4.407 | |
| 29,self_attn.q_proj,0.0000726531,0.05000,5.414 | |
| 29,self_attn.v_proj,0.0000103901,0.05000,5.424 | |
| 29,self_attn.o_proj,0.0000080586,0.05000,2.105 | |
| 29,mlp.up_proj,0.0001746968,0.05000,3.565 | |
| 29,mlp.gate_proj,0.0001798793,0.05000,4.246 | |
| 29,mlp.down_proj,0.0000321623,0.05000,11.065 | |
| 30,self_attn.k_proj,0.0000140717,0.05000,3.663 | |
| 30,self_attn.q_proj,0.0000811999,0.05000,5.291 | |
| 30,self_attn.v_proj,0.0000122248,0.05000,5.443 | |
| 30,self_attn.o_proj,0.0000073549,0.05000,1.336 | |
| 30,mlp.gate_proj,0.0001978493,0.05000,2.970 | |
| 30,mlp.up_proj,0.0001912195,0.05000,3.170 | |
| 30,mlp.down_proj,0.0000367621,0.05000,10.588 | |
| 31,self_attn.k_proj,0.0000160960,0.05000,3.959 | |
| 31,self_attn.v_proj,0.0000136198,0.05000,4.718 | |
| 31,self_attn.q_proj,0.0000900179,0.05000,4.759 | |
| 31,self_attn.o_proj,0.0000038948,0.05000,1.532 | |
| 31,mlp.up_proj,0.0002086598,0.05000,3.211 | |
| 31,mlp.gate_proj,0.0002161677,0.05000,3.409 | |
| 31,mlp.down_proj,0.0000391139,0.05000,11.071 | |
| 32,self_attn.k_proj,0.0000179868,0.05000,3.373 | |
| 32,self_attn.v_proj,0.0000154724,0.05000,3.916 | |
| 32,self_attn.q_proj,0.0001030208,0.05000,3.929 | |
| 32,self_attn.o_proj,0.0000053135,0.05000,1.284 | |
| 32,mlp.gate_proj,0.0002262592,0.05000,3.688 | |
| 32,mlp.up_proj,0.0002187264,0.05000,4.227 | |
| 32,mlp.down_proj,0.0000405399,0.05000,9.981 | |
| 33,self_attn.k_proj,0.0000160961,0.05000,4.525 | |
| 33,self_attn.v_proj,0.0000170791,0.05000,5.440 | |
| 33,self_attn.q_proj,0.0000897349,0.05000,5.454 | |
| 33,self_attn.o_proj,0.0000053545,0.05000,1.438 | |
| 33,mlp.up_proj,0.0002320241,0.05000,2.904 | |
| 33,mlp.gate_proj,0.0002413577,0.05000,3.199 | |
| 33,mlp.down_proj,0.0000431549,0.05000,10.102 | |
| 34,self_attn.k_proj,0.0000183636,0.05000,3.295 | |
| 34,self_attn.v_proj,0.0000186837,0.05000,3.895 | |
| 34,self_attn.q_proj,0.0001030182,0.05000,3.942 | |
| 34,self_attn.o_proj,0.0000041321,0.05000,1.393 | |
| 34,mlp.gate_proj,0.0002522255,0.05000,2.408 | |
| 34,mlp.up_proj,0.0002426109,0.05000,2.843 | |
| 34,mlp.down_proj,0.0000454112,0.05000,10.617 | |
| 35,self_attn.k_proj,0.0000207992,0.05000,4.379 | |
| 35,self_attn.v_proj,0.0000225918,0.05000,5.554 | |
| 35,self_attn.q_proj,0.0001199924,0.05000,5.573 | |
| 35,self_attn.o_proj,0.0000040412,0.05000,1.432 | |
| 35,mlp.up_proj,0.0002503290,0.05000,2.908 | |
| 35,mlp.gate_proj,0.0002594362,0.05000,3.366 | |
| 35,mlp.down_proj,0.0000470948,0.05000,10.480 | |
| 36,self_attn.k_proj,0.0000219349,0.05000,4.102 | |
| 36,self_attn.v_proj,0.0000232664,0.05000,5.307 | |
| 36,self_attn.q_proj,0.0001268069,0.05000,5.618 | |
| 36,self_attn.o_proj,0.0000040203,0.05000,1.959 | |
| 36,mlp.gate_proj,0.0002621903,0.05000,3.678 | |
| 36,mlp.up_proj,0.0002539390,0.05000,4.000 | |
| 36,mlp.down_proj,0.0000465977,0.05000,10.591 | |
| 37,self_attn.k_proj,0.0000200738,0.05000,2.686 | |
| 37,self_attn.v_proj,0.0000199910,0.05000,3.659 | |
| 37,self_attn.q_proj,0.0001136281,0.05000,3.686 | |
| 37,self_attn.o_proj,0.0000048593,0.05000,2.126 | |
| 37,mlp.up_proj,0.0002583565,0.05000,3.098 | |
| 37,mlp.gate_proj,0.0002655766,0.05000,3.535 | |
| 37,mlp.down_proj,0.0000479880,0.05000,11.099 | |
| 38,self_attn.k_proj,0.0000200595,0.05000,4.477 | |
| 38,self_attn.q_proj,0.0001108004,0.05000,5.556 | |
| 38,self_attn.v_proj,0.0000190509,0.05000,5.688 | |
| 38,self_attn.o_proj,0.0000070049,0.05000,1.376 | |
| 38,mlp.gate_proj,0.0002721755,0.05000,3.439 | |
| 38,mlp.up_proj,0.0002650407,0.05000,4.081 | |
| 38,mlp.down_proj,0.0000503930,0.05000,10.563 | |
| 39,self_attn.k_proj,0.0000188938,0.05000,4.884 | |
| 39,self_attn.v_proj,0.0000189752,0.05000,6.029 | |
| 39,self_attn.q_proj,0.0001064655,0.05000,6.105 | |
| 39,self_attn.o_proj,0.0000065238,0.05000,1.458 | |
| 39,mlp.up_proj,0.0002677968,0.05000,3.408 | |
| 39,mlp.gate_proj,0.0002741319,0.05000,4.104 | |
| 39,mlp.down_proj,0.0000520134,0.05000,10.976 | |
| 40,self_attn.k_proj,0.0000181140,0.05000,4.835 | |
| 40,self_attn.q_proj,0.0000976440,0.05000,5.640 | |
| 40,self_attn.v_proj,0.0000150401,0.05000,5.686 | |
| 40,self_attn.o_proj,0.0000093862,0.05000,1.519 | |
| 40,mlp.gate_proj,0.0002780502,0.05000,3.650 | |
| 40,mlp.up_proj,0.0002731487,0.05000,3.825 | |
| 40,mlp.down_proj,0.0000552938,0.05000,10.034 | |
| 41,self_attn.k_proj,0.0000163513,0.05000,5.722 | |
| 41,self_attn.q_proj,0.0000870572,0.05000,6.084 | |
| 41,self_attn.v_proj,0.0000142287,0.05000,6.099 | |
| 41,self_attn.o_proj,0.0000111016,0.05000,1.415 | |
| 41,mlp.up_proj,0.0002877337,0.05000,3.506 | |
| 41,mlp.gate_proj,0.0002927616,0.05000,4.128 | |
| 41,mlp.down_proj,0.0000598941,0.05000,10.100 | |
| 42,self_attn.k_proj,0.0000208149,0.05000,3.617 | |
| 42,self_attn.v_proj,0.0000188300,0.05000,4.428 | |
| 42,self_attn.q_proj,0.0001212942,0.05000,4.470 | |
| 42,self_attn.o_proj,0.0000084364,0.05000,1.734 | |
| 42,mlp.gate_proj,0.0003029804,0.05000,2.942 | |
| 42,mlp.up_proj,0.0002992545,0.05000,3.951 | |
| 42,mlp.down_proj,0.0000666695,0.05000,10.567 | |
| 43,self_attn.k_proj,0.0000202393,0.05000,5.263 | |
| 43,self_attn.v_proj,0.0000160383,0.05000,6.047 | |
| 43,self_attn.q_proj,0.0001133183,0.05000,6.077 | |
| 43,self_attn.o_proj,0.0000116777,0.05000,1.433 | |
| 43,mlp.up_proj,0.0003094900,0.05000,3.389 | |
| 43,mlp.gate_proj,0.0003118018,0.05000,3.735 | |
| 43,mlp.down_proj,0.0000718063,0.05000,10.604 | |
| 44,self_attn.k_proj,0.0000194806,0.05000,4.637 | |
| 44,self_attn.v_proj,0.0000151572,0.05000,5.621 | |
| 44,self_attn.q_proj,0.0001099958,0.05000,5.711 | |
| 44,self_attn.o_proj,0.0000156448,0.05000,2.218 | |
| 44,mlp.gate_proj,0.0003184364,0.05000,2.689 | |
| 44,mlp.up_proj,0.0003197311,0.05000,3.826 | |
| 44,mlp.down_proj,0.0000852196,0.05000,10.424 | |
| 45,self_attn.k_proj,0.0000201222,0.05000,5.630 | |
| 45,self_attn.v_proj,0.0000133998,0.05000,6.065 | |
| 45,self_attn.q_proj,0.0001139192,0.05000,6.072 | |
| 45,self_attn.o_proj,0.0000191630,0.05000,1.640 | |
| 45,mlp.gate_proj,0.0003303454,0.05000,2.452 | |
| 45,mlp.up_proj,0.0003321944,0.05000,2.581 | |
| 45,mlp.down_proj,0.0000923942,0.05000,11.024 | |
| 46,self_attn.k_proj,0.0000208662,0.05000,6.042 | |
| 46,self_attn.q_proj,0.0001194436,0.05000,6.369 | |
| 46,self_attn.v_proj,0.0000148032,0.05000,6.429 | |
| 46,self_attn.o_proj,0.0000288283,0.05000,1.863 | |
| 46,mlp.gate_proj,0.0003436773,0.05000,2.520 | |
| 46,mlp.up_proj,0.0003469413,0.05000,3.154 | |
| 46,mlp.down_proj,0.0000952999,0.05000,10.518 | |
| 47,self_attn.k_proj,0.0000214334,0.05000,3.824 | |
| 47,self_attn.q_proj,0.0001251200,0.05000,5.947 | |
| 47,self_attn.v_proj,0.0000156858,0.05000,6.015 | |
| 47,self_attn.o_proj,0.0000303793,0.05000,1.455 | |
| 47,mlp.up_proj,0.0003539408,0.05000,3.560 | |
| 47,mlp.gate_proj,0.0003477681,0.05000,3.684 | |
| 47,mlp.down_proj,0.0001082456,0.05000,11.433 | |
| 48,self_attn.k_proj,0.0000211907,0.05000,3.360 | |
| 48,self_attn.v_proj,0.0000179982,0.05000,4.059 | |
| 48,self_attn.q_proj,0.0001335354,0.05000,4.094 | |
| 48,self_attn.o_proj,0.0000307128,0.05000,1.556 | |
| 48,mlp.gate_proj,0.0003703603,0.05000,3.153 | |
| 48,mlp.up_proj,0.0003783210,0.05000,3.774 | |
| 48,mlp.down_proj,0.0001198356,0.05000,10.141 | |
| 49,self_attn.k_proj,0.0000209502,0.05000,3.757 | |
| 49,self_attn.q_proj,0.0001260142,0.05000,4.520 | |
| 49,self_attn.v_proj,0.0000167613,0.05000,4.680 | |
| 49,self_attn.o_proj,0.0000305430,0.05000,1.799 | |
| 49,mlp.up_proj,0.0003895040,0.05000,3.318 | |
| 49,mlp.gate_proj,0.0003782024,0.05000,3.486 | |
| 49,mlp.down_proj,0.0001307161,0.05000,9.873 | |
| 50,self_attn.k_proj,0.0000252363,0.05000,3.728 | |
| 50,self_attn.q_proj,0.0001573606,0.05000,4.382 | |
| 50,self_attn.v_proj,0.0000202814,0.05000,4.473 | |
| 50,self_attn.o_proj,0.0000390682,0.05000,1.619 | |
| 50,mlp.gate_proj,0.0003780016,0.05000,3.250 | |
| 50,mlp.up_proj,0.0003912809,0.05000,3.442 | |
| 50,mlp.down_proj,0.0001442899,0.05000,10.492 | |
| 51,self_attn.k_proj,0.0000229148,0.05000,4.907 | |
| 51,self_attn.v_proj,0.0000174884,0.05000,5.864 | |
| 51,self_attn.q_proj,0.0001381872,0.05000,5.876 | |
| 51,self_attn.o_proj,0.0000442487,0.05000,1.416 | |
| 51,mlp.up_proj,0.0004139378,0.05000,2.554 | |
| 51,mlp.gate_proj,0.0004015314,0.05000,3.195 | |
| 51,mlp.down_proj,0.0001593402,0.05000,10.141 | |
| 52,self_attn.k_proj,0.0000202969,0.05000,3.946 | |
| 52,self_attn.v_proj,0.0000213655,0.05000,4.169 | |
| 52,self_attn.q_proj,0.0001336853,0.05000,4.187 | |
| 52,self_attn.o_proj,0.0000471424,0.05000,2.272 | |
| 52,mlp.up_proj,0.0004737044,0.05000,2.894 | |
| 52,mlp.gate_proj,0.0004633855,0.05000,3.020 | |
| 52,mlp.down_proj,0.0001702164,0.05000,10.075 | |
| 53,self_attn.k_proj,0.0000233158,0.05000,4.126 | |
| 53,self_attn.v_proj,0.0000240366,0.05000,5.370 | |
| 53,self_attn.q_proj,0.0001519378,0.05000,5.440 | |
| 53,self_attn.o_proj,0.0000560780,0.05000,1.780 | |
| 53,mlp.up_proj,0.0005071147,0.05000,2.588 | |
| 53,mlp.gate_proj,0.0004993066,0.05000,2.939 | |
| 53,mlp.down_proj,0.0001802003,0.05000,10.284 | |
| 54,self_attn.k_proj,0.0000233795,0.05000,5.763 | |
| 54,self_attn.v_proj,0.0000302860,0.05000,6.028 | |
| 54,self_attn.q_proj,0.0001671440,0.05000,6.056 | |
| 54,self_attn.o_proj,0.0000516430,0.05000,1.571 | |
| 54,mlp.gate_proj,0.0004992430,0.05000,3.068 | |
| 54,mlp.up_proj,0.0005091205,0.05000,3.247 | |
| 54,mlp.down_proj,0.0002011907,0.05000,10.394 | |
| 55,self_attn.k_proj,0.0000225518,0.05000,5.177 | |
| 55,self_attn.q_proj,0.0001639603,0.05000,6.168 | |
| 55,self_attn.v_proj,0.0000294938,0.05000,6.208 | |
| 55,self_attn.o_proj,0.0000627227,0.05000,1.584 | |
| 55,mlp.up_proj,0.0005316132,0.05000,3.328 | |
| 55,mlp.gate_proj,0.0005195548,0.05000,3.811 | |
| 55,mlp.down_proj,0.0002442001,0.05000,10.356 | |
| 56,self_attn.k_proj,0.0000225301,0.05000,3.469 | |
| 56,self_attn.q_proj,0.0001552724,0.05000,4.236 | |
| 56,self_attn.v_proj,0.0000271226,0.05000,4.276 | |
| 56,self_attn.o_proj,0.0000846248,0.05000,1.558 | |
| 56,mlp.up_proj,0.0005921104,0.05000,2.768 | |
| 56,mlp.gate_proj,0.0005815993,0.05000,2.898 | |
| 56,mlp.down_proj,0.0002835366,0.05000,10.899 | |
| 57,self_attn.k_proj,0.0000243415,0.05000,3.525 | |
| 57,self_attn.q_proj,0.0001702276,0.05000,4.157 | |
| 57,self_attn.v_proj,0.0000326652,0.05000,4.195 | |
| 57,self_attn.o_proj,0.0000819429,0.05000,2.206 | |
| 57,mlp.up_proj,0.0006121153,0.05000,3.169 | |
| 57,mlp.gate_proj,0.0005969814,0.05000,3.911 | |
| 57,mlp.down_proj,0.0003201960,0.05000,10.512 | |
| 58,self_attn.k_proj,0.0000230610,0.05000,3.863 | |
| 58,self_attn.q_proj,0.0001736004,0.05000,4.268 | |
| 58,self_attn.v_proj,0.0000337409,0.05000,4.346 | |
| 58,self_attn.o_proj,0.0001036850,0.05000,1.822 | |
| 58,mlp.up_proj,0.0006419046,0.05000,3.708 | |
| 58,mlp.gate_proj,0.0006233936,0.05000,4.012 | |
| 58,mlp.down_proj,0.0004100781,0.05000,10.312 | |
| 59,self_attn.k_proj,0.0000230318,0.05000,4.086 | |
| 59,self_attn.v_proj,0.0000360248,0.05000,4.579 | |
| 59,self_attn.q_proj,0.0001751451,0.05000,4.619 | |
| 59,self_attn.o_proj,0.0001193186,0.05000,1.427 | |
| 59,mlp.up_proj,0.0006782974,0.05000,3.164 | |
| 59,mlp.gate_proj,0.0006649875,0.05000,3.927 | |
| 59,mlp.down_proj,0.0004905933,0.05000,10.005 | |
| 60,self_attn.k_proj,0.0000251866,0.05000,3.282 | |
| 60,self_attn.q_proj,0.0002060774,0.05000,3.995 | |
| 60,self_attn.v_proj,0.0000460723,0.05000,4.188 | |
| 60,self_attn.o_proj,0.0001114960,0.05000,1.566 | |
| 60,mlp.gate_proj,0.0008174037,0.05000,2.739 | |
| 60,mlp.up_proj,0.0008225366,0.05000,3.500 | |
| 60,mlp.down_proj,0.0005587261,0.05000,10.227 | |
| 61,self_attn.k_proj,0.0000258454,0.05000,4.640 | |
| 61,self_attn.v_proj,0.0000503555,0.05000,5.904 | |
| 61,self_attn.q_proj,0.0002102286,0.05000,5.923 | |
| 61,self_attn.o_proj,0.0001169386,0.05000,1.617 | |
| 61,mlp.up_proj,0.0008935185,0.05000,3.215 | |
| 61,mlp.gate_proj,0.0008894754,0.05000,3.439 | |
| 61,mlp.down_proj,0.0006350579,0.05000,10.907 | |
| 62,self_attn.k_proj,0.0000268598,0.05000,5.521 | |
| 62,self_attn.q_proj,0.0002151201,0.05000,5.885 | |
| 62,self_attn.v_proj,0.0000486909,0.05000,5.921 | |
| 62,self_attn.o_proj,0.0001290587,0.05000,1.887 | |
| 62,mlp.gate_proj,0.0010197122,0.05000,2.633 | |
| 62,mlp.up_proj,0.0010123444,0.05000,3.002 | |
| 62,mlp.down_proj,0.0006712618,0.05000,10.130 | |
| 63,self_attn.k_proj,0.0000273980,0.05000,4.824 | |
| 63,self_attn.q_proj,0.0002180233,0.05000,5.999 | |
| 63,self_attn.v_proj,0.0000510471,0.05000,6.011 | |
| 63,self_attn.o_proj,0.0001430958,0.05000,1.408 | |
| 63,mlp.up_proj,0.0010752235,0.05000,3.125 | |
| 63,mlp.gate_proj,0.0010777579,0.05000,3.336 | |
| 63,mlp.down_proj,0.0008231888,0.05000,10.316 | |
| 64,self_attn.k_proj,0.0000287087,0.05000,4.932 | |
| 64,self_attn.v_proj,0.0000513718,0.05000,5.205 | |
| 64,self_attn.q_proj,0.0002276157,0.05000,5.247 | |
| 64,self_attn.o_proj,0.0001499052,0.05000,1.687 | |
| 64,mlp.gate_proj,0.0011711172,0.05000,2.610 | |
| 64,mlp.up_proj,0.0011612333,0.05000,2.662 | |
| 64,mlp.down_proj,0.0009735479,0.05000,10.802 | |
| 65,self_attn.k_proj,0.0000295248,0.05000,3.200 | |
| 65,self_attn.q_proj,0.0002333447,0.05000,4.567 | |
| 65,self_attn.v_proj,0.0000530385,0.05000,4.625 | |
| 65,self_attn.o_proj,0.0001616151,0.05000,1.720 | |
| 65,mlp.up_proj,0.0013132838,0.05000,3.553 | |
| 65,mlp.gate_proj,0.0013234123,0.05000,3.645 | |
| 65,mlp.down_proj,0.0011519318,0.05000,10.334 | |
| 66,self_attn.k_proj,0.0000266790,0.05000,3.620 | |
| 66,self_attn.q_proj,0.0002225198,0.05000,4.450 | |
| 66,self_attn.v_proj,0.0000549764,0.05000,4.473 | |
| 66,self_attn.o_proj,0.0001442126,0.05000,2.104 | |
| 66,mlp.gate_proj,0.0015637107,0.05000,3.194 | |
| 66,mlp.up_proj,0.0015373455,0.05000,3.325 | |
| 66,mlp.down_proj,0.0012165026,0.05000,10.287 | |
| 67,self_attn.k_proj,0.0000301622,0.05000,3.543 | |
| 67,self_attn.v_proj,0.0000635581,0.05000,4.372 | |
| 67,self_attn.q_proj,0.0002477100,0.05000,4.527 | |
| 67,self_attn.o_proj,0.0001255285,0.05000,1.432 | |
| 67,mlp.up_proj,0.0016497195,0.05000,2.552 | |
| 67,mlp.gate_proj,0.0016621593,0.05000,2.809 | |
| 67,mlp.down_proj,0.0013005061,0.05000,9.696 | |
| 68,self_attn.k_proj,0.0000300613,0.05000,3.659 | |
| 68,self_attn.v_proj,0.0000724966,0.05000,4.544 | |
| 68,self_attn.q_proj,0.0002595847,0.05000,4.604 | |
| 68,self_attn.o_proj,0.0001559665,0.05000,1.404 | |
| 68,mlp.gate_proj,0.0017940587,0.05000,2.552 | |
| 68,mlp.up_proj,0.0017932277,0.05000,3.165 | |
| 68,mlp.down_proj,0.0014139637,0.05000,10.390 | |
| 69,self_attn.k_proj,0.0000318312,0.05000,3.465 | |
| 69,self_attn.v_proj,0.0000637588,0.05000,5.358 | |
| 69,self_attn.q_proj,0.0002578544,0.05000,5.386 | |
| 69,self_attn.o_proj,0.0001961804,0.05000,1.971 | |
| 69,mlp.up_proj,0.0019337971,0.05000,3.210 | |
| 69,mlp.gate_proj,0.0019088080,0.05000,3.295 | |
| 69,mlp.down_proj,0.0016905874,0.05000,10.535 | |
| 70,self_attn.k_proj,0.0000300106,0.05000,6.354 | |
| 70,self_attn.v_proj,0.0000823853,0.05000,6.654 | |
| 70,self_attn.q_proj,0.0002635716,0.05000,6.729 | |
| 70,self_attn.o_proj,0.0002364156,0.05000,1.422 | |
| 70,mlp.gate_proj,0.0021568899,0.05000,3.061 | |
| 70,mlp.up_proj,0.0022101400,0.05000,3.624 | |
| 70,mlp.down_proj,0.0020723711,0.05000,10.561 | |
| 71,self_attn.k_proj,0.0000319353,0.05000,4.750 | |
| 71,self_attn.q_proj,0.0002720949,0.05000,5.836 | |
| 71,self_attn.v_proj,0.0000836154,0.05000,5.881 | |
| 71,self_attn.o_proj,0.0002595553,0.05000,1.423 | |
| 71,mlp.up_proj,0.0024055358,0.05000,3.296 | |
| 71,mlp.gate_proj,0.0023240922,0.05000,3.780 | |
| 71,mlp.down_proj,0.0024203319,0.05000,10.366 | |
| 72,self_attn.k_proj,0.0000296554,0.05000,3.744 | |
| 72,self_attn.v_proj,0.0000946795,0.05000,4.144 | |
| 72,self_attn.q_proj,0.0002719569,0.05000,4.283 | |
| 72,self_attn.o_proj,0.0002646630,0.05000,1.306 | |
| 72,mlp.gate_proj,0.0025021866,0.05000,3.322 | |
| 72,mlp.up_proj,0.0026187636,0.05000,3.756 | |
| 72,mlp.down_proj,0.0027510167,0.05000,10.491 | |
| 73,self_attn.k_proj,0.0000315544,0.05000,4.145 | |
| 73,self_attn.v_proj,0.0001030523,0.05000,4.373 | |
| 73,self_attn.q_proj,0.0002792062,0.05000,4.487 | |
| 73,self_attn.o_proj,0.0002852725,0.05000,1.665 | |
| 73,mlp.up_proj,0.0028002660,0.05000,3.200 | |
| 73,mlp.gate_proj,0.0026514100,0.05000,3.300 | |
| 73,mlp.down_proj,0.0031029999,0.05000,11.276 | |
| 74,self_attn.k_proj,0.0000305290,0.05000,5.100 | |
| 74,self_attn.q_proj,0.0002951643,0.05000,5.785 | |
| 74,self_attn.v_proj,0.0001025656,0.05000,5.861 | |
| 74,self_attn.o_proj,0.0002881407,0.05000,2.083 | |
| 74,mlp.gate_proj,0.0027340488,0.05000,3.195 | |
| 74,mlp.up_proj,0.0029187105,0.05000,3.344 | |
| 74,mlp.down_proj,0.0036612688,0.05000,10.380 | |
| 75,self_attn.k_proj,0.0000301170,0.05000,3.534 | |
| 75,self_attn.q_proj,0.0002765698,0.05000,4.145 | |
| 75,self_attn.v_proj,0.0001125341,0.05000,4.246 | |
| 75,self_attn.o_proj,0.0003999441,0.05000,1.543 | |
| 75,mlp.up_proj,0.0031332221,0.05000,3.166 | |
| 75,mlp.gate_proj,0.0029146747,0.05000,3.312 | |
| 75,mlp.down_proj,0.0044430610,0.05000,10.050 | |
| 76,self_attn.k_proj,0.0000310636,0.05000,3.517 | |
| 76,self_attn.v_proj,0.0001647931,0.05000,4.473 | |
| 76,self_attn.q_proj,0.0003088401,0.05000,4.522 | |
| 76,self_attn.o_proj,0.0005387367,0.05000,1.715 | |
| 76,mlp.gate_proj,0.0030735200,0.05000,3.051 | |
| 76,mlp.up_proj,0.0033259669,0.05000,3.256 | |
| 76,mlp.down_proj,0.0062650401,0.05000,10.385 | |
| 77,self_attn.k_proj,0.0000278382,0.05000,3.388 | |
| 77,self_attn.v_proj,0.0001166612,0.05000,5.630 | |
| 77,self_attn.q_proj,0.0002810968,0.05000,5.661 | |
| 77,self_attn.o_proj,0.0005502004,0.05000,1.990 | |
| 77,mlp.gate_proj,0.0031031745,0.05000,2.545 | |
| 77,mlp.up_proj,0.0033627802,0.05000,2.666 | |
| 77,mlp.down_proj,0.0079508036,0.05000,11.004 | |
| 78,self_attn.k_proj,0.0000245423,0.05000,6.015 | |
| 78,self_attn.q_proj,0.0002503374,0.05000,6.199 | |
| 78,self_attn.v_proj,0.0001106485,0.05000,6.213 | |
| 78,self_attn.o_proj,0.0006962114,0.05000,1.416 | |
| 78,mlp.gate_proj,0.0027146134,0.05000,2.491 | |
| 78,mlp.up_proj,0.0029000152,0.05000,3.054 | |
| 78,mlp.down_proj,0.0163781559,0.05000,10.409 | |
| 79,self_attn.k_proj,0.0000201428,0.05000,4.882 | |
| 79,self_attn.q_proj,0.0001729193,0.05000,6.246 | |
| 79,self_attn.v_proj,0.0000415108,0.05000,6.258 | |
| 79,self_attn.o_proj,0.0001995059,0.05000,1.762 | |
| 79,mlp.up_proj,0.0020708944,0.05000,3.238 | |
| 79,mlp.gate_proj,0.0019782346,0.05000,4.098 | |
| 79,mlp.down_proj,0.0213594078,0.05000,10.760 | |