| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000025754,0.05000,4.550 | |
| 0,self_attn.v_proj,0.0000002206,0.05000,4.562 | |
| 0,self_attn.q_proj,0.0000087561,0.05000,4.573 | |
| 0,self_attn.o_proj,0.0000000012,0.05000,1.502 | |
| 0,mlp.up_proj,0.0000081505,0.05000,2.709 | |
| 0,mlp.gate_proj,0.0000094237,0.05000,2.716 | |
| 0,mlp.down_proj,0.0000000070,0.05000,5.802 | |
| 1,self_attn.q_proj,0.0000285129,0.05000,5.844 | |
| 1,self_attn.v_proj,0.0000020318,0.05000,5.856 | |
| 1,self_attn.k_proj,0.0000127451,0.05000,5.870 | |
| 1,self_attn.o_proj,0.0000000052,0.05000,1.503 | |
| 1,mlp.gate_proj,0.0000322149,0.05000,2.735 | |
| 1,mlp.up_proj,0.0000282160,0.05000,2.741 | |
| 1,mlp.down_proj,0.0000052935,0.05000,5.818 | |
| 2,self_attn.v_proj,0.0000137185,0.05000,5.586 | |
| 2,self_attn.k_proj,0.0001054883,0.05000,5.603 | |
| 2,self_attn.q_proj,0.0002171249,0.05000,5.632 | |
| 2,self_attn.o_proj,0.0000000075,0.05000,1.523 | |
| 2,mlp.gate_proj,0.0000672672,0.05000,2.829 | |
| 2,mlp.up_proj,0.0000587216,0.05000,2.835 | |
| 2,mlp.down_proj,0.0000000224,0.05000,5.795 | |
| 3,self_attn.v_proj,0.0000093818,0.05000,5.672 | |
| 3,self_attn.q_proj,0.0001175257,0.05000,5.684 | |
| 3,self_attn.k_proj,0.0000570549,0.05000,5.696 | |
| 3,self_attn.o_proj,0.0000000112,0.05000,1.535 | |
| 3,mlp.gate_proj,0.0001121420,0.05000,2.703 | |
| 3,mlp.up_proj,0.0000968189,0.05000,2.706 | |
| 3,mlp.down_proj,0.0000000410,0.05000,5.772 | |
| 4,self_attn.q_proj,0.0001813112,0.05000,5.543 | |
| 4,self_attn.v_proj,0.0000157679,0.05000,5.555 | |
| 4,self_attn.k_proj,0.0000802006,0.05000,5.555 | |
| 4,self_attn.o_proj,0.0000000139,0.05000,1.527 | |
| 4,mlp.gate_proj,0.0001625613,0.05000,2.747 | |
| 4,mlp.up_proj,0.0001317042,0.05000,2.761 | |
| 4,mlp.down_proj,0.0000000744,0.05000,5.809 | |
| 5,self_attn.k_proj,0.0001039211,0.05000,5.706 | |
| 5,self_attn.q_proj,0.0002341090,0.05000,5.739 | |
| 5,self_attn.v_proj,0.0000174460,0.05000,5.786 | |
| 5,self_attn.o_proj,0.0000000322,0.05000,1.503 | |
| 5,mlp.gate_proj,0.0002247521,0.05000,2.734 | |
| 5,mlp.up_proj,0.0001709394,0.05000,2.734 | |
| 5,mlp.down_proj,0.0000001268,0.05000,5.818 | |
| 6,self_attn.k_proj,0.0001032290,0.05000,5.563 | |
| 6,self_attn.v_proj,0.0000177316,0.05000,5.576 | |
| 6,self_attn.q_proj,0.0002197504,0.05000,5.594 | |
| 6,self_attn.o_proj,0.0000000426,0.05000,1.519 | |
| 6,mlp.gate_proj,0.0002620231,0.05000,2.695 | |
| 6,mlp.up_proj,0.0002037956,0.05000,2.700 | |
| 6,mlp.down_proj,0.0000001768,0.05000,5.722 | |
| 7,self_attn.k_proj,0.0001301391,0.05000,5.649 | |
| 7,self_attn.q_proj,0.0002715318,0.05000,5.686 | |
| 7,self_attn.v_proj,0.0000233400,0.05000,5.700 | |
| 7,self_attn.o_proj,0.0000000710,0.05000,1.489 | |
| 7,mlp.gate_proj,0.0003091105,0.05000,2.726 | |
| 7,mlp.up_proj,0.0002347886,0.05000,2.734 | |
| 7,mlp.down_proj,0.0000002321,0.05000,5.731 | |
| 8,self_attn.k_proj,0.0001017436,0.05000,5.731 | |
| 8,self_attn.q_proj,0.0002240664,0.05000,5.757 | |
| 8,self_attn.v_proj,0.0000217979,0.05000,5.766 | |
| 8,self_attn.o_proj,0.0000000915,0.05000,1.519 | |
| 8,mlp.up_proj,0.0002580485,0.05000,2.713 | |
| 8,mlp.gate_proj,0.0003330376,0.05000,2.718 | |
| 8,mlp.down_proj,0.0000002755,0.05000,5.747 | |
| 9,self_attn.v_proj,0.0000258198,0.05000,5.596 | |
| 9,self_attn.q_proj,0.0003062698,0.05000,5.632 | |
| 9,self_attn.k_proj,0.0001433366,0.05000,5.638 | |
| 9,self_attn.o_proj,0.0000001034,0.05000,1.490 | |
| 9,mlp.up_proj,0.0002804786,0.05000,2.756 | |
| 9,mlp.gate_proj,0.0003499140,0.05000,2.766 | |
| 9,mlp.down_proj,0.0000003341,0.05000,5.813 | |
| 10,self_attn.k_proj,0.0001297817,0.05000,5.668 | |
| 10,self_attn.v_proj,0.0000226510,0.05000,5.703 | |
| 10,self_attn.q_proj,0.0002727139,0.05000,5.738 | |
| 10,self_attn.o_proj,0.0000001711,0.05000,1.504 | |
| 10,mlp.gate_proj,0.0003655863,0.05000,2.747 | |
| 10,mlp.up_proj,0.0003002079,0.05000,2.752 | |
| 10,mlp.down_proj,0.0000003908,0.05000,5.818 | |
| 11,self_attn.v_proj,0.0000333907,0.05000,5.675 | |
| 11,self_attn.k_proj,0.0001514282,0.05000,5.690 | |
| 11,self_attn.q_proj,0.0003284788,0.05000,5.704 | |
| 11,self_attn.o_proj,0.0000002205,0.05000,1.515 | |
| 11,mlp.gate_proj,0.0003984610,0.05000,2.731 | |
| 11,mlp.up_proj,0.0003320518,0.05000,2.740 | |
| 11,mlp.down_proj,0.0000004510,0.05000,5.806 | |
| 12,self_attn.k_proj,0.0001964771,0.05000,5.543 | |
| 12,self_attn.q_proj,0.0004358755,0.05000,5.666 | |
| 12,self_attn.v_proj,0.0000379014,0.05000,5.708 | |
| 12,self_attn.o_proj,0.0000002516,0.05000,1.495 | |
| 12,mlp.up_proj,0.0003744479,0.05000,2.767 | |
| 12,mlp.gate_proj,0.0004391452,0.05000,2.776 | |
| 12,mlp.down_proj,0.0000005534,0.05000,5.815 | |
| 13,self_attn.v_proj,0.0000360716,0.05000,5.625 | |
| 13,self_attn.q_proj,0.0003422806,0.05000,5.741 | |
| 13,self_attn.k_proj,0.0001674168,0.05000,5.749 | |
| 13,self_attn.o_proj,0.0000003109,0.05000,1.493 | |
| 13,mlp.gate_proj,0.0004911288,0.05000,2.685 | |
| 13,mlp.up_proj,0.0004301303,0.05000,2.689 | |
| 13,mlp.down_proj,0.0000006914,0.05000,5.771 | |
| 14,self_attn.k_proj,0.0001664226,0.05000,5.596 | |
| 14,self_attn.v_proj,0.0000576001,0.05000,5.624 | |
| 14,self_attn.q_proj,0.0003889395,0.05000,5.668 | |
| 14,self_attn.o_proj,0.0000004098,0.05000,1.493 | |
| 14,mlp.up_proj,0.0004783811,0.05000,2.743 | |
| 14,mlp.gate_proj,0.0005488174,0.05000,2.747 | |
| 14,mlp.down_proj,0.0000008860,0.05000,5.796 | |
| 15,self_attn.q_proj,0.0004867710,0.05000,5.634 | |
| 15,self_attn.k_proj,0.0002165216,0.05000,5.752 | |
| 15,self_attn.v_proj,0.0000653710,0.05000,5.760 | |
| 15,self_attn.o_proj,0.0000004345,0.05000,1.515 | |
| 15,mlp.gate_proj,0.0006246117,0.05000,2.696 | |
| 15,mlp.up_proj,0.0005259726,0.05000,2.704 | |
| 15,mlp.down_proj,0.0000011260,0.05000,5.745 | |
| 16,self_attn.k_proj,0.0001991889,0.05000,5.492 | |
| 16,self_attn.v_proj,0.0000615639,0.05000,5.508 | |
| 16,self_attn.q_proj,0.0004318745,0.05000,5.523 | |
| 16,self_attn.o_proj,0.0000005076,0.05000,1.503 | |
| 16,mlp.up_proj,0.0006129682,0.05000,2.751 | |
| 16,mlp.gate_proj,0.0007694462,0.05000,2.759 | |
| 16,mlp.down_proj,0.0000015809,0.05000,5.768 | |
| 17,self_attn.v_proj,0.0000590238,0.05000,5.789 | |
| 17,self_attn.k_proj,0.0001672252,0.05000,5.818 | |
| 17,self_attn.q_proj,0.0003993788,0.05000,5.828 | |
| 17,self_attn.o_proj,0.0000006334,0.05000,1.505 | |
| 17,mlp.up_proj,0.0007126845,0.05000,2.701 | |
| 17,mlp.gate_proj,0.0008941703,0.05000,2.715 | |
| 17,mlp.down_proj,0.0000021782,0.05000,5.786 | |
| 18,self_attn.v_proj,0.0000725807,0.05000,5.491 | |
| 18,self_attn.k_proj,0.0001988027,0.05000,5.544 | |
| 18,self_attn.q_proj,0.0005069916,0.05000,5.570 | |
| 18,self_attn.o_proj,0.0000005907,0.05000,1.536 | |
| 18,mlp.gate_proj,0.0010087889,0.05000,2.764 | |
| 18,mlp.up_proj,0.0008049888,0.05000,2.769 | |
| 18,mlp.down_proj,0.0000031469,0.05000,5.804 | |
| 19,self_attn.q_proj,0.0004640531,0.05000,5.718 | |
| 19,self_attn.k_proj,0.0001974665,0.05000,5.751 | |
| 19,self_attn.v_proj,0.0000839271,0.05000,5.758 | |
| 19,self_attn.o_proj,0.0000007363,0.05000,1.516 | |
| 19,mlp.up_proj,0.0008893232,0.05000,2.702 | |
| 19,mlp.gate_proj,0.0011344106,0.05000,2.704 | |
| 19,mlp.down_proj,0.0000041928,0.05000,5.776 | |
| 20,self_attn.v_proj,0.0000917941,0.05000,5.457 | |
| 20,self_attn.k_proj,0.0002024085,0.05000,5.464 | |
| 20,self_attn.q_proj,0.0004972993,0.05000,5.482 | |
| 20,self_attn.o_proj,0.0000006737,0.05000,1.525 | |
| 20,mlp.gate_proj,0.0012861970,0.05000,2.697 | |
| 20,mlp.up_proj,0.0009820292,0.05000,2.696 | |
| 20,mlp.down_proj,0.0000043654,0.05000,5.801 | |
| 21,self_attn.k_proj,0.0001981790,0.05000,5.710 | |
| 21,self_attn.v_proj,0.0000964703,0.05000,5.747 | |
| 21,self_attn.q_proj,0.0004897626,0.05000,5.770 | |
| 21,self_attn.o_proj,0.0000006938,0.05000,1.536 | |
| 21,mlp.gate_proj,0.0015099732,0.05000,2.692 | |
| 21,mlp.up_proj,0.0010752812,0.05000,2.708 | |
| 21,mlp.down_proj,0.0000044608,0.05000,5.819 | |
| 22,self_attn.v_proj,0.0000996507,0.05000,5.592 | |
| 22,self_attn.q_proj,0.0004715399,0.05000,5.642 | |
| 22,self_attn.k_proj,0.0001876980,0.05000,5.657 | |
| 22,self_attn.o_proj,0.0000004057,0.05000,1.512 | |
| 22,mlp.gate_proj,0.0016046927,0.05000,2.720 | |
| 22,mlp.up_proj,0.0011544167,0.05000,2.726 | |
| 22,mlp.down_proj,0.0000046066,0.05000,5.792 | |
| 23,self_attn.q_proj,0.0004739835,0.05000,5.550 | |
| 23,self_attn.k_proj,0.0001863427,0.05000,5.639 | |
| 23,self_attn.v_proj,0.0001045092,0.05000,5.656 | |
| 23,self_attn.o_proj,0.0000006813,0.05000,1.508 | |
| 23,mlp.up_proj,0.0012700862,0.05000,2.755 | |
| 23,mlp.gate_proj,0.0017711886,0.05000,2.766 | |
| 23,mlp.down_proj,0.0000051867,0.05000,5.805 | |
| 24,self_attn.q_proj,0.0005410001,0.05000,5.842 | |
| 24,self_attn.v_proj,0.0001214173,0.05000,5.883 | |
| 24,self_attn.k_proj,0.0002158198,0.05000,5.946 | |
| 24,self_attn.o_proj,0.0000006280,0.05000,1.501 | |
| 24,mlp.gate_proj,0.0019970989,0.05000,2.721 | |
| 24,mlp.up_proj,0.0014057605,0.05000,2.721 | |
| 24,mlp.down_proj,0.0000056286,0.05000,5.838 | |
| 25,self_attn.k_proj,0.0002077088,0.05000,5.659 | |
| 25,self_attn.v_proj,0.0001386532,0.05000,5.680 | |
| 25,self_attn.q_proj,0.0005421010,0.05000,5.690 | |
| 25,self_attn.o_proj,0.0000006926,0.05000,1.508 | |
| 25,mlp.gate_proj,0.0021648855,0.05000,2.806 | |
| 25,mlp.up_proj,0.0015368462,0.05000,2.807 | |
| 25,mlp.down_proj,0.0000063590,0.05000,5.777 | |
| 26,self_attn.q_proj,0.0005148287,0.05000,5.733 | |
| 26,self_attn.v_proj,0.0001467281,0.05000,5.761 | |
| 26,self_attn.k_proj,0.0001950796,0.05000,5.790 | |
| 26,self_attn.o_proj,0.0000009540,0.05000,1.512 | |
| 26,mlp.up_proj,0.0016700355,0.05000,2.757 | |
| 26,mlp.gate_proj,0.0022701313,0.05000,2.764 | |
| 26,mlp.down_proj,0.0000073036,0.05000,5.829 | |
| 27,self_attn.q_proj,0.0005313924,0.05000,5.597 | |
| 27,self_attn.k_proj,0.0001970788,0.05000,5.617 | |
| 27,self_attn.v_proj,0.0001329189,0.05000,5.631 | |
| 27,self_attn.o_proj,0.0000010856,0.05000,1.539 | |
| 27,mlp.gate_proj,0.0024865442,0.05000,2.738 | |
| 27,mlp.up_proj,0.0018403968,0.05000,2.737 | |
| 27,mlp.down_proj,0.0000087551,0.05000,5.844 | |
| 28,self_attn.k_proj,0.0001981637,0.05000,5.458 | |
| 28,self_attn.v_proj,0.0001949648,0.05000,5.500 | |
| 28,self_attn.q_proj,0.0005183223,0.05000,5.508 | |
| 28,self_attn.o_proj,0.0000016372,0.05000,1.530 | |
| 28,mlp.gate_proj,0.0026638827,0.05000,2.748 | |
| 28,mlp.up_proj,0.0020455004,0.05000,2.762 | |
| 28,mlp.down_proj,0.0000119281,0.05000,5.836 | |
| 29,self_attn.q_proj,0.0005931044,0.05000,5.728 | |
| 29,self_attn.k_proj,0.0001997706,0.05000,5.741 | |
| 29,self_attn.v_proj,0.0002828346,0.05000,5.767 | |
| 29,self_attn.o_proj,0.0000034553,0.05000,1.534 | |
| 29,mlp.up_proj,0.0020760434,0.05000,2.725 | |
| 29,mlp.gate_proj,0.0025936320,0.05000,2.729 | |
| 29,mlp.down_proj,0.0000151650,0.05000,5.807 | |
| 30,self_attn.v_proj,0.0003089608,0.05000,5.433 | |
| 30,self_attn.k_proj,0.0001842356,0.05000,5.482 | |
| 30,self_attn.q_proj,0.0005517652,0.05000,5.508 | |
| 30,self_attn.o_proj,0.0000030842,0.05000,1.513 | |
| 30,mlp.up_proj,0.0021368292,0.05000,2.743 | |
| 30,mlp.gate_proj,0.0026252946,0.05000,2.751 | |
| 30,mlp.down_proj,0.0000199158,0.05000,5.768 | |
| 31,self_attn.k_proj,0.0001757457,0.05000,5.804 | |
| 31,self_attn.v_proj,0.0003163291,0.05000,5.898 | |
| 31,self_attn.q_proj,0.0005140052,0.05000,5.915 | |
| 31,self_attn.o_proj,0.0000041636,0.05000,1.517 | |
| 31,mlp.gate_proj,0.0022865063,0.05000,2.720 | |
| 31,mlp.up_proj,0.0018066571,0.05000,2.729 | |
| 31,mlp.down_proj,0.0000333210,0.05000,5.901 | |