| layer,module,loss,damp,time | |
| 0,self_attn.k_proj,0.0000000045,0.05000,4.840 | |
| 0,self_attn.v_proj,0.0000000004,0.05000,5.288 | |
| 0,self_attn.q_proj,0.0000000150,0.05000,5.068 | |
| 0,self_attn.o_proj,0.0000000000,0.05000,1.513 | |
| 0,mlp.up_proj,0.0000000142,0.05000,2.825 | |
| 0,mlp.gate_proj,0.0000000164,0.05000,2.834 | |
| 0,mlp.down_proj,0.0000000000,0.05000,5.910 | |
| 1,self_attn.q_proj,0.0000000452,0.05000,4.740 | |
| 1,self_attn.k_proj,0.0000000208,0.05000,4.753 | |
| 1,self_attn.v_proj,0.0000000034,0.05000,4.794 | |
| 1,self_attn.o_proj,0.0000000000,0.05000,1.628 | |
| 1,mlp.up_proj,0.0000000480,0.05000,2.837 | |
| 1,mlp.gate_proj,0.0000000548,0.05000,2.865 | |
| 1,mlp.down_proj,0.0000000073,0.05000,5.963 | |
| 2,self_attn.k_proj,0.0000001725,0.05000,4.514 | |
| 2,self_attn.q_proj,0.0000003553,0.05000,4.526 | |
| 2,self_attn.v_proj,0.0000000225,0.05000,4.536 | |
| 2,self_attn.o_proj,0.0000000000,0.05000,2.101 | |
| 2,mlp.up_proj,0.0000001006,0.05000,2.791 | |
| 2,mlp.gate_proj,0.0000001153,0.05000,2.805 | |
| 2,mlp.down_proj,0.0000000000,0.05000,5.912 | |
| 3,self_attn.v_proj,0.0000000155,0.05000,4.692 | |
| 3,self_attn.q_proj,0.0000001928,0.05000,4.718 | |
| 3,self_attn.k_proj,0.0000000937,0.05000,4.730 | |
| 3,self_attn.o_proj,0.0000000000,0.05000,1.556 | |
| 3,mlp.gate_proj,0.0000001922,0.05000,2.877 | |
| 3,mlp.up_proj,0.0000001660,0.05000,2.891 | |
| 3,mlp.down_proj,0.0000000001,0.05000,5.870 | |
| 4,self_attn.k_proj,0.0000001324,0.05000,4.821 | |
| 4,self_attn.q_proj,0.0000003002,0.05000,4.843 | |
| 4,self_attn.v_proj,0.0000000261,0.05000,4.850 | |
| 4,self_attn.o_proj,0.0000000000,0.05000,1.527 | |
| 4,mlp.gate_proj,0.0000002774,0.05000,2.827 | |
| 4,mlp.up_proj,0.0000002246,0.05000,2.837 | |
| 4,mlp.down_proj,0.0000000001,0.05000,5.955 | |
| 5,self_attn.k_proj,0.0000001730,0.05000,4.897 | |
| 5,self_attn.v_proj,0.0000000291,0.05000,4.904 | |
| 5,self_attn.q_proj,0.0000003899,0.05000,4.909 | |
| 5,self_attn.o_proj,0.0000000001,0.05000,1.577 | |
| 5,mlp.up_proj,0.0000002912,0.05000,2.816 | |
| 5,mlp.gate_proj,0.0000003836,0.05000,2.831 | |
| 5,mlp.down_proj,0.0000000003,0.05000,5.922 | |
| 6,self_attn.q_proj,0.0000003636,0.05000,4.775 | |
| 6,self_attn.k_proj,0.0000001706,0.05000,4.862 | |
| 6,self_attn.v_proj,0.0000000294,0.05000,4.873 | |
| 6,self_attn.o_proj,0.0000000001,0.05000,1.533 | |
| 6,mlp.up_proj,0.0000003460,0.05000,2.797 | |
| 6,mlp.gate_proj,0.0000004451,0.05000,2.797 | |
| 6,mlp.down_proj,0.0000000004,0.05000,5.935 | |
| 7,self_attn.v_proj,0.0000000391,0.05000,4.774 | |
| 7,self_attn.q_proj,0.0000004503,0.05000,4.793 | |
| 7,self_attn.k_proj,0.0000002152,0.05000,4.811 | |
| 7,self_attn.o_proj,0.0000000001,0.05000,1.568 | |
| 7,mlp.up_proj,0.0000004005,0.05000,2.814 | |
| 7,mlp.gate_proj,0.0000005274,0.05000,2.818 | |
| 7,mlp.down_proj,0.0000000005,0.05000,5.941 | |
| 8,self_attn.k_proj,0.0000001697,0.05000,4.593 | |
| 8,self_attn.q_proj,0.0000003730,0.05000,4.593 | |
| 8,self_attn.v_proj,0.0000000364,0.05000,4.615 | |
| 8,self_attn.o_proj,0.0000000002,0.05000,1.552 | |
| 8,mlp.gate_proj,0.0000005689,0.05000,2.832 | |
| 8,mlp.up_proj,0.0000004404,0.05000,2.842 | |
| 8,mlp.down_proj,0.0000000005,0.05000,5.915 | |
| 9,self_attn.q_proj,0.0000005147,0.05000,4.651 | |
| 9,self_attn.v_proj,0.0000000435,0.05000,4.676 | |
| 9,self_attn.k_proj,0.0000002410,0.05000,4.684 | |
| 9,self_attn.o_proj,0.0000000002,0.05000,1.546 | |
| 9,mlp.gate_proj,0.0000005988,0.05000,2.826 | |
| 9,mlp.up_proj,0.0000004793,0.05000,2.834 | |
| 9,mlp.down_proj,0.0000000007,0.05000,5.961 | |
| 10,self_attn.k_proj,0.0000002164,0.05000,4.770 | |
| 10,self_attn.q_proj,0.0000004548,0.05000,4.779 | |
| 10,self_attn.v_proj,0.0000000379,0.05000,4.786 | |
| 10,self_attn.o_proj,0.0000000003,0.05000,1.531 | |
| 10,mlp.gate_proj,0.0000006227,0.05000,2.837 | |
| 10,mlp.up_proj,0.0000005106,0.05000,2.848 | |
| 10,mlp.down_proj,0.0000000008,0.05000,5.918 | |
| 11,self_attn.k_proj,0.0000002533,0.05000,4.929 | |
| 11,self_attn.q_proj,0.0000005502,0.05000,5.001 | |
| 11,self_attn.v_proj,0.0000000559,0.05000,5.031 | |
| 11,self_attn.o_proj,0.0000000004,0.05000,1.540 | |
| 11,mlp.gate_proj,0.0000006790,0.05000,2.822 | |
| 11,mlp.up_proj,0.0000005648,0.05000,2.831 | |
| 11,mlp.down_proj,0.0000000009,0.05000,5.917 | |
| 12,self_attn.q_proj,0.0000007278,0.05000,4.785 | |
| 12,self_attn.v_proj,0.0000000635,0.05000,4.804 | |
| 12,self_attn.k_proj,0.0000003287,0.05000,4.831 | |
| 12,self_attn.o_proj,0.0000000004,0.05000,1.534 | |
| 12,mlp.gate_proj,0.0000007479,0.05000,2.831 | |
| 12,mlp.up_proj,0.0000006364,0.05000,2.836 | |
| 12,mlp.down_proj,0.0000000011,0.05000,5.979 | |
| 13,self_attn.k_proj,0.0000002807,0.05000,4.666 | |
| 13,self_attn.q_proj,0.0000005740,0.05000,4.694 | |
| 13,self_attn.v_proj,0.0000000607,0.05000,4.704 | |
| 13,self_attn.o_proj,0.0000000006,0.05000,1.560 | |
| 13,mlp.gate_proj,0.0000008370,0.05000,2.828 | |
| 13,mlp.up_proj,0.0000007320,0.05000,2.845 | |
| 13,mlp.down_proj,0.0000000013,0.05000,5.919 | |
| 14,self_attn.q_proj,0.0000006548,0.05000,4.817 | |
| 14,self_attn.v_proj,0.0000000978,0.05000,4.860 | |
| 14,self_attn.k_proj,0.0000002809,0.05000,4.864 | |
| 14,self_attn.o_proj,0.0000000007,0.05000,1.548 | |
| 14,mlp.gate_proj,0.0000009377,0.05000,2.863 | |
| 14,mlp.up_proj,0.0000008157,0.05000,2.875 | |
| 14,mlp.down_proj,0.0000000017,0.05000,5.917 | |
| 15,self_attn.k_proj,0.0000003675,0.05000,4.802 | |
| 15,self_attn.v_proj,0.0000001112,0.05000,4.832 | |
| 15,self_attn.q_proj,0.0000008244,0.05000,4.842 | |
| 15,self_attn.o_proj,0.0000000008,0.05000,1.565 | |
| 15,mlp.gate_proj,0.0000010717,0.05000,2.820 | |
| 15,mlp.up_proj,0.0000009010,0.05000,2.821 | |
| 15,mlp.down_proj,0.0000000022,0.05000,5.900 | |
| 16,self_attn.k_proj,0.0000003414,0.05000,4.800 | |
| 16,self_attn.q_proj,0.0000007387,0.05000,4.826 | |
| 16,self_attn.v_proj,0.0000001060,0.05000,4.831 | |
| 16,self_attn.o_proj,0.0000000009,0.05000,1.555 | |
| 16,mlp.up_proj,0.0000010571,0.05000,2.796 | |
| 16,mlp.gate_proj,0.0000013285,0.05000,2.804 | |
| 16,mlp.down_proj,0.0000000031,0.05000,5.935 | |
| 17,self_attn.v_proj,0.0000001007,0.05000,4.906 | |
| 17,self_attn.k_proj,0.0000002850,0.05000,4.927 | |
| 17,self_attn.q_proj,0.0000006805,0.05000,4.970 | |
| 17,self_attn.o_proj,0.0000000011,0.05000,1.555 | |
| 17,mlp.up_proj,0.0000012283,0.05000,2.795 | |
| 17,mlp.gate_proj,0.0000015413,0.05000,2.803 | |
| 17,mlp.down_proj,0.0000000043,0.05000,5.859 | |
| 18,self_attn.v_proj,0.0000001238,0.05000,4.658 | |
| 18,self_attn.k_proj,0.0000003386,0.05000,4.669 | |
| 18,self_attn.q_proj,0.0000008637,0.05000,4.682 | |
| 18,self_attn.o_proj,0.0000000011,0.05000,1.535 | |
| 18,mlp.up_proj,0.0000013842,0.05000,2.782 | |
| 18,mlp.gate_proj,0.0000017367,0.05000,2.792 | |
| 18,mlp.down_proj,0.0000000061,0.05000,5.917 | |
| 19,self_attn.k_proj,0.0000003408,0.05000,4.715 | |
| 19,self_attn.q_proj,0.0000007988,0.05000,4.776 | |
| 19,self_attn.v_proj,0.0000001450,0.05000,4.783 | |
| 19,self_attn.o_proj,0.0000000013,0.05000,1.550 | |
| 19,mlp.up_proj,0.0000015377,0.05000,2.835 | |
| 19,mlp.gate_proj,0.0000019642,0.05000,2.851 | |
| 19,mlp.down_proj,0.0000000081,0.05000,5.902 | |
| 20,self_attn.v_proj,0.0000460283,0.05000,4.815 | |
| 20,self_attn.q_proj,0.0002501937,0.05000,4.853 | |
| 20,self_attn.k_proj,0.0001023333,0.05000,4.865 | |
| 20,self_attn.o_proj,0.0000003618,0.05000,1.536 | |
| 20,mlp.up_proj,0.0004975359,0.05000,2.848 | |
| 20,mlp.gate_proj,0.0006521194,0.05000,2.854 | |
| 20,mlp.down_proj,0.0000025065,0.05000,5.928 | |
| 21,self_attn.k_proj,0.0001006711,0.05000,4.614 | |
| 21,self_attn.v_proj,0.0000486894,0.05000,4.634 | |
| 21,self_attn.q_proj,0.0002477611,0.05000,4.647 | |
| 21,self_attn.o_proj,0.0000003476,0.05000,1.568 | |
| 21,mlp.gate_proj,0.0007708430,0.05000,2.823 | |
| 21,mlp.up_proj,0.0005485023,0.05000,2.831 | |
| 21,mlp.down_proj,0.0000025757,0.05000,5.958 | |
| 22,self_attn.v_proj,0.0000507348,0.05000,4.733 | |
| 22,self_attn.q_proj,0.0002405264,0.05000,4.754 | |
| 22,self_attn.k_proj,0.0000960108,0.05000,4.761 | |
| 22,self_attn.o_proj,0.0000002108,0.05000,1.536 | |
| 22,mlp.up_proj,0.0005943207,0.05000,2.806 | |
| 22,mlp.gate_proj,0.0008269122,0.05000,2.810 | |
| 22,mlp.down_proj,0.0000027136,0.05000,5.895 | |
| 23,self_attn.k_proj,0.0000954055,0.05000,4.678 | |
| 23,self_attn.q_proj,0.0002420283,0.05000,4.711 | |
| 23,self_attn.v_proj,0.0000532537,0.05000,4.729 | |
| 23,self_attn.o_proj,0.0000003501,0.05000,1.521 | |
| 23,mlp.up_proj,0.0006547531,0.05000,2.851 | |
| 23,mlp.gate_proj,0.0009137075,0.05000,2.879 | |
| 23,mlp.down_proj,0.0000030363,0.05000,5.912 | |
| 24,self_attn.v_proj,0.0000622052,0.05000,4.498 | |
| 24,self_attn.k_proj,0.0001111750,0.05000,4.528 | |
| 24,self_attn.q_proj,0.0002778825,0.05000,4.554 | |
| 24,self_attn.o_proj,0.0000003277,0.05000,1.578 | |
| 24,mlp.up_proj,0.0007254657,0.05000,2.841 | |
| 24,mlp.gate_proj,0.0010315949,0.05000,2.861 | |
| 24,mlp.down_proj,0.0000033368,0.05000,5.904 | |
| 25,self_attn.v_proj,0.0000711914,0.05000,4.562 | |
| 25,self_attn.k_proj,0.0001072556,0.05000,4.586 | |
| 25,self_attn.q_proj,0.0002790395,0.05000,4.612 | |
| 25,self_attn.o_proj,0.0000003792,0.05000,1.566 | |
| 25,mlp.gate_proj,0.0011210348,0.05000,2.902 | |
| 25,mlp.up_proj,0.0007955477,0.05000,2.907 | |
| 25,mlp.down_proj,0.0000038278,0.05000,5.972 | |
| 26,self_attn.v_proj,0.0000751634,0.05000,4.598 | |
| 26,self_attn.k_proj,0.0001005206,0.05000,4.633 | |
| 26,self_attn.q_proj,0.0002639526,0.05000,4.640 | |
| 26,self_attn.o_proj,0.0000004955,0.05000,1.556 | |
| 26,mlp.up_proj,0.0008637970,0.05000,2.815 | |
| 26,mlp.gate_proj,0.0011751253,0.05000,2.820 | |
| 26,mlp.down_proj,0.0000043847,0.05000,5.919 | |
| 27,self_attn.v_proj,0.0000680719,0.05000,4.600 | |
| 27,self_attn.k_proj,0.0001012717,0.05000,4.649 | |
| 27,self_attn.q_proj,0.0002717224,0.05000,4.657 | |
| 27,self_attn.o_proj,0.0000005582,0.05000,1.540 | |
| 27,mlp.gate_proj,0.0012836707,0.05000,2.818 | |
| 27,mlp.up_proj,0.0009500155,0.05000,2.832 | |
| 27,mlp.down_proj,0.0000051473,0.05000,5.936 | |
| 28,self_attn.q_proj,0.0002645630,0.05000,4.639 | |
| 28,self_attn.k_proj,0.0001015999,0.05000,4.661 | |
| 28,self_attn.v_proj,0.0000992078,0.05000,4.686 | |
| 28,self_attn.o_proj,0.0000008682,0.05000,1.564 | |
| 28,mlp.gate_proj,0.0013713280,0.05000,2.813 | |
| 28,mlp.up_proj,0.0010524418,0.05000,2.818 | |
| 28,mlp.down_proj,0.0000069629,0.05000,5.921 | |
| 29,self_attn.v_proj,0.0001436985,0.05000,4.504 | |
| 29,self_attn.k_proj,0.0001024819,0.05000,4.512 | |
| 29,self_attn.q_proj,0.0003024004,0.05000,4.519 | |
| 29,self_attn.o_proj,0.0000018162,0.05000,1.541 | |
| 29,mlp.gate_proj,0.0013321182,0.05000,2.801 | |
| 29,mlp.up_proj,0.0010659065,0.05000,2.823 | |
| 29,mlp.down_proj,0.0000087815,0.05000,5.863 | |
| 30,self_attn.v_proj,0.0000005463,0.05000,4.492 | |
| 30,self_attn.k_proj,0.0000003260,0.05000,4.527 | |
| 30,self_attn.q_proj,0.0000009703,0.05000,4.532 | |
| 30,self_attn.o_proj,0.0000000055,0.05000,1.522 | |
| 30,mlp.gate_proj,0.0000046290,0.05000,2.849 | |
| 30,mlp.up_proj,0.0000037689,0.05000,2.855 | |
| 30,mlp.down_proj,0.0000000387,0.05000,5.934 | |
| 31,self_attn.k_proj,0.0000003091,0.05000,4.778 | |
| 31,self_attn.q_proj,0.0000009006,0.05000,4.797 | |
| 31,self_attn.v_proj,0.0000005541,0.05000,4.808 | |
| 31,self_attn.o_proj,0.0000000074,0.05000,1.543 | |
| 31,mlp.up_proj,0.0000029935,0.05000,2.817 | |
| 31,mlp.gate_proj,0.0000037887,0.05000,2.823 | |
| 31,mlp.down_proj,0.0000000543,0.05000,5.876 | |