| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000000045,0.05000,4.425 | |
| 0,self_attn.v_proj,0.0000000004,0.05000,4.681 | |
| 0,self_attn.q_proj,0.0000000150,0.05000,4.512 | |
| 0,self_attn.o_proj,0.0000000000,0.05000,1.517 | |
| 0,mlp.gate_proj,0.0000000164,0.05000,2.821 | |
| 0,mlp.up_proj,0.0000000142,0.05000,2.833 | |
| 0,mlp.down_proj,0.0000000000,0.05000,5.894 | |
| 1,self_attn.k_proj,0.0000000208,0.05000,4.715 | |
| 1,self_attn.v_proj,0.0000000034,0.05000,4.756 | |
| 1,self_attn.q_proj,0.0000000452,0.05000,4.779 | |
| 1,self_attn.o_proj,0.0000000000,0.05000,1.556 | |
| 1,mlp.up_proj,0.0000000480,0.05000,2.849 | |
| 1,mlp.gate_proj,0.0000000548,0.05000,2.858 | |
| 1,mlp.down_proj,0.0000000073,0.05000,5.973 | |
| 2,self_attn.v_proj,0.0000000225,0.05000,4.851 | |
| 2,self_attn.q_proj,0.0000003553,0.05000,4.918 | |
| 2,self_attn.k_proj,0.0000001725,0.05000,4.924 | |
| 2,self_attn.o_proj,0.0000000000,0.05000,1.544 | |
| 2,mlp.gate_proj,0.0000001153,0.05000,2.867 | |
| 2,mlp.up_proj,0.0000001006,0.05000,2.888 | |
| 2,mlp.down_proj,0.0000000000,0.05000,5.934 | |
| 3,self_attn.k_proj,0.0000000937,0.05000,4.973 | |
| 3,self_attn.v_proj,0.0000000155,0.05000,4.993 | |
| 3,self_attn.q_proj,0.0000001928,0.05000,5.032 | |
| 3,self_attn.o_proj,0.0000000000,0.05000,1.556 | |
| 3,mlp.up_proj,0.0000001660,0.05000,2.836 | |
| 3,mlp.gate_proj,0.0000001922,0.05000,2.846 | |
| 3,mlp.down_proj,0.0000000001,0.05000,5.986 | |
| 4,self_attn.k_proj,0.0000001324,0.05000,4.754 | |
| 4,self_attn.v_proj,0.0000000261,0.05000,4.777 | |
| 4,self_attn.q_proj,0.0000003002,0.05000,4.790 | |
| 4,self_attn.o_proj,0.0000000000,0.05000,1.549 | |
| 4,mlp.up_proj,0.0000002246,0.05000,2.851 | |
| 4,mlp.gate_proj,0.0000002774,0.05000,2.855 | |
| 4,mlp.down_proj,0.0000000001,0.05000,5.973 | |
| 5,self_attn.v_proj,0.0000000291,0.05000,4.803 | |
| 5,self_attn.k_proj,0.0000001730,0.05000,4.830 | |
| 5,self_attn.q_proj,0.0000003899,0.05000,4.837 | |
| 5,self_attn.o_proj,0.0000000001,0.05000,1.534 | |
| 5,mlp.up_proj,0.0000002912,0.05000,2.847 | |
| 5,mlp.gate_proj,0.0000003836,0.05000,2.857 | |
| 5,mlp.down_proj,0.0000000003,0.05000,5.888 | |
| 6,self_attn.v_proj,0.0000000294,0.05000,4.935 | |
| 6,self_attn.k_proj,0.0000001706,0.05000,4.948 | |
| 6,self_attn.q_proj,0.0000003636,0.05000,4.953 | |
| 6,self_attn.o_proj,0.0000000001,0.05000,1.521 | |
| 6,mlp.gate_proj,0.0000004451,0.05000,2.825 | |
| 6,mlp.up_proj,0.0000003460,0.05000,2.831 | |
| 6,mlp.down_proj,0.0000000004,0.05000,5.921 | |
| 7,self_attn.k_proj,0.0000002152,0.05000,4.900 | |
| 7,self_attn.q_proj,0.0000004503,0.05000,5.002 | |
| 7,self_attn.v_proj,0.0000000391,0.05000,5.020 | |
| 7,self_attn.o_proj,0.0000000001,0.05000,1.543 | |
| 7,mlp.up_proj,0.0000004005,0.05000,2.853 | |
| 7,mlp.gate_proj,0.0000005274,0.05000,2.873 | |
| 7,mlp.down_proj,0.0000000005,0.05000,5.870 | |
| 8,self_attn.k_proj,0.0000001697,0.05000,4.837 | |
| 8,self_attn.q_proj,0.0000003730,0.05000,4.889 | |
| 8,self_attn.v_proj,0.0000000364,0.05000,4.901 | |
| 8,self_attn.o_proj,0.0000000002,0.05000,1.528 | |
| 8,mlp.gate_proj,0.0000005689,0.05000,2.820 | |
| 8,mlp.up_proj,0.0000004404,0.05000,2.836 | |
| 8,mlp.down_proj,0.0000000005,0.05000,5.891 | |
| 9,self_attn.k_proj,0.0000002410,0.05000,4.779 | |
| 9,self_attn.v_proj,0.0000000435,0.05000,4.831 | |
| 9,self_attn.q_proj,0.0000005147,0.05000,4.858 | |
| 9,self_attn.o_proj,0.0000000002,0.05000,1.537 | |
| 9,mlp.up_proj,0.0000004793,0.05000,2.900 | |
| 9,mlp.gate_proj,0.0000005988,0.05000,2.916 | |
| 9,mlp.down_proj,0.0000000007,0.05000,5.878 | |
| 10,self_attn.v_proj,0.0000000379,0.05000,4.766 | |
| 10,self_attn.k_proj,0.0000002164,0.05000,4.832 | |
| 10,self_attn.q_proj,0.0000004548,0.05000,4.858 | |
| 10,self_attn.o_proj,0.0000000003,0.05000,1.525 | |
| 10,mlp.gate_proj,0.0000006227,0.05000,2.869 | |
| 10,mlp.up_proj,0.0000005106,0.05000,2.868 | |
| 10,mlp.down_proj,0.0000000008,0.05000,5.864 | |
| 11,self_attn.v_proj,0.0000000559,0.05000,4.834 | |
| 11,self_attn.k_proj,0.0000002533,0.05000,4.841 | |
| 11,self_attn.q_proj,0.0000005502,0.05000,4.852 | |
| 11,self_attn.o_proj,0.0000000004,0.05000,1.523 | |
| 11,mlp.up_proj,0.0000005648,0.05000,2.887 | |
| 11,mlp.gate_proj,0.0000006790,0.05000,2.893 | |
| 11,mlp.down_proj,0.0000000009,0.05000,5.876 | |
| 12,self_attn.v_proj,0.0000000635,0.05000,4.901 | |
| 12,self_attn.q_proj,0.0000007278,0.05000,4.935 | |
| 12,self_attn.k_proj,0.0000003287,0.05000,4.943 | |
| 12,self_attn.o_proj,0.0000000004,0.05000,1.547 | |
| 12,mlp.gate_proj,0.0000007479,0.05000,2.852 | |
| 12,mlp.up_proj,0.0000006364,0.05000,2.878 | |
| 12,mlp.down_proj,0.0000000011,0.05000,5.910 | |
| 13,self_attn.v_proj,0.0000000607,0.05000,4.963 | |
| 13,self_attn.k_proj,0.0000002807,0.05000,5.071 | |
| 13,self_attn.q_proj,0.0000005740,0.05000,5.114 | |
| 13,self_attn.o_proj,0.0000000006,0.05000,1.540 | |
| 13,mlp.up_proj,0.0000007320,0.05000,2.818 | |
| 13,mlp.gate_proj,0.0000008370,0.05000,2.828 | |
| 13,mlp.down_proj,0.0000000013,0.05000,5.928 | |
| 14,self_attn.v_proj,0.0000000978,0.05000,4.684 | |
| 14,self_attn.k_proj,0.0000002809,0.05000,4.698 | |
| 14,self_attn.q_proj,0.0000006548,0.05000,4.701 | |
| 14,self_attn.o_proj,0.0000000007,0.05000,1.589 | |
| 14,mlp.gate_proj,0.0000009377,0.05000,2.761 | |
| 14,mlp.up_proj,0.0000008157,0.05000,2.767 | |
| 14,mlp.down_proj,0.0000000017,0.05000,5.905 | |
| 15,self_attn.q_proj,0.0000008244,0.05000,4.845 | |
| 15,self_attn.k_proj,0.0000003675,0.05000,4.857 | |
| 15,self_attn.v_proj,0.0000001112,0.05000,4.876 | |
| 15,self_attn.o_proj,0.0000000008,0.05000,1.547 | |
| 15,mlp.up_proj,0.0000009010,0.05000,2.888 | |
| 15,mlp.gate_proj,0.0000010717,0.05000,2.894 | |
| 15,mlp.down_proj,0.0000000022,0.05000,5.838 | |
| 16,self_attn.q_proj,0.0000007387,0.05000,4.792 | |
| 16,self_attn.k_proj,0.0000003414,0.05000,4.793 | |
| 16,self_attn.v_proj,0.0000001060,0.05000,4.807 | |
| 16,self_attn.o_proj,0.0000000009,0.05000,1.543 | |
| 16,mlp.gate_proj,0.0000013285,0.05000,2.857 | |
| 16,mlp.up_proj,0.0000010571,0.05000,2.870 | |
| 16,mlp.down_proj,0.0000000031,0.05000,5.940 | |
| 17,self_attn.v_proj,0.0000001007,0.05000,4.856 | |
| 17,self_attn.k_proj,0.0000002850,0.05000,4.927 | |
| 17,self_attn.q_proj,0.0000006805,0.05000,4.947 | |
| 17,self_attn.o_proj,0.0000000011,0.05000,1.536 | |
| 17,mlp.up_proj,0.0000012283,0.05000,2.818 | |
| 17,mlp.gate_proj,0.0000015413,0.05000,2.826 | |
| 17,mlp.down_proj,0.0000000043,0.05000,5.896 | |
| 18,self_attn.v_proj,0.0000001238,0.05000,4.909 | |
| 18,self_attn.k_proj,0.0000003386,0.05000,4.934 | |
| 18,self_attn.q_proj,0.0000008637,0.05000,4.940 | |
| 18,self_attn.o_proj,0.0000000011,0.05000,1.552 | |
| 18,mlp.gate_proj,0.0000017367,0.05000,2.819 | |
| 18,mlp.up_proj,0.0000013842,0.05000,2.828 | |
| 18,mlp.down_proj,0.0000000061,0.05000,5.913 | |
| 19,self_attn.k_proj,0.0000003408,0.05000,4.792 | |
| 19,self_attn.v_proj,0.0000001450,0.05000,4.812 | |
| 19,self_attn.q_proj,0.0000007988,0.05000,4.818 | |
| 19,self_attn.o_proj,0.0000000013,0.05000,1.585 | |
| 19,mlp.up_proj,0.0000015377,0.05000,2.836 | |
| 19,mlp.gate_proj,0.0000019642,0.05000,2.841 | |
| 19,mlp.down_proj,0.0000000081,0.05000,5.875 | |
| 20,self_attn.k_proj,0.0001023333,0.05000,4.825 | |
| 20,self_attn.q_proj,0.0002501937,0.05000,4.835 | |
| 20,self_attn.v_proj,0.0000460283,0.05000,4.843 | |
| 20,self_attn.o_proj,0.0000003618,0.05000,1.527 | |
| 20,mlp.gate_proj,0.0006521194,0.05000,2.855 | |
| 20,mlp.up_proj,0.0004975359,0.05000,2.866 | |
| 20,mlp.down_proj,0.0000025065,0.05000,5.920 | |
| 21,self_attn.v_proj,0.0000001681,0.05000,4.679 | |
| 21,self_attn.k_proj,0.0000003462,0.05000,4.699 | |
| 21,self_attn.q_proj,0.0000008533,0.05000,4.729 | |
| 21,self_attn.o_proj,0.0000000012,0.05000,1.538 | |
| 21,mlp.gate_proj,0.0000026566,0.05000,2.859 | |
| 21,mlp.up_proj,0.0000018903,0.05000,2.859 | |
| 21,mlp.down_proj,0.0000000088,0.05000,5.901 | |
| 22,self_attn.v_proj,0.0000001750,0.05000,4.938 | |
| 22,self_attn.k_proj,0.0000003291,0.05000,5.021 | |
| 22,self_attn.q_proj,0.0000008261,0.05000,5.033 | |
| 22,self_attn.o_proj,0.0000000007,0.05000,1.538 | |
| 22,mlp.gate_proj,0.0000028447,0.05000,2.773 | |
| 22,mlp.up_proj,0.0000020450,0.05000,2.780 | |
| 22,mlp.down_proj,0.0000000093,0.05000,5.958 | |
| 23,self_attn.q_proj,0.0002417441,0.05000,4.984 | |
| 23,self_attn.k_proj,0.0000953232,0.05000,5.046 | |
| 23,self_attn.v_proj,0.0000531522,0.05000,5.053 | |
| 23,self_attn.o_proj,0.0000003526,0.05000,1.563 | |
| 23,mlp.up_proj,0.0006533562,0.05000,2.885 | |
| 23,mlp.gate_proj,0.0009118593,0.05000,2.905 | |
| 23,mlp.down_proj,0.0000030385,0.05000,6.019 | |
| 24,self_attn.k_proj,0.0001111512,0.05000,4.693 | |
| 24,self_attn.q_proj,0.0002774746,0.05000,4.699 | |
| 24,self_attn.v_proj,0.0000621167,0.05000,4.709 | |
| 24,self_attn.o_proj,0.0000003281,0.05000,1.552 | |
| 24,mlp.up_proj,0.0007241608,0.05000,2.855 | |
| 24,mlp.gate_proj,0.0010297146,0.05000,2.854 | |
| 24,mlp.down_proj,0.0000033343,0.05000,5.911 | |
| 25,self_attn.v_proj,0.0000711168,0.05000,4.587 | |
| 25,self_attn.k_proj,0.0001070380,0.05000,4.607 | |
| 25,self_attn.q_proj,0.0002784348,0.05000,4.614 | |
| 25,self_attn.o_proj,0.0000003775,0.05000,1.546 | |
| 25,mlp.gate_proj,0.0011190466,0.05000,2.868 | |
| 25,mlp.up_proj,0.0007940060,0.05000,2.875 | |
| 25,mlp.down_proj,0.0000038247,0.05000,5.850 | |
| 26,self_attn.v_proj,0.0000750327,0.05000,4.572 | |
| 26,self_attn.k_proj,0.0001003102,0.05000,4.604 | |
| 26,self_attn.q_proj,0.0002635715,0.05000,4.633 | |
| 26,self_attn.o_proj,0.0000004931,0.05000,1.531 | |
| 26,mlp.up_proj,0.0008625213,0.05000,2.902 | |
| 26,mlp.gate_proj,0.0011732855,0.05000,2.912 | |
| 26,mlp.down_proj,0.0000043874,0.05000,5.909 | |
| 27,self_attn.k_proj,0.0001011328,0.05000,4.689 | |
| 27,self_attn.q_proj,0.0002715807,0.05000,4.734 | |
| 27,self_attn.v_proj,0.0000679950,0.05000,4.742 | |
| 27,self_attn.o_proj,0.0000005592,0.05000,1.525 | |
| 27,mlp.up_proj,0.0009492542,0.05000,2.856 | |
| 27,mlp.gate_proj,0.0012830498,0.05000,2.880 | |
| 27,mlp.down_proj,0.0000051588,0.05000,5.885 | |
| 28,self_attn.v_proj,0.0000991559,0.05000,4.726 | |
| 28,self_attn.q_proj,0.0002645180,0.05000,4.752 | |
| 28,self_attn.k_proj,0.0001015245,0.05000,4.773 | |
| 28,self_attn.o_proj,0.0000008684,0.05000,1.541 | |
| 28,mlp.gate_proj,0.0013707465,0.05000,2.855 | |
| 28,mlp.up_proj,0.0010521358,0.05000,2.867 | |
| 28,mlp.down_proj,0.0000069794,0.05000,5.925 | |
| 29,self_attn.v_proj,0.0001437969,0.05000,4.577 | |
| 29,self_attn.k_proj,0.0001024157,0.05000,4.606 | |
| 29,self_attn.q_proj,0.0003022972,0.05000,4.619 | |
| 29,self_attn.o_proj,0.0000018183,0.05000,1.548 | |
| 29,mlp.gate_proj,0.0013315470,0.05000,2.857 | |
| 29,mlp.up_proj,0.0010652888,0.05000,2.869 | |
| 29,mlp.down_proj,0.0000088039,0.05000,5.885 | |
| 30,self_attn.v_proj,0.0000005459,0.05000,4.485 | |
| 30,self_attn.k_proj,0.0000003257,0.05000,4.520 | |
| 30,self_attn.q_proj,0.0000009694,0.05000,4.527 | |
| 30,self_attn.o_proj,0.0000000056,0.05000,1.534 | |
| 30,mlp.up_proj,0.0000037660,0.05000,2.806 | |
| 30,mlp.gate_proj,0.0000046258,0.05000,2.810 | |
| 30,mlp.down_proj,0.0000000387,0.05000,5.990 | |
| 31,self_attn.k_proj,0.0000003086,0.05000,4.720 | |
| 31,self_attn.v_proj,0.0000005535,0.05000,4.749 | |
| 31,self_attn.q_proj,0.0000008998,0.05000,4.763 | |
| 31,self_attn.o_proj,0.0000000074,0.05000,1.537 | |
| 31,mlp.gate_proj,0.0000037957,0.05000,2.888 | |
| 31,mlp.up_proj,0.0000029992,0.05000,2.888 | |
| 31,mlp.down_proj,0.0000000545,0.05000,5.847 | |