| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000059439,0.05000,1.523 | |
| 0,self_attn.v_proj,0.0000039075,0.05000,1.012 | |
| 0,self_attn.q_proj,0.0000238143,0.05000,1.021 | |
| 0,self_attn.o_proj,0.0000220391,0.05000,1.315 | |
| 0,mlp.up_proj,0.0000110815,0.05000,1.442 | |
| 0,mlp.gate_proj,0.0000113717,0.05000,1.044 | |
| 0,mlp.down_proj,0.0000151834,0.05000,3.415 | |
| 1,self_attn.k_proj,0.0000059126,0.05000,1.041 | |
| 1,self_attn.v_proj,0.0000043126,0.05000,1.004 | |
| 1,self_attn.q_proj,0.0000232026,0.05000,1.020 | |
| 1,self_attn.o_proj,0.0000089596,0.05000,1.041 | |
| 1,mlp.up_proj,0.0000111797,0.05000,1.065 | |
| 1,mlp.gate_proj,0.0000114342,0.05000,1.035 | |
| 1,mlp.down_proj,0.0000064124,0.05000,2.654 | |
| 2,self_attn.k_proj,0.0000052098,0.05000,1.045 | |
| 2,self_attn.v_proj,0.0000036584,0.05000,1.010 | |
| 2,self_attn.q_proj,0.0000192775,0.05000,1.018 | |
| 2,self_attn.o_proj,0.0000115804,0.05000,1.037 | |
| 2,mlp.up_proj,0.0000130055,0.05000,1.068 | |
| 2,mlp.gate_proj,0.0000134072,0.05000,1.041 | |
| 2,mlp.down_proj,0.0000102456,0.05000,2.650 | |
| 3,self_attn.k_proj,0.0000079650,0.05000,1.039 | |
| 3,self_attn.v_proj,0.0000062979,0.05000,1.005 | |
| 3,self_attn.q_proj,0.0000344130,0.05000,1.018 | |
| 3,self_attn.o_proj,0.0000148093,0.05000,1.042 | |
| 3,mlp.up_proj,0.0000074303,0.05000,1.066 | |
| 3,mlp.gate_proj,0.0000075460,0.05000,1.039 | |
| 3,mlp.down_proj,0.0000036906,0.05000,2.652 | |
| 4,self_attn.k_proj,0.0000072926,0.05000,1.035 | |
| 4,self_attn.v_proj,0.0000054965,0.05000,1.004 | |
| 4,self_attn.q_proj,0.0000324719,0.05000,1.015 | |
| 4,self_attn.o_proj,0.0000135363,0.05000,1.042 | |
| 4,mlp.up_proj,0.0000077935,0.05000,1.064 | |
| 4,mlp.gate_proj,0.0000079466,0.05000,1.039 | |
| 4,mlp.down_proj,0.0000032122,0.05000,2.651 | |
| 5,self_attn.k_proj,0.0000092984,0.05000,1.038 | |
| 5,self_attn.v_proj,0.0000075066,0.05000,1.011 | |
| 5,self_attn.q_proj,0.0000400782,0.05000,1.019 | |
| 5,self_attn.o_proj,0.0000137737,0.05000,1.039 | |
| 5,mlp.up_proj,0.0000084687,0.05000,1.066 | |
| 5,mlp.gate_proj,0.0000086387,0.05000,1.037 | |
| 5,mlp.down_proj,0.0000029938,0.05000,2.648 | |
| 6,self_attn.k_proj,0.0000097146,0.05000,1.043 | |
| 6,self_attn.v_proj,0.0000078300,0.05000,1.001 | |
| 6,self_attn.q_proj,0.0000425935,0.05000,1.016 | |
| 6,self_attn.o_proj,0.0000130678,0.05000,1.040 | |
| 6,mlp.up_proj,0.0000066432,0.05000,1.066 | |
| 6,mlp.gate_proj,0.0000067693,0.05000,1.037 | |
| 6,mlp.down_proj,0.0000019580,0.05000,2.641 | |
| 7,self_attn.k_proj,0.0000110695,0.05000,1.034 | |
| 7,self_attn.v_proj,0.0000098961,0.05000,1.006 | |
| 7,self_attn.q_proj,0.0000535851,0.05000,1.012 | |
| 7,self_attn.o_proj,0.0000108217,0.05000,1.037 | |
| 7,mlp.up_proj,0.0000063509,0.05000,1.063 | |
| 7,mlp.gate_proj,0.0000064191,0.05000,1.035 | |
| 7,mlp.down_proj,0.0000018483,0.05000,2.653 | |
| 8,self_attn.k_proj,0.0000095001,0.05000,1.041 | |
| 8,self_attn.v_proj,0.0000075776,0.05000,1.002 | |
| 8,self_attn.q_proj,0.0000411649,0.05000,1.013 | |
| 8,self_attn.o_proj,0.0000126457,0.05000,1.040 | |
| 8,mlp.up_proj,0.0000065683,0.05000,1.063 | |
| 8,mlp.gate_proj,0.0000067366,0.05000,1.034 | |
| 8,mlp.down_proj,0.0000015336,0.05000,2.636 | |
| 9,self_attn.k_proj,0.0000075909,0.05000,1.044 | |
| 9,self_attn.v_proj,0.0000057550,0.05000,1.013 | |
| 9,self_attn.q_proj,0.0000344832,0.05000,1.025 | |
| 9,self_attn.o_proj,0.0000085166,0.05000,1.038 | |
| 9,mlp.up_proj,0.0000043794,0.05000,1.061 | |
| 9,mlp.gate_proj,0.0000045057,0.05000,1.035 | |
| 9,mlp.down_proj,0.0000009460,0.05000,2.641 | |
| 10,self_attn.k_proj,0.0000111547,0.05000,1.033 | |
| 10,self_attn.v_proj,0.0000092689,0.05000,1.000 | |
| 10,self_attn.q_proj,0.0000519109,0.05000,1.011 | |
| 10,self_attn.o_proj,0.0000135746,0.05000,1.032 | |
| 10,mlp.up_proj,0.0000039040,0.05000,1.061 | |
| 10,mlp.gate_proj,0.0000039544,0.05000,1.033 | |
| 10,mlp.down_proj,0.0000007761,0.05000,2.628 | |
| 11,self_attn.k_proj,0.0000108629,0.05000,1.035 | |
| 11,self_attn.v_proj,0.0000084592,0.05000,1.006 | |
| 11,self_attn.q_proj,0.0000500227,0.05000,1.008 | |
| 11,self_attn.o_proj,0.0000132639,0.05000,1.035 | |
| 11,mlp.up_proj,0.0000032214,0.05000,1.060 | |
| 11,mlp.gate_proj,0.0000033015,0.05000,1.030 | |
| 11,mlp.down_proj,0.0000004664,0.05000,2.627 | |
| 12,self_attn.k_proj,0.0000125110,0.05000,1.037 | |
| 12,self_attn.v_proj,0.0000097656,0.05000,0.995 | |
| 12,self_attn.q_proj,0.0000552543,0.05000,1.007 | |
| 12,self_attn.o_proj,0.0000134279,0.05000,1.036 | |
| 12,mlp.up_proj,0.0000031708,0.05000,1.058 | |
| 12,mlp.gate_proj,0.0000032374,0.05000,1.032 | |
| 12,mlp.down_proj,0.0000003898,0.05000,2.639 | |
| 13,self_attn.k_proj,0.0000102793,0.05000,1.040 | |
| 13,self_attn.v_proj,0.0000081455,0.05000,1.008 | |
| 13,self_attn.q_proj,0.0000480064,0.05000,1.011 | |
| 13,self_attn.o_proj,0.0000093675,0.05000,1.033 | |
| 13,mlp.up_proj,0.0000021026,0.05000,1.063 | |
| 13,mlp.gate_proj,0.0000021487,0.05000,1.033 | |
| 13,mlp.down_proj,0.0000001983,0.05000,2.641 | |
| 14,self_attn.k_proj,0.0000103936,0.05000,1.041 | |
| 14,self_attn.v_proj,0.0000081330,0.05000,1.002 | |
| 14,self_attn.q_proj,0.0000488184,0.05000,1.011 | |
| 14,self_attn.o_proj,0.0000089386,0.05000,1.037 | |
| 14,mlp.up_proj,0.0000025068,0.05000,1.062 | |
| 14,mlp.gate_proj,0.0000025513,0.05000,1.036 | |
| 14,mlp.down_proj,0.0000002944,0.05000,2.642 | |
| 15,self_attn.k_proj,0.0000134852,0.05000,1.045 | |
| 15,self_attn.v_proj,0.0000107378,0.05000,1.014 | |
| 15,self_attn.q_proj,0.0000620740,0.05000,1.016 | |
| 15,self_attn.o_proj,0.0000136202,0.05000,1.043 | |
| 15,mlp.up_proj,0.0000032474,0.05000,1.064 | |
| 15,mlp.gate_proj,0.0000033245,0.05000,1.040 | |
| 15,mlp.down_proj,0.0000004164,0.05000,2.635 | |
| 16,self_attn.k_proj,0.0000150497,0.05000,1.043 | |
| 16,self_attn.v_proj,0.0000123104,0.05000,1.008 | |
| 16,self_attn.q_proj,0.0000706003,0.05000,1.011 | |
| 16,self_attn.o_proj,0.0000116576,0.05000,1.038 | |
| 16,mlp.up_proj,0.0000042218,0.05000,1.061 | |
| 16,mlp.gate_proj,0.0000043296,0.05000,1.033 | |
| 16,mlp.down_proj,0.0000004880,0.05000,2.634 | |
| 17,self_attn.k_proj,0.0000164214,0.05000,1.038 | |
| 17,self_attn.v_proj,0.0000140974,0.05000,1.007 | |
| 17,self_attn.q_proj,0.0000774397,0.05000,1.009 | |
| 17,self_attn.o_proj,0.0000219263,0.05000,1.039 | |
| 17,mlp.up_proj,0.0000038117,0.05000,1.065 | |
| 17,mlp.gate_proj,0.0000039213,0.05000,1.041 | |
| 17,mlp.down_proj,0.0000004193,0.05000,2.653 | |
| 18,self_attn.k_proj,0.0000172823,0.05000,1.033 | |
| 18,self_attn.v_proj,0.0000144956,0.05000,0.998 | |
| 18,self_attn.q_proj,0.0000809578,0.05000,1.004 | |
| 18,self_attn.o_proj,0.0000178630,0.05000,1.035 | |
| 18,mlp.up_proj,0.0000034930,0.05000,1.061 | |
| 18,mlp.gate_proj,0.0000035984,0.05000,1.031 | |
| 18,mlp.down_proj,0.0000003581,0.05000,2.634 | |
| 19,self_attn.k_proj,0.0000138637,0.05000,1.038 | |
| 19,self_attn.v_proj,0.0000106994,0.05000,1.005 | |
| 19,self_attn.q_proj,0.0000632666,0.05000,1.005 | |
| 19,self_attn.o_proj,0.0000055669,0.05000,1.032 | |
| 19,mlp.up_proj,0.0000037013,0.05000,1.070 | |
| 19,mlp.gate_proj,0.0000038086,0.05000,1.035 | |
| 19,mlp.down_proj,0.0000003597,0.05000,2.646 | |
| 20,self_attn.k_proj,0.0000187151,0.05000,1.037 | |
| 20,self_attn.v_proj,0.0000151013,0.05000,1.000 | |
| 20,self_attn.q_proj,0.0000877593,0.05000,1.008 | |
| 20,self_attn.o_proj,0.0000173331,0.05000,1.031 | |
| 20,mlp.up_proj,0.0000035404,0.05000,1.058 | |
| 20,mlp.gate_proj,0.0000036535,0.05000,1.030 | |
| 20,mlp.down_proj,0.0000003419,0.05000,2.647 | |
| 21,self_attn.k_proj,0.0000161697,0.05000,1.037 | |
| 21,self_attn.v_proj,0.0000122697,0.05000,1.005 | |
| 21,self_attn.q_proj,0.0000721811,0.05000,1.011 | |
| 21,self_attn.o_proj,0.0000143799,0.05000,1.041 | |
| 21,mlp.up_proj,0.0000040757,0.05000,1.062 | |
| 21,mlp.gate_proj,0.0000042371,0.05000,1.039 | |
| 21,mlp.down_proj,0.0000004525,0.05000,2.664 | |
| 22,self_attn.k_proj,0.0000169354,0.05000,1.033 | |
| 22,self_attn.v_proj,0.0000132405,0.05000,1.002 | |
| 22,self_attn.q_proj,0.0000890276,0.05000,1.006 | |
| 22,self_attn.o_proj,0.0000041558,0.05000,1.037 | |
| 22,mlp.up_proj,0.0000036900,0.05000,1.056 | |
| 22,mlp.gate_proj,0.0000038310,0.05000,1.025 | |
| 22,mlp.down_proj,0.0000004213,0.05000,2.630 | |
| 23,self_attn.k_proj,0.0000182787,0.05000,1.039 | |
| 23,self_attn.v_proj,0.0000157284,0.05000,1.006 | |
| 23,self_attn.q_proj,0.0000960312,0.05000,1.006 | |
| 23,self_attn.o_proj,0.0000131840,0.05000,1.034 | |
| 23,mlp.up_proj,0.0000030392,0.05000,1.069 | |
| 23,mlp.gate_proj,0.0000031354,0.05000,1.040 | |
| 23,mlp.down_proj,0.0000002823,0.05000,2.631 | |
| 24,self_attn.k_proj,0.0000211280,0.05000,1.030 | |
| 24,self_attn.v_proj,0.0000192252,0.05000,1.001 | |
| 24,self_attn.q_proj,0.0001013641,0.05000,1.004 | |
| 24,self_attn.o_proj,0.0000243574,0.05000,1.039 | |
| 24,mlp.up_proj,0.0000033583,0.05000,1.065 | |
| 24,mlp.gate_proj,0.0000034760,0.05000,1.034 | |
| 24,mlp.down_proj,0.0000003517,0.05000,2.634 | |
| 25,self_attn.k_proj,0.0000196986,0.05000,1.048 | |
| 25,self_attn.v_proj,0.0000153495,0.05000,1.019 | |
| 25,self_attn.q_proj,0.0000933140,0.05000,1.016 | |
| 25,self_attn.o_proj,0.0000164252,0.05000,1.037 | |
| 25,mlp.up_proj,0.0000034673,0.05000,1.066 | |
| 25,mlp.gate_proj,0.0000035728,0.05000,1.042 | |
| 25,mlp.down_proj,0.0000003741,0.05000,2.647 | |
| 26,self_attn.k_proj,0.0000196134,0.05000,1.039 | |
| 26,self_attn.v_proj,0.0000150768,0.05000,1.004 | |
| 26,self_attn.q_proj,0.0000988552,0.05000,1.005 | |
| 26,self_attn.o_proj,0.0000089032,0.05000,1.038 | |
| 26,mlp.up_proj,0.0000036113,0.05000,1.064 | |
| 26,mlp.gate_proj,0.0000037079,0.05000,1.033 | |
| 26,mlp.down_proj,0.0000003865,0.05000,2.638 | |
| 27,self_attn.k_proj,0.0000185194,0.05000,1.038 | |
| 27,self_attn.v_proj,0.0000147775,0.05000,1.005 | |
| 27,self_attn.q_proj,0.0000884268,0.05000,1.006 | |
| 27,self_attn.o_proj,0.0000162331,0.05000,1.038 | |
| 27,mlp.up_proj,0.0000031586,0.05000,1.061 | |
| 27,mlp.gate_proj,0.0000032463,0.05000,1.036 | |
| 27,mlp.down_proj,0.0000003164,0.05000,2.633 | |
| 28,self_attn.k_proj,0.0000182955,0.05000,1.043 | |
| 28,self_attn.v_proj,0.0000151388,0.05000,1.002 | |
| 28,self_attn.q_proj,0.0000885868,0.05000,1.005 | |
| 28,self_attn.o_proj,0.0000136137,0.05000,1.032 | |
| 28,mlp.up_proj,0.0000028749,0.05000,1.064 | |
| 28,mlp.gate_proj,0.0000029219,0.05000,1.033 | |
| 28,mlp.down_proj,0.0000003112,0.05000,2.635 | |
| 29,self_attn.k_proj,0.0000185079,0.05000,1.043 | |
| 29,self_attn.v_proj,0.0000122247,0.05000,1.010 | |
| 29,self_attn.q_proj,0.0000848096,0.05000,1.009 | |
| 29,self_attn.o_proj,0.0000079501,0.05000,1.033 | |
| 29,mlp.up_proj,0.0000034258,0.05000,1.060 | |
| 29,mlp.gate_proj,0.0000034560,0.05000,1.033 | |
| 29,mlp.down_proj,0.0000004112,0.05000,2.624 | |
| 30,self_attn.k_proj,0.0000200373,0.05000,1.034 | |
| 30,self_attn.v_proj,0.0000163101,0.05000,1.004 | |
| 30,self_attn.q_proj,0.0001012875,0.05000,1.004 | |
| 30,self_attn.o_proj,0.0000071170,0.05000,1.033 | |
| 30,mlp.up_proj,0.0000035733,0.05000,1.057 | |
| 30,mlp.gate_proj,0.0000035858,0.05000,1.030 | |
| 30,mlp.down_proj,0.0000004136,0.05000,2.630 | |
| 31,self_attn.k_proj,0.0000211797,0.05000,1.036 | |
| 31,self_attn.v_proj,0.0000139414,0.05000,1.005 | |
| 31,self_attn.q_proj,0.0000860812,0.05000,1.006 | |
| 31,self_attn.o_proj,0.0000048044,0.05000,1.033 | |
| 31,mlp.up_proj,0.0000037375,0.05000,1.060 | |
| 31,mlp.gate_proj,0.0000037139,0.05000,1.033 | |
| 31,mlp.down_proj,0.0000004492,0.05000,2.622 | |
| 32,self_attn.k_proj,0.0000207835,0.05000,1.035 | |
| 32,self_attn.v_proj,0.0000152161,0.05000,1.001 | |
| 32,self_attn.q_proj,0.0000913564,0.05000,1.007 | |
| 32,self_attn.o_proj,0.0000079106,0.05000,1.034 | |
| 32,mlp.up_proj,0.0000024507,0.05000,1.059 | |
| 32,mlp.gate_proj,0.0000024351,0.05000,1.033 | |
| 32,mlp.down_proj,0.0000001740,0.05000,2.624 | |
| 33,self_attn.k_proj,0.0000182657,0.05000,1.039 | |
| 33,self_attn.v_proj,0.0000128059,0.05000,1.006 | |
| 33,self_attn.q_proj,0.0000866449,0.05000,1.007 | |
| 33,self_attn.o_proj,0.0000072791,0.05000,1.032 | |
| 33,mlp.up_proj,0.0000031301,0.05000,1.068 | |
| 33,mlp.gate_proj,0.0000031329,0.05000,1.031 | |
| 33,mlp.down_proj,0.0000004381,0.05000,2.626 | |
| 34,self_attn.k_proj,0.0000166431,0.05000,1.037 | |
| 34,self_attn.v_proj,0.0000133107,0.05000,1.001 | |
| 34,self_attn.q_proj,0.0000836072,0.05000,1.005 | |
| 34,self_attn.o_proj,0.0000067067,0.05000,1.039 | |
| 34,mlp.up_proj,0.0000042955,0.05000,1.059 | |
| 34,mlp.gate_proj,0.0000043195,0.05000,1.031 | |
| 34,mlp.down_proj,0.0000005294,0.05000,2.631 | |
| 35,self_attn.k_proj,0.0000127095,0.05000,1.038 | |
| 35,self_attn.v_proj,0.0000130456,0.05000,1.007 | |
| 35,self_attn.q_proj,0.0000706689,0.05000,1.006 | |
| 35,self_attn.o_proj,0.0000047317,0.05000,1.031 | |
| 35,mlp.up_proj,0.0000050128,0.05000,1.061 | |
| 35,mlp.gate_proj,0.0000050194,0.05000,1.029 | |
| 35,mlp.down_proj,0.0000007617,0.05000,2.616 | |
| 36,self_attn.k_proj,0.0000122905,0.05000,1.035 | |
| 36,self_attn.v_proj,0.0000143251,0.05000,1.002 | |
| 36,self_attn.q_proj,0.0000760232,0.05000,1.004 | |
| 36,self_attn.o_proj,0.0000038522,0.05000,1.032 | |
| 36,mlp.up_proj,0.0000282895,0.05000,1.061 | |
| 36,mlp.gate_proj,0.0000269556,0.05000,1.028 | |
| 36,mlp.down_proj,0.0000333966,0.05000,2.631 | |
| 37,self_attn.k_proj,0.0000136531,0.05000,1.034 | |
| 37,self_attn.v_proj,0.0000129941,0.05000,1.002 | |
| 37,self_attn.q_proj,0.0000815826,0.05000,1.001 | |
| 37,self_attn.o_proj,0.0000139014,0.05000,1.027 | |
| 37,mlp.up_proj,0.0000297700,0.05000,1.056 | |
| 37,mlp.gate_proj,0.0000275959,0.05000,1.030 | |
| 37,mlp.down_proj,0.0000330723,0.05000,2.627 | |