| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000000044,0.05000,2.464 | |
| 0,self_attn.v_proj,0.0000000008,0.05000,2.488 | |
| 0,self_attn.q_proj,0.0000000191,0.05000,2.543 | |
| 0,self_attn.o_proj,0.0000000203,0.05000,0.861 | |
| 0,mlp.up_proj,0.0000000307,0.05000,2.166 | |
| 0,mlp.gate_proj,0.0000000795,0.05000,2.175 | |
| 0,mlp.down_proj,0.0000000207,0.05000,5.497 | |
| 1,self_attn.v_proj,0.0000000008,0.05000,3.146 | |
| 1,self_attn.k_proj,0.0000000022,0.05000,3.175 | |
| 1,self_attn.q_proj,0.0000000085,0.05000,3.193 | |
| 1,self_attn.o_proj,0.0000000040,0.05000,0.825 | |
| 1,mlp.up_proj,0.0000008692,0.05000,1.366 | |
| 1,mlp.gate_proj,0.0000012902,0.05000,1.372 | |
| 1,mlp.down_proj,0.0000000284,0.05000,5.618 | |
| 2,self_attn.k_proj,0.0000000123,0.05000,3.202 | |
| 2,self_attn.v_proj,0.0000000028,0.05000,3.210 | |
| 2,self_attn.q_proj,0.0000000484,0.05000,3.295 | |
| 2,self_attn.o_proj,0.0000000079,0.05000,0.838 | |
| 2,mlp.up_proj,0.0000008670,0.05000,2.285 | |
| 2,mlp.gate_proj,0.0000012831,0.05000,2.291 | |
| 2,mlp.down_proj,0.0000000571,0.05000,5.648 | |
| 3,self_attn.q_proj,0.0000000671,0.05000,3.347 | |
| 3,self_attn.v_proj,0.0000000060,0.05000,3.451 | |
| 3,self_attn.k_proj,0.0000000151,0.05000,3.490 | |
| 3,self_attn.o_proj,0.0000000252,0.05000,0.890 | |
| 3,mlp.up_proj,0.0000020149,0.05000,2.103 | |
| 3,mlp.gate_proj,0.0000023558,0.05000,2.110 | |
| 3,mlp.down_proj,0.0000006257,0.05000,5.511 | |
| 4,self_attn.k_proj,0.0000000315,0.05000,2.993 | |
| 4,self_attn.v_proj,0.0000000167,0.05000,3.009 | |
| 4,self_attn.q_proj,0.0000001521,0.05000,3.086 | |
| 4,self_attn.o_proj,0.0000000164,0.05000,0.890 | |
| 4,mlp.gate_proj,0.0000023605,0.05000,2.241 | |
| 4,mlp.up_proj,0.0000018879,0.05000,2.255 | |
| 4,mlp.down_proj,0.0000002817,0.05000,5.677 | |
| 5,self_attn.k_proj,0.0000000341,0.05000,3.653 | |
| 5,self_attn.v_proj,0.0000000171,0.05000,3.675 | |
| 5,self_attn.q_proj,0.0000001700,0.05000,3.707 | |
| 5,self_attn.o_proj,0.0000000157,0.05000,0.918 | |
| 5,mlp.up_proj,0.0000030345,0.05000,2.204 | |
| 5,mlp.gate_proj,0.0000033247,0.05000,2.219 | |
| 5,mlp.down_proj,0.0000000732,0.05000,5.558 | |
| 6,self_attn.k_proj,0.0000000210,0.05000,2.998 | |
| 6,self_attn.v_proj,0.0000000125,0.05000,3.003 | |
| 6,self_attn.q_proj,0.0000001101,0.05000,3.088 | |
| 6,self_attn.o_proj,0.0000000269,0.05000,0.896 | |
| 6,mlp.up_proj,0.0000007844,0.05000,2.153 | |
| 6,mlp.gate_proj,0.0000010371,0.05000,2.159 | |
| 6,mlp.down_proj,0.0000001627,0.05000,5.748 | |
| 7,self_attn.k_proj,0.0000000239,0.05000,3.633 | |
| 7,self_attn.v_proj,0.0000000261,0.05000,3.659 | |
| 7,self_attn.q_proj,0.0000001492,0.05000,3.664 | |
| 7,self_attn.o_proj,0.0000000598,0.05000,0.844 | |
| 7,mlp.up_proj,0.0000007770,0.05000,2.100 | |
| 7,mlp.gate_proj,0.0000008227,0.05000,2.109 | |
| 7,mlp.down_proj,0.0000002494,0.05000,5.609 | |
| 8,self_attn.k_proj,0.0000000450,0.05000,3.464 | |
| 8,self_attn.q_proj,0.0000002250,0.05000,3.475 | |
| 8,self_attn.v_proj,0.0000000253,0.05000,3.480 | |
| 8,self_attn.o_proj,0.0000000541,0.05000,0.843 | |
| 8,mlp.up_proj,0.0000009107,0.05000,2.163 | |
| 8,mlp.gate_proj,0.0000009393,0.05000,2.169 | |
| 8,mlp.down_proj,0.0000002649,0.05000,5.567 | |
| 9,self_attn.q_proj,0.0000002020,0.05000,2.928 | |
| 9,self_attn.v_proj,0.0000000356,0.05000,2.950 | |
| 9,self_attn.k_proj,0.0000000332,0.05000,3.041 | |
| 9,self_attn.o_proj,0.0000000851,0.05000,0.852 | |
| 9,mlp.up_proj,0.0000018742,0.05000,2.121 | |
| 9,mlp.gate_proj,0.0000025099,0.05000,2.130 | |
| 9,mlp.down_proj,0.0000003172,0.05000,5.574 | |
| 10,self_attn.q_proj,0.0000001846,0.05000,2.718 | |
| 10,self_attn.k_proj,0.0000000335,0.05000,2.737 | |
| 10,self_attn.v_proj,0.0000000234,0.05000,2.836 | |
| 10,self_attn.o_proj,0.0000000614,0.05000,0.838 | |
| 10,mlp.gate_proj,0.0000010436,0.05000,2.127 | |
| 10,mlp.up_proj,0.0000009895,0.05000,2.136 | |
| 10,mlp.down_proj,0.0000002303,0.05000,5.724 | |
| 11,self_attn.k_proj,0.0000000413,0.05000,3.974 | |
| 11,self_attn.q_proj,0.0000002067,0.05000,3.992 | |
| 11,self_attn.v_proj,0.0000000216,0.05000,4.085 | |
| 11,self_attn.o_proj,0.0000000655,0.05000,0.886 | |
| 11,mlp.up_proj,0.0000009311,0.05000,2.553 | |
| 11,mlp.gate_proj,0.0000009437,0.05000,2.563 | |
| 11,mlp.down_proj,0.0000002879,0.05000,5.553 | |
| 12,self_attn.v_proj,0.0000000269,0.05000,4.333 | |
| 12,self_attn.q_proj,0.0000002253,0.05000,4.347 | |
| 12,self_attn.k_proj,0.0000000432,0.05000,4.384 | |
| 12,self_attn.o_proj,0.0000000747,0.05000,0.874 | |
| 12,mlp.gate_proj,0.0000009145,0.05000,2.833 | |
| 12,mlp.up_proj,0.0000009364,0.05000,2.844 | |
| 12,mlp.down_proj,0.0000002613,0.05000,5.630 | |
| 13,self_attn.v_proj,0.0000000339,0.05000,2.604 | |
| 13,self_attn.k_proj,0.0000000372,0.05000,2.632 | |
| 13,self_attn.q_proj,0.0000002266,0.05000,2.640 | |
| 13,self_attn.o_proj,0.0000001181,0.05000,0.857 | |
| 13,mlp.up_proj,0.0000009420,0.05000,1.799 | |
| 13,mlp.gate_proj,0.0000009377,0.05000,1.798 | |
| 13,mlp.down_proj,0.0000002500,0.05000,5.592 | |
| 14,self_attn.k_proj,0.0000000547,0.05000,3.282 | |
| 14,self_attn.v_proj,0.0000000395,0.05000,3.297 | |
| 14,self_attn.q_proj,0.0000003236,0.05000,3.427 | |
| 14,self_attn.o_proj,0.0000000939,0.05000,0.851 | |
| 14,mlp.gate_proj,0.0000010082,0.05000,1.820 | |
| 14,mlp.up_proj,0.0000010460,0.05000,1.823 | |
| 14,mlp.down_proj,0.0000002847,0.05000,5.866 | |
| 15,self_attn.v_proj,0.0000000321,0.05000,3.789 | |
| 15,self_attn.k_proj,0.0000000497,0.05000,3.805 | |
| 15,self_attn.q_proj,0.0000002612,0.05000,3.890 | |
| 15,self_attn.o_proj,0.0000000868,0.05000,0.862 | |
| 15,mlp.up_proj,0.0000009975,0.05000,1.744 | |
| 15,mlp.gate_proj,0.0000009431,0.05000,1.748 | |
| 15,mlp.down_proj,0.0000003023,0.05000,5.621 | |
| 16,self_attn.q_proj,0.0000002790,0.05000,2.622 | |
| 16,self_attn.k_proj,0.0000000447,0.05000,2.629 | |
| 16,self_attn.v_proj,0.0000000462,0.05000,2.644 | |
| 16,self_attn.o_proj,0.0000001286,0.05000,0.839 | |
| 16,mlp.up_proj,0.0000010595,0.05000,1.755 | |
| 16,mlp.gate_proj,0.0000010016,0.05000,1.755 | |
| 16,mlp.down_proj,0.0000003172,0.05000,5.590 | |
| 17,self_attn.q_proj,0.0000003178,0.05000,2.550 | |
| 17,self_attn.v_proj,0.0000000503,0.05000,2.574 | |
| 17,self_attn.k_proj,0.0000000467,0.05000,2.594 | |
| 17,self_attn.o_proj,0.0000001092,0.05000,0.865 | |
| 17,mlp.up_proj,0.0000012212,0.05000,1.691 | |
| 17,mlp.gate_proj,0.0000011384,0.05000,1.691 | |
| 17,mlp.down_proj,0.0000004105,0.05000,5.573 | |
| 18,self_attn.v_proj,0.0000000558,0.05000,2.441 | |
| 18,self_attn.k_proj,0.0000000355,0.05000,2.474 | |
| 18,self_attn.q_proj,0.0000002488,0.05000,2.482 | |
| 18,self_attn.o_proj,0.0000002174,0.05000,0.858 | |
| 18,mlp.up_proj,0.0000012998,0.05000,1.713 | |
| 18,mlp.gate_proj,0.0000012134,0.05000,1.719 | |
| 18,mlp.down_proj,0.0000004943,0.05000,5.604 | |
| 19,self_attn.q_proj,0.0000002946,0.05000,2.463 | |
| 19,self_attn.k_proj,0.0000000362,0.05000,2.486 | |
| 19,self_attn.v_proj,0.0000000733,0.05000,2.516 | |
| 19,self_attn.o_proj,0.0000002530,0.05000,0.848 | |
| 19,mlp.up_proj,0.0000014108,0.05000,1.724 | |
| 19,mlp.gate_proj,0.0000013564,0.05000,1.730 | |
| 19,mlp.down_proj,0.0000006319,0.05000,5.626 | |
| 20,self_attn.q_proj,0.0000002772,0.05000,2.549 | |
| 20,self_attn.v_proj,0.0000000775,0.05000,2.581 | |
| 20,self_attn.k_proj,0.0000000353,0.05000,2.595 | |
| 20,self_attn.o_proj,0.0000001905,0.05000,0.848 | |
| 20,mlp.gate_proj,0.0000017158,0.05000,1.712 | |
| 20,mlp.up_proj,0.0000017782,0.05000,1.716 | |
| 20,mlp.down_proj,0.0000011989,0.05000,5.666 | |
| 21,self_attn.k_proj,0.0000000390,0.05000,2.589 | |
| 21,self_attn.v_proj,0.0000001106,0.05000,2.622 | |
| 21,self_attn.q_proj,0.0000003375,0.05000,2.633 | |
| 21,self_attn.o_proj,0.0000003695,0.05000,0.867 | |
| 21,mlp.up_proj,0.0000022832,0.05000,1.698 | |
| 21,mlp.gate_proj,0.0000022574,0.05000,1.705 | |
| 21,mlp.down_proj,0.0000017943,0.05000,5.606 | |
| 22,self_attn.q_proj,0.0000005025,0.05000,2.727 | |
| 22,self_attn.k_proj,0.0000000550,0.05000,2.731 | |
| 22,self_attn.v_proj,0.0000001965,0.05000,2.739 | |
| 22,self_attn.o_proj,0.0000003003,0.05000,0.861 | |
| 22,mlp.up_proj,0.0000031518,0.05000,1.768 | |
| 22,mlp.gate_proj,0.0000030812,0.05000,1.776 | |
| 22,mlp.down_proj,0.0000031401,0.05000,5.648 | |
| 23,self_attn.k_proj,0.0000000747,0.05000,2.695 | |
| 23,self_attn.v_proj,0.0000002885,0.05000,2.705 | |
| 23,self_attn.q_proj,0.0000006291,0.05000,2.714 | |
| 23,self_attn.o_proj,0.0000006152,0.05000,0.871 | |
| 23,mlp.up_proj,0.0000041236,0.05000,1.787 | |
| 23,mlp.gate_proj,0.0000039755,0.05000,1.794 | |
| 23,mlp.down_proj,0.0000037470,0.05000,5.645 | |
| 24,self_attn.q_proj,0.0000005010,0.05000,3.537 | |
| 24,self_attn.v_proj,0.0000002462,0.05000,3.574 | |
| 24,self_attn.k_proj,0.0000000591,0.05000,3.643 | |
| 24,self_attn.o_proj,0.0000004400,0.05000,0.855 | |
| 24,mlp.gate_proj,0.0000040475,0.05000,1.760 | |
| 24,mlp.up_proj,0.0000044454,0.05000,1.770 | |
| 24,mlp.down_proj,0.0000049576,0.05000,5.640 | |
| 25,self_attn.v_proj,0.0000003608,0.05000,2.477 | |
| 25,self_attn.q_proj,0.0000005041,0.05000,2.507 | |
| 25,self_attn.k_proj,0.0000000499,0.05000,2.533 | |
| 25,self_attn.o_proj,0.0000006603,0.05000,0.887 | |
| 25,mlp.up_proj,0.0000053732,0.05000,1.737 | |
| 25,mlp.gate_proj,0.0000047783,0.05000,1.737 | |
| 25,mlp.down_proj,0.0000070089,0.05000,5.685 | |
| 26,self_attn.q_proj,0.0000007222,0.05000,3.921 | |
| 26,self_attn.v_proj,0.0000006790,0.05000,3.977 | |
| 26,self_attn.k_proj,0.0000000789,0.05000,4.082 | |
| 26,self_attn.o_proj,0.0000011606,0.05000,0.862 | |
| 26,mlp.up_proj,0.0000056787,0.05000,2.722 | |
| 26,mlp.gate_proj,0.0000050093,0.05000,2.732 | |
| 26,mlp.down_proj,0.0000140491,0.05000,5.705 | |
| 27,self_attn.v_proj,0.0000007066,0.05000,2.857 | |
| 27,self_attn.q_proj,0.0000010869,0.05000,2.898 | |
| 27,self_attn.k_proj,0.0000001030,0.05000,2.932 | |
| 27,self_attn.o_proj,0.0000015821,0.05000,0.909 | |
| 27,mlp.up_proj,0.0000063775,0.05000,1.905 | |
| 27,mlp.gate_proj,0.0000059692,0.05000,1.912 | |
| 27,mlp.down_proj,0.0000325339,0.05000,5.683 | |