| layer,module,loss,damp,time | |
| 0,self_attn.v_proj,0.0000000021,0.10000,9.228 | |
| 0,self_attn.k_proj,0.0000000326,0.10000,9.264 | |
| 0,self_attn.q_proj,0.0000001731,0.10000,9.268 | |
| 0,self_attn.o_proj,0.0000000019,0.10000,3.671 | |
| 0,mlp.gate_proj,0.0000000817,0.10000,7.073 | |
| 0,mlp.up_proj,0.0000000777,0.10000,7.086 | |
| 0,mlp.down_proj,0.0000000013,0.10000,20.354 | |
| 1,self_attn.q_proj,0.0000000612,0.10000,7.913 | |
| 1,self_attn.k_proj,0.0000000161,0.10000,7.921 | |
| 1,self_attn.v_proj,0.0000000009,0.10000,7.968 | |
| 1,self_attn.o_proj,0.0000000003,0.10000,2.500 | |
| 1,mlp.up_proj,0.0000002540,0.10000,5.501 | |
| 1,mlp.gate_proj,0.0000002742,0.10000,5.577 | |
| 1,mlp.down_proj,0.0002870575,0.10000,20.610 | |
| 2,self_attn.q_proj,0.0000032041,0.10000,7.672 | |
| 2,self_attn.v_proj,0.0000004020,0.10000,7.712 | |
| 2,self_attn.k_proj,0.0000009859,0.10000,7.717 | |
| 2,self_attn.o_proj,0.0000000097,0.10000,2.541 | |
| 2,mlp.up_proj,0.0000005513,0.10000,5.423 | |
| 2,mlp.gate_proj,0.0000005756,0.10000,5.493 | |
| 2,mlp.down_proj,0.0000000153,0.10000,20.298 | |
| 3,self_attn.k_proj,0.0000008145,0.10000,7.601 | |
| 3,self_attn.q_proj,0.0000022983,0.10000,7.700 | |
| 3,self_attn.v_proj,0.0000003440,0.10000,7.716 | |
| 3,self_attn.o_proj,0.0000000165,0.10000,2.436 | |
| 3,mlp.up_proj,0.0000009216,0.10000,5.592 | |
| 3,mlp.gate_proj,0.0000009405,0.10000,5.618 | |
| 3,mlp.down_proj,0.0000000234,0.10000,19.773 | |
| 4,self_attn.k_proj,0.0000010915,0.10000,7.611 | |
| 4,self_attn.v_proj,0.0000005528,0.10000,7.614 | |
| 4,self_attn.q_proj,0.0000043595,0.10000,7.626 | |
| 4,self_attn.o_proj,0.0000000053,0.10000,2.456 | |
| 4,mlp.gate_proj,0.0000017495,0.10000,5.564 | |
| 4,mlp.up_proj,0.0000017015,0.10000,5.600 | |
| 4,mlp.down_proj,0.0000000348,0.10000,19.943 | |
| 5,self_attn.v_proj,0.0000007812,0.10000,7.609 | |
| 5,self_attn.q_proj,0.0000052871,0.10000,7.622 | |
| 5,self_attn.k_proj,0.0000013634,0.10000,7.632 | |
| 5,self_attn.o_proj,0.0000000050,0.10000,2.604 | |
| 5,mlp.up_proj,0.0000025099,0.10000,5.507 | |
| 5,mlp.gate_proj,0.0000026141,0.10000,5.550 | |
| 5,mlp.down_proj,0.0000000539,0.10000,20.386 | |
| 6,self_attn.v_proj,0.0000005292,0.10000,7.844 | |
| 6,self_attn.q_proj,0.0000036487,0.10000,7.853 | |
| 6,self_attn.k_proj,0.0000009903,0.10000,7.897 | |
| 6,self_attn.o_proj,0.0000000065,0.10000,2.584 | |
| 6,mlp.up_proj,0.0000030373,0.10000,5.391 | |
| 6,mlp.gate_proj,0.0000031575,0.10000,5.416 | |
| 6,mlp.down_proj,0.0000000681,0.10000,19.967 | |
| 7,self_attn.k_proj,0.0000013567,0.10000,7.501 | |
| 7,self_attn.v_proj,0.0000006903,0.10000,7.541 | |
| 7,self_attn.q_proj,0.0000052830,0.10000,7.586 | |
| 7,self_attn.o_proj,0.0000000136,0.10000,2.643 | |
| 7,mlp.gate_proj,0.0000038829,0.10000,5.517 | |
| 7,mlp.up_proj,0.0000037647,0.10000,5.535 | |
| 7,mlp.down_proj,0.0000000921,0.10000,20.331 | |
| 8,self_attn.k_proj,0.0000012813,0.10000,7.599 | |
| 8,self_attn.q_proj,0.0000047585,0.10000,7.624 | |
| 8,self_attn.v_proj,0.0000007005,0.10000,7.677 | |
| 8,self_attn.o_proj,0.0000000398,0.10000,2.602 | |
| 8,mlp.gate_proj,0.0000045715,0.10000,5.526 | |
| 8,mlp.up_proj,0.0000043751,0.10000,5.551 | |
| 8,mlp.down_proj,0.0000001178,0.10000,19.864 | |
| 9,self_attn.k_proj,0.0000033423,0.10000,7.421 | |
| 9,self_attn.q_proj,0.0000149456,0.10000,7.430 | |
| 9,self_attn.v_proj,0.0000020237,0.10000,7.454 | |
| 9,self_attn.o_proj,0.0000000460,0.10000,2.480 | |
| 9,mlp.up_proj,0.0000048140,0.10000,5.383 | |
| 9,mlp.gate_proj,0.0000049987,0.10000,5.429 | |
| 9,mlp.down_proj,0.0000001313,0.10000,20.347 | |
| 10,self_attn.v_proj,0.0000011253,0.10000,7.113 | |
| 10,self_attn.q_proj,0.0000088448,0.10000,7.134 | |
| 10,self_attn.k_proj,0.0000021524,0.10000,7.170 | |
| 10,self_attn.o_proj,0.0000000724,0.10000,2.592 | |
| 10,mlp.up_proj,0.0000058928,0.10000,5.479 | |
| 10,mlp.gate_proj,0.0000061487,0.10000,5.480 | |
| 10,mlp.down_proj,0.0000001853,0.10000,20.006 | |
| 11,self_attn.q_proj,0.0000103466,0.10000,7.623 | |
| 11,self_attn.k_proj,0.0000023750,0.10000,7.691 | |
| 11,self_attn.v_proj,0.0000011267,0.10000,7.716 | |
| 11,self_attn.o_proj,0.0000000767,0.10000,2.407 | |
| 11,mlp.up_proj,0.0000067959,0.10000,5.429 | |
| 11,mlp.gate_proj,0.0000071278,0.10000,5.470 | |
| 11,mlp.down_proj,0.0000002469,0.10000,19.955 | |
| 12,self_attn.q_proj,0.0000143961,0.10000,7.662 | |
| 12,self_attn.v_proj,0.0000016649,0.10000,7.693 | |
| 12,self_attn.k_proj,0.0000031072,0.10000,7.737 | |
| 12,self_attn.o_proj,0.0000001098,0.10000,2.538 | |
| 12,mlp.up_proj,0.0000077164,0.10000,5.550 | |
| 12,mlp.gate_proj,0.0000080579,0.10000,5.582 | |
| 12,mlp.down_proj,0.0000002965,0.10000,19.899 | |
| 13,self_attn.v_proj,0.0000016180,0.10000,7.477 | |
| 13,self_attn.k_proj,0.0000029538,0.10000,7.484 | |
| 13,self_attn.q_proj,0.0000134573,0.10000,7.506 | |
| 13,self_attn.o_proj,0.0000001076,0.10000,2.593 | |
| 13,mlp.up_proj,0.0000089563,0.10000,5.575 | |
| 13,mlp.gate_proj,0.0000093503,0.10000,5.599 | |
| 13,mlp.down_proj,0.0000003839,0.10000,20.249 | |
| 14,self_attn.q_proj,0.0000131731,0.10000,7.786 | |
| 14,self_attn.v_proj,0.0000015733,0.10000,7.791 | |
| 14,self_attn.k_proj,0.0000028953,0.10000,7.823 | |
| 14,self_attn.o_proj,0.0000001857,0.10000,2.389 | |
| 14,mlp.gate_proj,0.0000097674,0.10000,5.493 | |
| 14,mlp.up_proj,0.0000093670,0.10000,5.521 | |
| 14,mlp.down_proj,0.0000004451,0.10000,20.165 | |
| 15,self_attn.k_proj,0.0000035102,0.10000,7.533 | |
| 15,self_attn.v_proj,0.0000019057,0.10000,7.537 | |
| 15,self_attn.q_proj,0.0000172255,0.10000,7.584 | |
| 15,self_attn.o_proj,0.0000001357,0.10000,2.428 | |
| 15,mlp.up_proj,0.0000118095,0.10000,5.560 | |
| 15,mlp.gate_proj,0.0000123567,0.10000,5.594 | |
| 15,mlp.down_proj,0.0000005491,0.10000,20.147 | |
| 16,self_attn.k_proj,0.0000032821,0.10000,7.184 | |
| 16,self_attn.v_proj,0.0000016827,0.10000,7.263 | |
| 16,self_attn.q_proj,0.0000154101,0.10000,7.314 | |
| 16,self_attn.o_proj,0.0000001600,0.10000,2.551 | |
| 16,mlp.gate_proj,0.0000134883,0.10000,5.490 | |
| 16,mlp.up_proj,0.0000129061,0.10000,5.551 | |
| 16,mlp.down_proj,0.0000006242,0.10000,19.930 | |
| 17,self_attn.v_proj,0.0000016488,0.10000,7.524 | |
| 17,self_attn.k_proj,0.0000027783,0.10000,7.546 | |
| 17,self_attn.q_proj,0.0000126517,0.10000,7.615 | |
| 17,self_attn.o_proj,0.0000002209,0.10000,2.467 | |
| 17,mlp.up_proj,0.0000125549,0.10000,5.486 | |
| 17,mlp.gate_proj,0.0000130271,0.10000,5.528 | |
| 17,mlp.down_proj,0.0000006893,0.10000,19.887 | |
| 18,self_attn.q_proj,0.0000235518,0.10000,7.603 | |
| 18,self_attn.v_proj,0.0000028751,0.10000,7.642 | |
| 18,self_attn.k_proj,0.0000051540,0.10000,7.668 | |
| 18,self_attn.o_proj,0.0000001676,0.10000,2.519 | |
| 18,mlp.up_proj,0.0000151162,0.10000,5.530 | |
| 18,mlp.gate_proj,0.0000157739,0.10000,5.531 | |
| 18,mlp.down_proj,0.0000008413,0.10000,19.978 | |
| 19,self_attn.k_proj,0.0000067402,0.10000,7.557 | |
| 19,self_attn.v_proj,0.0000040603,0.10000,7.671 | |
| 19,self_attn.q_proj,0.0000324108,0.10000,7.705 | |
| 19,self_attn.o_proj,0.0000002029,0.10000,2.595 | |
| 19,mlp.up_proj,0.0000175342,0.10000,5.386 | |
| 19,mlp.gate_proj,0.0000182990,0.10000,5.426 | |
| 19,mlp.down_proj,0.0000011666,0.10000,19.720 | |
| 20,self_attn.k_proj,0.0000027224,0.10000,7.418 | |
| 20,self_attn.q_proj,0.0000133101,0.10000,7.428 | |
| 20,self_attn.v_proj,0.0000016237,0.10000,7.495 | |
| 20,self_attn.o_proj,0.0000002907,0.10000,2.619 | |
| 20,mlp.up_proj,0.0000210489,0.10000,5.538 | |
| 20,mlp.gate_proj,0.0000221256,0.10000,5.584 | |
| 20,mlp.down_proj,0.0000015669,0.10000,19.688 | |
| 21,self_attn.q_proj,0.0000113229,0.10000,7.891 | |
| 21,self_attn.v_proj,0.0000014841,0.10000,7.906 | |
| 21,self_attn.k_proj,0.0000023100,0.10000,7.948 | |
| 21,self_attn.o_proj,0.0000004912,0.10000,2.379 | |
| 21,mlp.gate_proj,0.0000200858,0.10000,5.447 | |
| 21,mlp.up_proj,0.0000192769,0.10000,5.478 | |
| 21,mlp.down_proj,0.0000015327,0.10000,19.885 | |
| 22,self_attn.q_proj,0.0000304609,0.10000,7.333 | |
| 22,self_attn.k_proj,0.0000055332,0.10000,7.480 | |
| 22,self_attn.v_proj,0.0000034653,0.10000,7.539 | |
| 22,self_attn.o_proj,0.0000006605,0.10000,2.430 | |
| 22,mlp.gate_proj,0.0000276365,0.10000,5.473 | |
| 22,mlp.up_proj,0.0000265293,0.10000,5.518 | |
| 22,mlp.down_proj,0.0000028746,0.10000,19.896 | |
| 23,self_attn.q_proj,0.0000260237,0.10000,7.520 | |
| 23,self_attn.k_proj,0.0000045537,0.10000,7.542 | |
| 23,self_attn.v_proj,0.0000030669,0.10000,7.565 | |
| 23,self_attn.o_proj,0.0000007985,0.10000,2.394 | |
| 23,mlp.gate_proj,0.0000313806,0.10000,5.469 | |
| 23,mlp.up_proj,0.0000297783,0.10000,5.508 | |
| 23,mlp.down_proj,0.0000030651,0.10000,20.129 | |
| 24,self_attn.q_proj,0.0000225556,0.10000,7.726 | |
| 24,self_attn.v_proj,0.0000032132,0.10000,7.780 | |
| 24,self_attn.k_proj,0.0000040272,0.10000,7.824 | |
| 24,self_attn.o_proj,0.0000008312,0.10000,2.659 | |
| 24,mlp.up_proj,0.0000352088,0.10000,5.582 | |
| 24,mlp.gate_proj,0.0000374105,0.10000,5.611 | |
| 24,mlp.down_proj,0.0000036593,0.10000,20.107 | |
| 25,self_attn.q_proj,0.0000401664,0.10000,7.246 | |
| 25,self_attn.v_proj,0.0000045236,0.10000,7.335 | |
| 25,self_attn.k_proj,0.0000070576,0.10000,7.369 | |
| 25,self_attn.o_proj,0.0000008642,0.10000,2.579 | |
| 25,mlp.gate_proj,0.0000447818,0.10000,5.621 | |
| 25,mlp.up_proj,0.0000424599,0.10000,5.648 | |
| 25,mlp.down_proj,0.0000042406,0.10000,20.432 | |
| 26,self_attn.v_proj,0.0000034460,0.10000,7.444 | |
| 26,self_attn.k_proj,0.0000052029,0.10000,7.486 | |
| 26,self_attn.q_proj,0.0000287755,0.10000,7.587 | |
| 26,self_attn.o_proj,0.0000012136,0.10000,2.514 | |
| 26,mlp.up_proj,0.0000484828,0.10000,5.444 | |
| 26,mlp.gate_proj,0.0000509648,0.10000,5.473 | |
| 26,mlp.down_proj,0.0000044866,0.10000,19.777 | |
| 27,self_attn.k_proj,0.0000052048,0.10000,7.506 | |
| 27,self_attn.q_proj,0.0000279974,0.10000,7.512 | |
| 27,self_attn.v_proj,0.0000036007,0.10000,7.606 | |
| 27,self_attn.o_proj,0.0000011557,0.10000,2.593 | |
| 27,mlp.gate_proj,0.0000558311,0.10000,5.508 | |
| 27,mlp.up_proj,0.0000533192,0.10000,5.549 | |
| 27,mlp.down_proj,0.0000048159,0.10000,20.034 | |
| 28,self_attn.v_proj,0.0000038522,0.10000,7.423 | |
| 28,self_attn.k_proj,0.0000050725,0.10000,7.430 | |
| 28,self_attn.q_proj,0.0000284028,0.10000,7.471 | |
| 28,self_attn.o_proj,0.0000008212,0.10000,2.508 | |
| 28,mlp.gate_proj,0.0000591885,0.10000,5.598 | |
| 28,mlp.up_proj,0.0000567845,0.10000,5.609 | |
| 28,mlp.down_proj,0.0000053186,0.10000,20.057 | |
| 29,self_attn.k_proj,0.0000064067,0.10000,7.384 | |
| 29,self_attn.v_proj,0.0000041839,0.10000,7.426 | |
| 29,self_attn.q_proj,0.0000344852,0.10000,7.449 | |
| 29,self_attn.o_proj,0.0000015276,0.10000,2.517 | |
| 29,mlp.gate_proj,0.0000628065,0.10000,5.568 | |
| 29,mlp.up_proj,0.0000601938,0.10000,5.595 | |
| 29,mlp.down_proj,0.0000058865,0.10000,20.104 | |
| 30,self_attn.k_proj,0.0000064688,0.10000,7.754 | |
| 30,self_attn.q_proj,0.0000371887,0.10000,7.756 | |
| 30,self_attn.v_proj,0.0000049764,0.10000,7.765 | |
| 30,self_attn.o_proj,0.0000015450,0.10000,2.404 | |
| 30,mlp.up_proj,0.0000653806,0.10000,5.545 | |
| 30,mlp.gate_proj,0.0000690351,0.10000,5.581 | |
| 30,mlp.down_proj,0.0000065568,0.10000,20.078 | |
| 31,self_attn.k_proj,0.0000070759,0.10000,7.724 | |
| 31,self_attn.q_proj,0.0000394085,0.10000,7.759 | |
| 31,self_attn.v_proj,0.0000053754,0.10000,7.767 | |
| 31,self_attn.o_proj,0.0000009338,0.10000,2.585 | |
| 31,mlp.gate_proj,0.0000753035,0.10000,5.494 | |
| 31,mlp.up_proj,0.0000711931,0.10000,5.530 | |
| 31,mlp.down_proj,0.0000069818,0.10000,20.274 | |
| 32,self_attn.v_proj,0.0000059810,0.10000,7.587 | |
| 32,self_attn.q_proj,0.0000434644,0.10000,7.588 | |
| 32,self_attn.k_proj,0.0000078275,0.10000,7.616 | |
| 32,self_attn.o_proj,0.0000010483,0.10000,2.458 | |
| 32,mlp.up_proj,0.0000749633,0.10000,5.628 | |
| 32,mlp.gate_proj,0.0000790766,0.10000,5.630 | |
| 32,mlp.down_proj,0.0000072754,0.10000,20.249 | |
| 33,self_attn.v_proj,0.0000066209,0.10000,7.498 | |
| 33,self_attn.q_proj,0.0000395162,0.10000,7.537 | |
| 33,self_attn.k_proj,0.0000073552,0.10000,7.581 | |
| 33,self_attn.o_proj,0.0000011010,0.10000,2.419 | |
| 33,mlp.gate_proj,0.0000852695,0.10000,5.594 | |
| 33,mlp.up_proj,0.0000796592,0.10000,5.625 | |
| 33,mlp.down_proj,0.0000077406,0.10000,20.136 | |
| 34,self_attn.q_proj,0.0000460895,0.10000,7.329 | |
| 34,self_attn.k_proj,0.0000082995,0.10000,7.340 | |
| 34,self_attn.v_proj,0.0000075391,0.10000,7.391 | |
| 34,self_attn.o_proj,0.0000009329,0.10000,2.431 | |
| 34,mlp.up_proj,0.0000834546,0.10000,5.472 | |
| 34,mlp.gate_proj,0.0000895576,0.10000,5.492 | |
| 34,mlp.down_proj,0.0000083580,0.10000,20.097 | |
| 35,self_attn.v_proj,0.0000084153,0.10000,7.585 | |
| 35,self_attn.k_proj,0.0000090009,0.10000,7.628 | |
| 35,self_attn.q_proj,0.0000499938,0.10000,7.654 | |
| 35,self_attn.o_proj,0.0000009079,0.10000,2.428 | |
| 35,mlp.gate_proj,0.0000921758,0.10000,5.490 | |
| 35,mlp.up_proj,0.0000864605,0.10000,5.519 | |
| 35,mlp.down_proj,0.0000088132,0.10000,19.626 | |
| 36,self_attn.q_proj,0.0000526127,0.10000,7.630 | |
| 36,self_attn.k_proj,0.0000094206,0.10000,7.694 | |
| 36,self_attn.v_proj,0.0000089374,0.10000,7.705 | |
| 36,self_attn.o_proj,0.0000009794,0.10000,2.413 | |
| 36,mlp.up_proj,0.0000885454,0.10000,5.427 | |
| 36,mlp.gate_proj,0.0000936940,0.10000,5.475 | |
| 36,mlp.down_proj,0.0000086765,0.10000,19.848 | |
| 37,self_attn.q_proj,0.0000496085,0.10000,7.540 | |
| 37,self_attn.v_proj,0.0000081068,0.10000,7.547 | |
| 37,self_attn.k_proj,0.0000091389,0.10000,7.619 | |
| 37,self_attn.o_proj,0.0000010597,0.10000,2.560 | |
| 37,mlp.gate_proj,0.0000958392,0.10000,5.445 | |
| 37,mlp.up_proj,0.0000912658,0.10000,5.472 | |
| 37,mlp.down_proj,0.0000090947,0.10000,20.611 | |
| 38,self_attn.k_proj,0.0000090218,0.10000,7.505 | |
| 38,self_attn.v_proj,0.0000073823,0.10000,7.552 | |
| 38,self_attn.q_proj,0.0000477760,0.10000,7.604 | |
| 38,self_attn.o_proj,0.0000014388,0.10000,2.607 | |
| 38,mlp.up_proj,0.0000948766,0.10000,5.630 | |
| 38,mlp.gate_proj,0.0000995957,0.10000,5.687 | |
| 38,mlp.down_proj,0.0000096539,0.10000,20.665 | |
| 39,self_attn.k_proj,0.0000087143,0.10000,7.783 | |
| 39,self_attn.q_proj,0.0000458466,0.10000,7.800 | |
| 39,self_attn.v_proj,0.0000074993,0.10000,7.811 | |
| 39,self_attn.o_proj,0.0000014284,0.10000,2.624 | |
| 39,mlp.up_proj,0.0000977051,0.10000,5.718 | |
| 39,mlp.gate_proj,0.0001019799,0.10000,5.770 | |
| 39,mlp.down_proj,0.0000102326,0.10000,19.818 | |
| 40,self_attn.v_proj,0.0000059555,0.10000,7.881 | |
| 40,self_attn.k_proj,0.0000087123,0.10000,7.925 | |
| 40,self_attn.q_proj,0.0000450318,0.10000,7.934 | |
| 40,self_attn.o_proj,0.0000020943,0.10000,2.582 | |
| 40,mlp.gate_proj,0.0001046877,0.10000,5.491 | |
| 40,mlp.up_proj,0.0001010661,0.10000,5.521 | |
| 40,mlp.down_proj,0.0000111093,0.10000,20.130 | |
| 41,self_attn.k_proj,0.0000077564,0.10000,7.585 | |
| 41,self_attn.q_proj,0.0000395478,0.10000,7.645 | |
| 41,self_attn.v_proj,0.0000056907,0.10000,7.680 | |
| 41,self_attn.o_proj,0.0000024193,0.10000,2.419 | |
| 41,mlp.gate_proj,0.0001104609,0.10000,5.402 | |
| 41,mlp.up_proj,0.0001064536,0.10000,5.456 | |
| 41,mlp.down_proj,0.0000118984,0.10000,19.579 | |
| 42,self_attn.v_proj,0.0000074538,0.10000,7.492 | |
| 42,self_attn.k_proj,0.0000095771,0.10000,7.502 | |
| 42,self_attn.q_proj,0.0000524778,0.10000,7.525 | |
| 42,self_attn.o_proj,0.0000018908,0.10000,2.619 | |
| 42,mlp.gate_proj,0.0001145551,0.10000,5.567 | |
| 42,mlp.up_proj,0.0001113127,0.10000,5.566 | |
| 42,mlp.down_proj,0.0000132569,0.10000,20.476 | |
| 43,self_attn.q_proj,0.0000501651,0.10000,7.568 | |
| 43,self_attn.v_proj,0.0000065721,0.10000,7.606 | |
| 43,self_attn.k_proj,0.0000095035,0.10000,7.619 | |
| 43,self_attn.o_proj,0.0000026974,0.10000,2.587 | |
| 43,mlp.up_proj,0.0001156213,0.10000,5.585 | |
| 43,mlp.gate_proj,0.0001179126,0.10000,5.625 | |
| 43,mlp.down_proj,0.0000145511,0.10000,19.655 | |
| 44,self_attn.q_proj,0.0000500651,0.10000,7.585 | |
| 44,self_attn.v_proj,0.0000060644,0.10000,7.658 | |
| 44,self_attn.k_proj,0.0000090329,0.10000,7.677 | |
| 44,self_attn.o_proj,0.0000037612,0.10000,2.363 | |
| 44,mlp.up_proj,0.0001199390,0.10000,5.507 | |
| 44,mlp.gate_proj,0.0001201581,0.10000,5.558 | |
| 44,mlp.down_proj,0.0000174651,0.10000,20.205 | |
| 45,self_attn.v_proj,0.0000055269,0.10000,7.593 | |
| 45,self_attn.k_proj,0.0000095479,0.10000,7.669 | |
| 45,self_attn.q_proj,0.0000536274,0.10000,7.683 | |
| 45,self_attn.o_proj,0.0000048709,0.10000,2.548 | |
| 45,mlp.gate_proj,0.0001239049,0.10000,5.614 | |
| 45,mlp.up_proj,0.0001248203,0.10000,5.634 | |
| 45,mlp.down_proj,0.0000265387,0.10000,21.339 | |
| 46,self_attn.q_proj,0.0000577298,0.10000,7.601 | |
| 46,self_attn.v_proj,0.0000062249,0.10000,7.651 | |
| 46,self_attn.k_proj,0.0000105807,0.10000,7.710 | |
| 46,self_attn.o_proj,0.0000069953,0.10000,2.625 | |
| 46,mlp.gate_proj,0.0001262403,0.10000,5.554 | |
| 46,mlp.up_proj,0.0001284073,0.10000,5.572 | |
| 46,mlp.down_proj,0.0000189336,0.10000,21.073 | |
| 47,self_attn.k_proj,0.0000103215,0.10000,7.466 | |
| 47,self_attn.v_proj,0.0000064657,0.10000,7.526 | |
| 47,self_attn.q_proj,0.0000582078,0.10000,7.530 | |
| 47,self_attn.o_proj,0.0000070828,0.10000,2.520 | |
| 47,mlp.up_proj,0.0001302019,0.10000,5.585 | |
| 47,mlp.gate_proj,0.0001264322,0.10000,5.606 | |
| 47,mlp.down_proj,0.0000211231,0.10000,19.826 | |
| 48,self_attn.v_proj,0.0000073132,0.10000,7.629 | |
| 48,self_attn.k_proj,0.0000100739,0.10000,7.651 | |
| 48,self_attn.q_proj,0.0000602635,0.10000,7.668 | |
| 48,self_attn.o_proj,0.0000066834,0.10000,2.617 | |
| 48,mlp.up_proj,0.0001370564,0.10000,5.643 | |
| 48,mlp.gate_proj,0.0001323712,0.10000,5.670 | |
| 48,mlp.down_proj,0.0000231647,0.10000,20.022 | |
| 49,self_attn.q_proj,0.0000569726,0.10000,7.467 | |
| 49,self_attn.v_proj,0.0000070089,0.10000,7.511 | |
| 49,self_attn.k_proj,0.0000100563,0.10000,7.537 | |
| 49,self_attn.o_proj,0.0000071273,0.10000,2.690 | |
| 49,mlp.up_proj,0.0001388069,0.10000,5.564 | |
| 49,mlp.gate_proj,0.0001327598,0.10000,5.582 | |
| 49,mlp.down_proj,0.0000246430,0.10000,19.679 | |
| 50,self_attn.q_proj,0.0000708722,0.10000,7.401 | |
| 50,self_attn.k_proj,0.0000120532,0.10000,7.458 | |
| 50,self_attn.v_proj,0.0000080716,0.10000,7.462 | |
| 50,self_attn.o_proj,0.0000095992,0.10000,2.383 | |
| 50,mlp.up_proj,0.0001378052,0.10000,5.517 | |
| 50,mlp.gate_proj,0.0001304732,0.10000,5.558 | |
| 50,mlp.down_proj,0.0000268720,0.10000,20.348 | |
| 51,self_attn.k_proj,0.0000109577,0.10000,7.866 | |
| 51,self_attn.v_proj,0.0000072120,0.10000,7.875 | |
| 51,self_attn.q_proj,0.0000636702,0.10000,7.904 | |
| 51,self_attn.o_proj,0.0000103356,0.10000,2.575 | |
| 51,mlp.up_proj,0.0001441162,0.10000,5.636 | |
| 51,mlp.gate_proj,0.0001368454,0.10000,5.663 | |
| 51,mlp.down_proj,0.0000291911,0.10000,20.058 | |
| 52,self_attn.v_proj,0.0000086795,0.10000,7.588 | |
| 52,self_attn.q_proj,0.0000600079,0.10000,7.639 | |
| 52,self_attn.k_proj,0.0000096980,0.10000,7.672 | |
| 52,self_attn.o_proj,0.0000113856,0.10000,2.588 | |
| 52,mlp.gate_proj,0.0001552775,0.10000,5.546 | |
| 52,mlp.up_proj,0.0001617526,0.10000,5.575 | |
| 52,mlp.down_proj,0.0000303653,0.10000,20.007 | |
| 53,self_attn.q_proj,0.0000668065,0.10000,7.781 | |
| 53,self_attn.k_proj,0.0000110160,0.10000,7.794 | |
| 53,self_attn.v_proj,0.0000094514,0.10000,7.818 | |
| 53,self_attn.o_proj,0.0000123101,0.10000,2.501 | |
| 53,mlp.gate_proj,0.0001672415,0.10000,5.509 | |
| 53,mlp.up_proj,0.0001727192,0.10000,5.577 | |
| 53,mlp.down_proj,0.0000324975,0.10000,20.614 | |
| 54,self_attn.v_proj,0.0000121689,0.10000,7.322 | |
| 54,self_attn.q_proj,0.0000711726,0.10000,7.385 | |
| 54,self_attn.k_proj,0.0000106064,0.10000,7.424 | |
| 54,self_attn.o_proj,0.0000111422,0.10000,2.662 | |
| 54,mlp.gate_proj,0.0001642088,0.10000,5.415 | |
| 54,mlp.up_proj,0.0001706440,0.10000,5.452 | |
| 54,mlp.down_proj,0.0000350907,0.10000,21.223 | |
| 55,self_attn.q_proj,0.0000691806,0.10000,7.747 | |
| 55,self_attn.v_proj,0.0000118824,0.10000,7.816 | |
| 55,self_attn.k_proj,0.0000102520,0.10000,7.824 | |
| 55,self_attn.o_proj,0.0000136196,0.10000,2.590 | |
| 55,mlp.gate_proj,0.0001693113,0.10000,5.730 | |
| 55,mlp.up_proj,0.0001763623,0.10000,5.749 | |
| 55,mlp.down_proj,0.0000408001,0.10000,20.976 | |
| 56,self_attn.k_proj,0.0000104374,0.10000,7.534 | |
| 56,self_attn.q_proj,0.0000656221,0.10000,7.610 | |
| 56,self_attn.v_proj,0.0000102865,0.10000,7.619 | |
| 56,self_attn.o_proj,0.0000172257,0.10000,2.578 | |
| 56,mlp.gate_proj,0.0001863374,0.10000,5.384 | |
| 56,mlp.up_proj,0.0001923496,0.10000,5.413 | |
| 56,mlp.down_proj,0.0000456986,0.10000,21.377 | |
| 57,self_attn.q_proj,0.0000698117,0.10000,7.628 | |
| 57,self_attn.k_proj,0.0000110748,0.10000,7.656 | |
| 57,self_attn.v_proj,0.0000117489,0.10000,7.666 | |
| 57,self_attn.o_proj,0.0000160523,0.10000,2.566 | |
| 57,mlp.up_proj,0.0001927503,0.10000,5.497 | |
| 57,mlp.gate_proj,0.0001861044,0.10000,5.499 | |
| 57,mlp.down_proj,0.0000500290,0.10000,22.042 | |
| 58,self_attn.k_proj,0.0000103453,0.10000,7.627 | |
| 58,self_attn.q_proj,0.0000693757,0.10000,7.687 | |
| 58,self_attn.v_proj,0.0000122293,0.10000,7.700 | |
| 58,self_attn.o_proj,0.0000205697,0.10000,2.705 | |
| 58,mlp.gate_proj,0.0001921572,0.10000,5.532 | |
| 58,mlp.up_proj,0.0001995629,0.10000,5.577 | |
| 58,mlp.down_proj,0.0000628824,0.10000,21.362 | |
| 59,self_attn.q_proj,0.0000682933,0.10000,7.780 | |
| 59,self_attn.v_proj,0.0000126599,0.10000,7.886 | |
| 59,self_attn.k_proj,0.0000103990,0.10000,7.895 | |
| 59,self_attn.o_proj,0.0000237298,0.10000,2.588 | |
| 59,mlp.up_proj,0.0002055769,0.10000,5.527 | |
| 59,mlp.gate_proj,0.0002024219,0.10000,5.565 | |
| 59,mlp.down_proj,0.0000747734,0.10000,21.180 | |
| 60,self_attn.q_proj,0.0000787734,0.10000,7.587 | |
| 60,self_attn.k_proj,0.0000112112,0.10000,7.644 | |
| 60,self_attn.v_proj,0.0000155765,0.10000,7.686 | |
| 60,self_attn.o_proj,0.0000187066,0.10000,2.490 | |
| 60,mlp.up_proj,0.0002466824,0.10000,5.516 | |
| 60,mlp.gate_proj,0.0002482997,0.10000,5.552 | |
| 60,mlp.down_proj,0.0000836316,0.10000,20.232 | |
| 61,self_attn.k_proj,0.0000113100,0.10000,7.703 | |
| 61,self_attn.q_proj,0.0000788874,0.10000,7.718 | |
| 61,self_attn.v_proj,0.0000166985,0.10000,7.729 | |
| 61,self_attn.o_proj,0.0000209697,0.10000,2.546 | |
| 61,mlp.gate_proj,0.0002714686,0.10000,5.520 | |
| 61,mlp.up_proj,0.0002681355,0.10000,5.558 | |
| 61,mlp.down_proj,0.0000946684,0.10000,20.082 | |
| 62,self_attn.v_proj,0.0000158675,0.10000,7.594 | |
| 62,self_attn.q_proj,0.0000809794,0.10000,7.610 | |
| 62,self_attn.k_proj,0.0000117794,0.10000,7.700 | |
| 62,self_attn.o_proj,0.0000217965,0.10000,2.392 | |
| 62,mlp.up_proj,0.0003033536,0.10000,5.619 | |
| 62,mlp.gate_proj,0.0003143894,0.10000,5.652 | |
| 62,mlp.down_proj,0.0001002527,0.10000,20.066 | |
| 63,self_attn.k_proj,0.0000116479,0.10000,7.401 | |
| 63,self_attn.v_proj,0.0000161500,0.10000,7.438 | |
| 63,self_attn.q_proj,0.0000789493,0.10000,7.486 | |
| 63,self_attn.o_proj,0.0000241157,0.10000,2.683 | |
| 63,mlp.gate_proj,0.0003314460,0.10000,5.515 | |
| 63,mlp.up_proj,0.0003226264,0.10000,5.557 | |
| 63,mlp.down_proj,0.0001205571,0.10000,19.858 | |
| 64,self_attn.q_proj,0.0000827995,0.10000,7.159 | |
| 64,self_attn.v_proj,0.0000162335,0.10000,7.237 | |
| 64,self_attn.k_proj,0.0000123475,0.10000,7.280 | |
| 64,self_attn.o_proj,0.0000250567,0.10000,2.711 | |
| 64,mlp.gate_proj,0.0003612445,0.10000,5.547 | |
| 64,mlp.up_proj,0.0003488006,0.10000,5.594 | |
| 64,mlp.down_proj,0.0001459270,0.10000,20.483 | |
| 65,self_attn.q_proj,0.0000846235,0.10000,7.763 | |
| 65,self_attn.v_proj,0.0000174364,0.10000,7.773 | |
| 65,self_attn.k_proj,0.0000126387,0.10000,7.783 | |
| 65,self_attn.o_proj,0.0000276419,0.10000,2.486 | |
| 65,mlp.gate_proj,0.0004038748,0.10000,5.586 | |
| 65,mlp.up_proj,0.0003911497,0.10000,5.639 | |
| 65,mlp.down_proj,0.0001679931,0.10000,21.395 | |
| 66,self_attn.q_proj,0.0000795299,0.10000,7.331 | |
| 66,self_attn.k_proj,0.0000111875,0.10000,7.429 | |
| 66,self_attn.v_proj,0.0000181991,0.10000,7.509 | |
| 66,self_attn.o_proj,0.0000254603,0.10000,2.643 | |
| 66,mlp.up_proj,0.0004548113,0.10000,5.494 | |
| 66,mlp.gate_proj,0.0004761389,0.10000,5.531 | |
| 66,mlp.down_proj,0.0001795034,0.10000,19.397 | |
| 67,self_attn.v_proj,0.0000208610,0.10000,7.683 | |
| 67,self_attn.q_proj,0.0000848699,0.10000,7.696 | |
| 67,self_attn.k_proj,0.0000119792,0.10000,7.725 | |
| 67,self_attn.o_proj,0.0000205163,0.10000,2.410 | |
| 67,mlp.up_proj,0.0004864768,0.10000,5.511 | |
| 67,mlp.gate_proj,0.0005036222,0.10000,5.545 | |
| 67,mlp.down_proj,0.0001952821,0.10000,19.801 | |
| 68,self_attn.k_proj,0.0000123669,0.10000,7.688 | |
| 68,self_attn.v_proj,0.0000238467,0.10000,7.690 | |
| 68,self_attn.q_proj,0.0000902852,0.10000,7.724 | |
| 68,self_attn.o_proj,0.0000248123,0.10000,2.404 | |
| 68,mlp.up_proj,0.0005289965,0.10000,5.485 | |
| 68,mlp.gate_proj,0.0005417064,0.10000,5.525 | |
| 68,mlp.down_proj,0.0002131409,0.10000,19.902 | |
| 69,self_attn.v_proj,0.0000202863,0.10000,7.588 | |
| 69,self_attn.k_proj,0.0000125554,0.10000,7.626 | |
| 69,self_attn.q_proj,0.0000876923,0.10000,7.636 | |
| 69,self_attn.o_proj,0.0000313533,0.10000,2.536 | |
| 69,mlp.gate_proj,0.0005753896,0.10000,5.672 | |
| 69,mlp.up_proj,0.0005724220,0.10000,5.698 | |
| 69,mlp.down_proj,0.0002522457,0.10000,20.550 | |
| 70,self_attn.q_proj,0.0000906051,0.10000,7.411 | |
| 70,self_attn.v_proj,0.0000272172,0.10000,7.521 | |
| 70,self_attn.k_proj,0.0000120387,0.10000,7.522 | |
| 70,self_attn.o_proj,0.0000402383,0.10000,2.457 | |
| 70,mlp.up_proj,0.0006517229,0.10000,5.642 | |
| 70,mlp.gate_proj,0.0006455610,0.10000,5.684 | |
| 70,mlp.down_proj,0.0003055418,0.10000,19.862 | |
| 71,self_attn.q_proj,0.0000930551,0.10000,7.603 | |
| 71,self_attn.v_proj,0.0000281192,0.10000,7.669 | |
| 71,self_attn.k_proj,0.0000125433,0.10000,7.726 | |
| 71,self_attn.o_proj,0.0000438307,0.10000,2.437 | |
| 71,mlp.up_proj,0.0007127374,0.10000,5.469 | |
| 71,mlp.gate_proj,0.0006954548,0.10000,5.494 | |
| 71,mlp.down_proj,0.0003597987,0.10000,19.980 | |
| 72,self_attn.q_proj,0.0000927018,0.10000,7.435 | |
| 72,self_attn.k_proj,0.0000116728,0.10000,7.489 | |
| 72,self_attn.v_proj,0.0000321309,0.10000,7.510 | |
| 72,self_attn.o_proj,0.0000462191,0.10000,2.635 | |
| 72,mlp.up_proj,0.0007812226,0.10000,5.585 | |
| 72,mlp.gate_proj,0.0007519810,0.10000,5.660 | |
| 72,mlp.down_proj,0.0004198793,0.10000,20.175 | |
| 73,self_attn.v_proj,0.0000375422,0.10000,7.585 | |
| 73,self_attn.k_proj,0.0000121011,0.10000,7.629 | |
| 73,self_attn.q_proj,0.0000952071,0.10000,7.643 | |
| 73,self_attn.o_proj,0.0000536777,0.10000,2.556 | |
| 73,mlp.gate_proj,0.0007917987,0.10000,5.591 | |
| 73,mlp.up_proj,0.0008330985,0.10000,5.611 | |
| 73,mlp.down_proj,0.0004890529,0.10000,19.851 | |
| 74,self_attn.k_proj,0.0000120178,0.10000,7.573 | |
| 74,self_attn.q_proj,0.0001013378,0.10000,7.678 | |
| 74,self_attn.v_proj,0.0000355574,0.10000,7.680 | |
| 74,self_attn.o_proj,0.0000542979,0.10000,2.617 | |
| 74,mlp.up_proj,0.0008737134,0.10000,5.618 | |
| 74,mlp.gate_proj,0.0008159181,0.10000,5.687 | |
| 74,mlp.down_proj,0.0005833126,0.10000,20.004 | |
| 75,self_attn.k_proj,0.0000116486,0.10000,7.028 | |
| 75,self_attn.q_proj,0.0000966183,0.10000,7.096 | |
| 75,self_attn.v_proj,0.0000404687,0.10000,7.178 | |
| 75,self_attn.o_proj,0.0000779568,0.10000,2.582 | |
| 75,mlp.gate_proj,0.0008736650,0.10000,5.671 | |
| 75,mlp.up_proj,0.0009480298,0.10000,5.685 | |
| 75,mlp.down_proj,0.0007020727,0.10000,20.006 | |
| 76,self_attn.q_proj,0.0001066564,0.10000,7.277 | |
| 76,self_attn.v_proj,0.0000635603,0.10000,7.317 | |
| 76,self_attn.k_proj,0.0000114564,0.10000,7.332 | |
| 76,self_attn.o_proj,0.0001143767,0.10000,2.440 | |
| 76,mlp.gate_proj,0.0009227967,0.10000,5.597 | |
| 76,mlp.up_proj,0.0010102869,0.10000,5.630 | |
| 76,mlp.down_proj,0.0009644486,0.10000,20.413 | |
| 77,self_attn.k_proj,0.0000107619,0.10000,7.470 | |
| 77,self_attn.v_proj,0.0000409660,0.10000,7.598 | |
| 77,self_attn.q_proj,0.0000962039,0.10000,7.605 | |
| 77,self_attn.o_proj,0.0001133945,0.10000,2.581 | |
| 77,mlp.gate_proj,0.0009674702,0.10000,5.547 | |
| 77,mlp.up_proj,0.0010632526,0.10000,5.576 | |
| 77,mlp.down_proj,0.0012206845,0.10000,20.999 | |
| 78,self_attn.k_proj,0.0000096184,0.10000,7.544 | |
| 78,self_attn.v_proj,0.0000409346,0.10000,7.564 | |
| 78,self_attn.q_proj,0.0000881543,0.10000,7.574 | |
| 78,self_attn.o_proj,0.0001534645,0.10000,2.566 | |
| 78,mlp.up_proj,0.0009482567,0.10000,5.460 | |
| 78,mlp.gate_proj,0.0008761560,0.10000,5.480 | |
| 78,mlp.down_proj,0.0030329266,0.10000,21.313 | |
| 79,self_attn.k_proj,0.0000072852,0.10000,7.797 | |
| 79,self_attn.q_proj,0.0000550956,0.10000,7.848 | |
| 79,self_attn.v_proj,0.0000130519,0.10000,7.859 | |
| 79,self_attn.o_proj,0.0000371522,0.10000,2.543 | |
| 79,mlp.gate_proj,0.0007860953,0.10000,5.503 | |
| 79,mlp.up_proj,0.0008234376,0.10000,5.540 | |
| 79,mlp.down_proj,0.0059871628,0.10000,21.447 | |