| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000000074,0.05000,4.076 | |
| 0,self_attn.q_proj,0.0000000206,0.05000,4.106 | |
| 0,self_attn.v_proj,0.0000000015,0.05000,4.122 | |
| 0,self_attn.o_proj,0.0000000157,0.05000,1.158 | |
| 0,mlp.up_proj,0.0000000114,0.05000,3.470 | |
| 0,mlp.gate_proj,0.0000000133,0.05000,3.490 | |
| 0,mlp.down_proj,0.0000000193,0.05000,3.869 | |
| 1,self_attn.q_proj,0.0000000006,0.05000,4.900 | |
| 1,self_attn.k_proj,0.0000000002,0.05000,4.926 | |
| 1,self_attn.v_proj,0.0000000001,0.05000,4.943 | |
| 1,self_attn.o_proj,0.0000000002,0.05000,1.201 | |
| 1,mlp.up_proj,0.0000000479,0.05000,3.198 | |
| 1,mlp.gate_proj,0.0000001445,0.05000,3.210 | |
| 1,mlp.down_proj,0.0000000009,0.05000,3.574 | |
| 2,self_attn.v_proj,0.0000000004,0.05000,4.326 | |
| 2,self_attn.q_proj,0.0000000029,0.05000,4.358 | |
| 2,self_attn.k_proj,0.0000000011,0.05000,4.433 | |
| 2,self_attn.o_proj,0.0000000015,0.05000,1.285 | |
| 2,mlp.gate_proj,0.0000002588,0.05000,3.458 | |
| 2,mlp.up_proj,0.0000001298,0.05000,3.476 | |
| 2,mlp.down_proj,0.0000000050,0.05000,3.544 | |
| 3,self_attn.k_proj,0.0000000071,0.05000,3.937 | |
| 3,self_attn.q_proj,0.0000000193,0.05000,3.959 | |
| 3,self_attn.v_proj,0.0000000026,0.05000,3.972 | |
| 3,self_attn.o_proj,0.0000000043,0.05000,1.206 | |
| 3,mlp.gate_proj,0.0000003206,0.05000,3.242 | |
| 3,mlp.up_proj,0.0000001479,0.05000,3.252 | |
| 3,mlp.down_proj,0.0000000121,0.05000,3.914 | |
| 4,self_attn.q_proj,0.0000000231,0.05000,4.343 | |
| 4,self_attn.v_proj,0.0000000033,0.05000,4.405 | |
| 4,self_attn.k_proj,0.0000000086,0.05000,4.416 | |
| 4,self_attn.o_proj,0.0000000077,0.05000,1.169 | |
| 4,mlp.up_proj,0.0000002798,0.05000,3.357 | |
| 4,mlp.gate_proj,0.0000005087,0.05000,3.379 | |
| 4,mlp.down_proj,0.0001496382,0.05000,3.528 | |
| 5,self_attn.k_proj,0.0000000318,0.05000,3.794 | |
| 5,self_attn.q_proj,0.0000001019,0.05000,3.870 | |
| 5,self_attn.v_proj,0.0000000151,0.05000,3.907 | |
| 5,self_attn.o_proj,0.0000000132,0.05000,1.150 | |
| 5,mlp.up_proj,0.0000004159,0.05000,2.522 | |
| 5,mlp.gate_proj,0.0000007649,0.05000,2.546 | |
| 5,mlp.down_proj,0.0000001460,0.05000,3.541 | |
| 6,self_attn.q_proj,0.0000001069,0.05000,3.811 | |
| 6,self_attn.k_proj,0.0000000310,0.05000,3.860 | |
| 6,self_attn.v_proj,0.0000000184,0.05000,3.866 | |
| 6,self_attn.o_proj,0.0000000110,0.05000,1.143 | |
| 6,mlp.up_proj,0.0000006236,0.05000,2.564 | |
| 6,mlp.gate_proj,0.0000011021,0.05000,2.570 | |
| 6,mlp.down_proj,0.0000001073,0.05000,3.539 | |
| 7,self_attn.k_proj,0.0000000430,0.05000,3.557 | |
| 7,self_attn.v_proj,0.0000000261,0.05000,3.639 | |
| 7,self_attn.q_proj,0.0000001502,0.05000,3.650 | |
| 7,self_attn.o_proj,0.0000000111,0.05000,1.151 | |
| 7,mlp.up_proj,0.0000007642,0.05000,2.499 | |
| 7,mlp.gate_proj,0.0000013492,0.05000,2.508 | |
| 7,mlp.down_proj,0.0000000492,0.05000,3.530 | |
| 8,self_attn.q_proj,0.0000001647,0.05000,3.726 | |
| 8,self_attn.k_proj,0.0000000498,0.05000,3.742 | |
| 8,self_attn.v_proj,0.0000000280,0.05000,3.749 | |
| 8,self_attn.o_proj,0.0000000091,0.05000,1.195 | |
| 8,mlp.gate_proj,0.0000008816,0.05000,2.494 | |
| 8,mlp.up_proj,0.0000005125,0.05000,2.498 | |
| 8,mlp.down_proj,0.0000000619,0.05000,3.521 | |
| 9,self_attn.k_proj,0.0000000422,0.05000,3.545 | |
| 9,self_attn.v_proj,0.0000000267,0.05000,3.561 | |
| 9,self_attn.q_proj,0.0000001460,0.05000,3.581 | |
| 9,self_attn.o_proj,0.0000000168,0.05000,1.141 | |
| 9,mlp.up_proj,0.0000003213,0.05000,2.513 | |
| 9,mlp.gate_proj,0.0000003591,0.05000,2.522 | |
| 9,mlp.down_proj,0.0000000803,0.05000,3.551 | |
| 10,self_attn.q_proj,0.0000002188,0.05000,3.755 | |
| 10,self_attn.k_proj,0.0000000617,0.05000,3.799 | |
| 10,self_attn.v_proj,0.0000000361,0.05000,3.813 | |
| 10,self_attn.o_proj,0.0000000154,0.05000,1.153 | |
| 10,mlp.up_proj,0.0000003657,0.05000,2.443 | |
| 10,mlp.gate_proj,0.0000004093,0.05000,2.448 | |
| 10,mlp.down_proj,0.0000000965,0.05000,3.616 | |
| 11,self_attn.k_proj,0.0000000474,0.05000,3.524 | |
| 11,self_attn.v_proj,0.0000000273,0.05000,3.604 | |
| 11,self_attn.q_proj,0.0000001692,0.05000,3.612 | |
| 11,self_attn.o_proj,0.0000000241,0.05000,1.142 | |
| 11,mlp.up_proj,0.0000004200,0.05000,2.538 | |
| 11,mlp.gate_proj,0.0000005279,0.05000,2.555 | |
| 11,mlp.down_proj,0.0000000851,0.05000,3.562 | |
| 12,self_attn.q_proj,0.0000002061,0.05000,3.418 | |
| 12,self_attn.v_proj,0.0000000328,0.05000,3.534 | |
| 12,self_attn.k_proj,0.0000000577,0.05000,3.571 | |
| 12,self_attn.o_proj,0.0000000278,0.05000,1.146 | |
| 12,mlp.gate_proj,0.0000004661,0.05000,2.530 | |
| 12,mlp.up_proj,0.0000004365,0.05000,2.534 | |
| 12,mlp.down_proj,0.0000001030,0.05000,3.555 | |
| 13,self_attn.q_proj,0.0000002177,0.05000,3.406 | |
| 13,self_attn.k_proj,0.0000000620,0.05000,3.407 | |
| 13,self_attn.v_proj,0.0000000392,0.05000,3.455 | |
| 13,self_attn.o_proj,0.0000000293,0.05000,1.144 | |
| 13,mlp.up_proj,0.0000004977,0.05000,2.513 | |
| 13,mlp.gate_proj,0.0000005316,0.05000,2.535 | |
| 13,mlp.down_proj,0.0000001189,0.05000,3.533 | |
| 14,self_attn.q_proj,0.0000002546,0.05000,3.494 | |
| 14,self_attn.v_proj,0.0000000387,0.05000,3.545 | |
| 14,self_attn.k_proj,0.0000000740,0.05000,3.582 | |
| 14,self_attn.o_proj,0.0000000303,0.05000,1.150 | |
| 14,mlp.up_proj,0.0000005113,0.05000,2.471 | |
| 14,mlp.gate_proj,0.0000005438,0.05000,2.477 | |
| 14,mlp.down_proj,0.0000001245,0.05000,3.503 | |
| 15,self_attn.k_proj,0.0000000593,0.05000,3.810 | |
| 15,self_attn.q_proj,0.0000002137,0.05000,3.904 | |
| 15,self_attn.v_proj,0.0000000407,0.05000,3.915 | |
| 15,self_attn.o_proj,0.0000000397,0.05000,1.140 | |
| 15,mlp.up_proj,0.0000005303,0.05000,2.377 | |
| 15,mlp.gate_proj,0.0000005843,0.05000,2.391 | |
| 15,mlp.down_proj,0.0000001302,0.05000,3.542 | |
| 16,self_attn.q_proj,0.0000002011,0.05000,3.929 | |
| 16,self_attn.v_proj,0.0000000299,0.05000,3.952 | |
| 16,self_attn.k_proj,0.0000000633,0.05000,3.954 | |
| 16,self_attn.o_proj,0.0000000320,0.05000,1.149 | |
| 16,mlp.gate_proj,0.0000005026,0.05000,2.592 | |
| 16,mlp.up_proj,0.0000004937,0.05000,2.598 | |
| 16,mlp.down_proj,0.0000001260,0.05000,3.540 | |
| 17,self_attn.k_proj,0.0000000676,0.05000,3.510 | |
| 17,self_attn.v_proj,0.0000000323,0.05000,3.521 | |
| 17,self_attn.q_proj,0.0000002323,0.05000,3.567 | |
| 17,self_attn.o_proj,0.0000000340,0.05000,1.144 | |
| 17,mlp.up_proj,0.0000004876,0.05000,2.553 | |
| 17,mlp.gate_proj,0.0000004806,0.05000,2.580 | |
| 17,mlp.down_proj,0.0000001191,0.05000,3.525 | |
| 18,self_attn.q_proj,0.0000002289,0.05000,4.095 | |
| 18,self_attn.v_proj,0.0000000371,0.05000,4.126 | |
| 18,self_attn.k_proj,0.0000000658,0.05000,4.139 | |
| 18,self_attn.o_proj,0.0000000409,0.05000,1.130 | |
| 18,mlp.gate_proj,0.0000004643,0.05000,2.561 | |
| 18,mlp.up_proj,0.0000004858,0.05000,2.569 | |
| 18,mlp.down_proj,0.0000001185,0.05000,3.517 | |
| 19,self_attn.q_proj,0.0000002764,0.05000,3.542 | |
| 19,self_attn.v_proj,0.0000000402,0.05000,3.615 | |
| 19,self_attn.k_proj,0.0000000741,0.05000,3.641 | |
| 19,self_attn.o_proj,0.0000000308,0.05000,1.134 | |
| 19,mlp.up_proj,0.0000005025,0.05000,2.549 | |
| 19,mlp.gate_proj,0.0000004797,0.05000,2.579 | |
| 19,mlp.down_proj,0.0000001231,0.05000,3.523 | |
| 20,self_attn.q_proj,0.0000002709,0.05000,3.825 | |
| 20,self_attn.v_proj,0.0000000383,0.05000,3.901 | |
| 20,self_attn.k_proj,0.0000000785,0.05000,3.915 | |
| 20,self_attn.o_proj,0.0000000425,0.05000,1.137 | |
| 20,mlp.gate_proj,0.0000004417,0.05000,2.506 | |
| 20,mlp.up_proj,0.0000004883,0.05000,2.505 | |
| 20,mlp.down_proj,0.0000001268,0.05000,3.520 | |
| 21,self_attn.k_proj,0.0000000683,0.05000,3.726 | |
| 21,self_attn.q_proj,0.0000002360,0.05000,3.801 | |
| 21,self_attn.v_proj,0.0000000327,0.05000,3.827 | |
| 21,self_attn.o_proj,0.0000000444,0.05000,1.143 | |
| 21,mlp.up_proj,0.0000004921,0.05000,2.515 | |
| 21,mlp.gate_proj,0.0000004432,0.05000,2.532 | |
| 21,mlp.down_proj,0.0000001214,0.05000,3.528 | |
| 22,self_attn.v_proj,0.0000000495,0.05000,3.738 | |
| 22,self_attn.k_proj,0.0000000745,0.05000,3.762 | |
| 22,self_attn.q_proj,0.0000002610,0.05000,3.799 | |
| 22,self_attn.o_proj,0.0000000528,0.05000,1.136 | |
| 22,mlp.up_proj,0.0000004986,0.05000,2.533 | |
| 22,mlp.gate_proj,0.0000004491,0.05000,2.540 | |
| 22,mlp.down_proj,0.0000001492,0.05000,3.513 | |
| 23,self_attn.k_proj,0.0000000683,0.05000,3.437 | |
| 23,self_attn.v_proj,0.0000000480,0.05000,3.463 | |
| 23,self_attn.q_proj,0.0000002551,0.05000,3.499 | |
| 23,self_attn.o_proj,0.0000000544,0.05000,1.134 | |
| 23,mlp.up_proj,0.0000005058,0.05000,2.529 | |
| 23,mlp.gate_proj,0.0000004802,0.05000,2.532 | |
| 23,mlp.down_proj,0.0000001372,0.05000,3.507 | |
| 24,self_attn.q_proj,0.0000002997,0.05000,3.422 | |
| 24,self_attn.k_proj,0.0000000956,0.05000,3.438 | |
| 24,self_attn.v_proj,0.0000000430,0.05000,3.493 | |
| 24,self_attn.o_proj,0.0000000590,0.05000,1.137 | |
| 24,mlp.gate_proj,0.0000004554,0.05000,2.581 | |
| 24,mlp.up_proj,0.0000004873,0.05000,2.587 | |
| 24,mlp.down_proj,0.0000001235,0.05000,3.525 | |
| 25,self_attn.k_proj,0.0000000914,0.05000,3.659 | |
| 25,self_attn.v_proj,0.0000000552,0.05000,3.760 | |
| 25,self_attn.q_proj,0.0000003244,0.05000,3.775 | |
| 25,self_attn.o_proj,0.0000000401,0.05000,1.152 | |
| 25,mlp.up_proj,0.0000004959,0.05000,2.504 | |
| 25,mlp.gate_proj,0.0000004476,0.05000,2.527 | |
| 25,mlp.down_proj,0.0000001325,0.05000,3.525 | |
| 26,self_attn.q_proj,0.0000002927,0.05000,3.843 | |
| 26,self_attn.v_proj,0.0000000365,0.05000,3.916 | |
| 26,self_attn.k_proj,0.0000000829,0.05000,3.932 | |
| 26,self_attn.o_proj,0.0000000480,0.05000,1.141 | |
| 26,mlp.gate_proj,0.0000004655,0.05000,2.653 | |
| 26,mlp.up_proj,0.0000005360,0.05000,2.661 | |
| 26,mlp.down_proj,0.0000001535,0.05000,3.544 | |
| 27,self_attn.k_proj,0.0000000845,0.05000,3.682 | |
| 27,self_attn.q_proj,0.0000002836,0.05000,3.766 | |
| 27,self_attn.v_proj,0.0000000448,0.05000,3.771 | |
| 27,self_attn.o_proj,0.0000000720,0.05000,1.142 | |
| 27,mlp.up_proj,0.0000005640,0.05000,2.558 | |
| 27,mlp.gate_proj,0.0000004908,0.05000,2.587 | |
| 27,mlp.down_proj,0.0000001856,0.05000,3.556 | |
| 28,self_attn.q_proj,0.0000002748,0.05000,3.603 | |
| 28,self_attn.v_proj,0.0000000634,0.05000,3.624 | |
| 28,self_attn.k_proj,0.0000000678,0.05000,3.634 | |
| 28,self_attn.o_proj,0.0000000759,0.05000,1.132 | |
| 28,mlp.gate_proj,0.0000004960,0.05000,2.536 | |
| 28,mlp.up_proj,0.0000005713,0.05000,2.547 | |
| 28,mlp.down_proj,0.0000002030,0.05000,3.496 | |
| 29,self_attn.q_proj,0.0000003218,0.05000,3.824 | |
| 29,self_attn.k_proj,0.0000000896,0.05000,3.852 | |
| 29,self_attn.v_proj,0.0000000643,0.05000,3.875 | |
| 29,self_attn.o_proj,0.0000000759,0.05000,1.173 | |
| 29,mlp.up_proj,0.0000005743,0.05000,2.581 | |
| 29,mlp.gate_proj,0.0000005014,0.05000,2.612 | |
| 29,mlp.down_proj,0.0000002231,0.05000,3.538 | |
| 30,self_attn.k_proj,0.0000000758,0.05000,3.898 | |
| 30,self_attn.v_proj,0.0000000699,0.05000,3.898 | |
| 30,self_attn.q_proj,0.0000002911,0.05000,3.909 | |
| 30,self_attn.o_proj,0.0000000963,0.05000,1.151 | |
| 30,mlp.gate_proj,0.0000005358,0.05000,2.578 | |
| 30,mlp.up_proj,0.0000006059,0.05000,2.588 | |
| 30,mlp.down_proj,0.0000002535,0.05000,3.543 | |
| 31,self_attn.k_proj,0.0000000760,0.05000,3.357 | |
| 31,self_attn.v_proj,0.0000000656,0.05000,3.472 | |
| 31,self_attn.q_proj,0.0000002968,0.05000,3.484 | |
| 31,self_attn.o_proj,0.0000000876,0.05000,1.145 | |
| 31,mlp.up_proj,0.0000006837,0.05000,2.533 | |
| 31,mlp.gate_proj,0.0000006198,0.05000,2.561 | |
| 31,mlp.down_proj,0.0000003191,0.05000,3.539 | |
| 32,self_attn.v_proj,0.0000000970,0.05000,3.365 | |
| 32,self_attn.k_proj,0.0000000867,0.05000,3.400 | |
| 32,self_attn.q_proj,0.0000003585,0.05000,3.454 | |
| 32,self_attn.o_proj,0.0000000881,0.05000,1.140 | |
| 32,mlp.up_proj,0.0000007260,0.05000,2.497 | |
| 32,mlp.gate_proj,0.0000006735,0.05000,2.508 | |
| 32,mlp.down_proj,0.0000003660,0.05000,3.544 | |
| 33,self_attn.q_proj,0.0000003616,0.05000,3.409 | |
| 33,self_attn.v_proj,0.0000000883,0.05000,3.419 | |
| 33,self_attn.k_proj,0.0000000866,0.05000,3.445 | |
| 33,self_attn.o_proj,0.0000001073,0.05000,1.146 | |
| 33,mlp.up_proj,0.0000008888,0.05000,2.491 | |
| 33,mlp.gate_proj,0.0000008382,0.05000,2.503 | |
| 33,mlp.down_proj,0.0000005407,0.05000,3.533 | |
| 34,self_attn.q_proj,0.0000004201,0.05000,4.001 | |
| 34,self_attn.v_proj,0.0000001121,0.05000,4.025 | |
| 34,self_attn.k_proj,0.0000000911,0.05000,4.040 | |
| 34,self_attn.o_proj,0.0000000971,0.05000,1.147 | |
| 34,mlp.gate_proj,0.0000010043,0.05000,2.583 | |
| 34,mlp.up_proj,0.0000010385,0.05000,2.590 | |
| 34,mlp.down_proj,0.0000006755,0.05000,3.535 | |
| 35,self_attn.k_proj,0.0000000967,0.05000,3.599 | |
| 35,self_attn.v_proj,0.0000001044,0.05000,3.693 | |
| 35,self_attn.q_proj,0.0000003993,0.05000,3.725 | |
| 35,self_attn.o_proj,0.0000001738,0.05000,1.149 | |
| 35,mlp.up_proj,0.0000011876,0.05000,2.531 | |
| 35,mlp.gate_proj,0.0000011666,0.05000,2.562 | |
| 35,mlp.down_proj,0.0000008386,0.05000,3.509 | |
| 36,self_attn.q_proj,0.0000004909,0.05000,3.529 | |
| 36,self_attn.v_proj,0.0000001891,0.05000,3.537 | |
| 36,self_attn.k_proj,0.0000001019,0.05000,3.595 | |
| 36,self_attn.o_proj,0.0000001320,0.05000,1.139 | |
| 36,mlp.up_proj,0.0000012988,0.05000,2.582 | |
| 36,mlp.gate_proj,0.0000012655,0.05000,2.586 | |
| 36,mlp.down_proj,0.0000010114,0.05000,3.563 | |
| 37,self_attn.k_proj,0.0000001170,0.05000,3.401 | |
| 37,self_attn.q_proj,0.0000005350,0.05000,3.436 | |
| 37,self_attn.v_proj,0.0000001738,0.05000,3.502 | |
| 37,self_attn.o_proj,0.0000001674,0.05000,1.149 | |
| 37,mlp.up_proj,0.0000014454,0.05000,2.447 | |
| 37,mlp.gate_proj,0.0000014013,0.05000,2.463 | |
| 37,mlp.down_proj,0.0000011469,0.05000,3.576 | |
| 38,self_attn.v_proj,0.0000001754,0.05000,3.757 | |
| 38,self_attn.k_proj,0.0000001155,0.05000,3.769 | |
| 38,self_attn.q_proj,0.0000005264,0.05000,3.782 | |
| 38,self_attn.o_proj,0.0000001730,0.05000,1.162 | |
| 38,mlp.up_proj,0.0000016110,0.05000,2.521 | |
| 38,mlp.gate_proj,0.0000015450,0.05000,2.527 | |
| 38,mlp.down_proj,0.0000013149,0.05000,3.546 | |
| 39,self_attn.k_proj,0.0000001116,0.05000,3.312 | |
| 39,self_attn.v_proj,0.0000001994,0.05000,3.365 | |
| 39,self_attn.q_proj,0.0000005239,0.05000,3.436 | |
| 39,self_attn.o_proj,0.0000002415,0.05000,1.161 | |
| 39,mlp.up_proj,0.0000017928,0.05000,2.457 | |
| 39,mlp.gate_proj,0.0000017018,0.05000,2.480 | |
| 39,mlp.down_proj,0.0000015803,0.05000,3.542 | |
| 40,self_attn.k_proj,0.0000001218,0.05000,3.695 | |
| 40,self_attn.v_proj,0.0000002551,0.05000,3.695 | |
| 40,self_attn.q_proj,0.0000005873,0.05000,3.705 | |
| 40,self_attn.o_proj,0.0000002292,0.05000,1.161 | |
| 40,mlp.up_proj,0.0000019417,0.05000,2.560 | |
| 40,mlp.gate_proj,0.0000018318,0.05000,2.565 | |
| 40,mlp.down_proj,0.0000018159,0.05000,3.546 | |
| 41,self_attn.k_proj,0.0000001183,0.05000,3.569 | |
| 41,self_attn.q_proj,0.0000005899,0.05000,3.615 | |
| 41,self_attn.v_proj,0.0000002547,0.05000,3.669 | |
| 41,self_attn.o_proj,0.0000001957,0.05000,1.160 | |
| 41,mlp.up_proj,0.0000020936,0.05000,2.531 | |
| 41,mlp.gate_proj,0.0000019421,0.05000,2.559 | |
| 41,mlp.down_proj,0.0000020503,0.05000,3.620 | |
| 42,self_attn.q_proj,0.0000006111,0.05000,4.035 | |
| 42,self_attn.k_proj,0.0000001178,0.05000,4.064 | |
| 42,self_attn.v_proj,0.0000002594,0.05000,4.076 | |
| 42,self_attn.o_proj,0.0000002111,0.05000,1.154 | |
| 42,mlp.up_proj,0.0000022532,0.05000,2.615 | |
| 42,mlp.gate_proj,0.0000020654,0.05000,2.621 | |
| 42,mlp.down_proj,0.0000024288,0.05000,3.587 | |
| 43,self_attn.k_proj,0.0000001174,0.05000,3.388 | |
| 43,self_attn.v_proj,0.0000004101,0.05000,3.428 | |
| 43,self_attn.q_proj,0.0000006248,0.05000,3.506 | |
| 43,self_attn.o_proj,0.0000003921,0.05000,1.144 | |
| 43,mlp.up_proj,0.0000024706,0.05000,2.569 | |
| 43,mlp.gate_proj,0.0000022215,0.05000,2.600 | |
| 43,mlp.down_proj,0.0000029538,0.05000,3.545 | |
| 44,self_attn.v_proj,0.0000004372,0.05000,3.535 | |
| 44,self_attn.q_proj,0.0000005866,0.05000,3.572 | |
| 44,self_attn.k_proj,0.0000001027,0.05000,3.589 | |
| 44,self_attn.o_proj,0.0000005251,0.05000,1.141 | |
| 44,mlp.gate_proj,0.0000023094,0.05000,2.631 | |
| 44,mlp.up_proj,0.0000026141,0.05000,2.639 | |
| 44,mlp.down_proj,0.0000044741,0.05000,3.559 | |
| 45,self_attn.k_proj,0.0000001031,0.05000,3.699 | |
| 45,self_attn.v_proj,0.0000005164,0.05000,3.829 | |
| 45,self_attn.q_proj,0.0000006073,0.05000,3.843 | |
| 45,self_attn.o_proj,0.0000005373,0.05000,1.156 | |
| 45,mlp.up_proj,0.0000027213,0.05000,2.508 | |
| 45,mlp.gate_proj,0.0000024398,0.05000,2.544 | |
| 45,mlp.down_proj,0.0000050870,0.05000,3.565 | |
| 46,self_attn.q_proj,0.0000005609,0.05000,4.140 | |
| 46,self_attn.k_proj,0.0000000954,0.05000,4.193 | |
| 46,self_attn.v_proj,0.0000005434,0.05000,4.204 | |
| 46,self_attn.o_proj,0.0000009439,0.05000,1.152 | |
| 46,mlp.up_proj,0.0000027407,0.05000,2.600 | |
| 46,mlp.gate_proj,0.0000025642,0.05000,2.607 | |
| 46,mlp.down_proj,0.0000072006,0.05000,3.551 | |
| 47,self_attn.k_proj,0.0000000795,0.05000,3.488 | |
| 47,self_attn.v_proj,0.0000002801,0.05000,3.552 | |
| 47,self_attn.q_proj,0.0000004749,0.05000,3.603 | |
| 47,self_attn.o_proj,0.0000004404,0.05000,1.152 | |
| 47,mlp.up_proj,0.0000028646,0.05000,2.518 | |
| 47,mlp.gate_proj,0.0000027463,0.05000,2.543 | |
| 47,mlp.down_proj,0.0000116770,0.05000,3.533 | |