| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.00022096,0.01000,1.099 | |
| 0,self_attn.v_proj,0.00000229,0.01000,2.435 | |
| 0,self_attn.q_proj,0.00036210,0.01000,2.448 | |
| 0,self_attn.o_proj,0.00000175,0.01000,2.415 | |
| 0,mlp.up_proj,0.00150737,0.01000,1.416 | |
| 0,mlp.gate_proj,0.00142441,0.01000,0.274 | |
| 0,mlp.down_proj,0.00595958,0.01000,0.739 | |
| 1,self_attn.k_proj,0.00078274,0.01000,0.286 | |
| 1,self_attn.v_proj,0.00015115,0.01000,0.272 | |
| 1,self_attn.q_proj,0.00174118,0.01000,0.162 | |
| 1,self_attn.o_proj,0.00103411,0.01000,0.769 | |
| 1,mlp.up_proj,0.00179594,0.01000,1.660 | |
| 1,mlp.gate_proj,0.00228291,0.01000,0.973 | |
| 1,mlp.down_proj,0.00224895,0.01000,0.746 | |
| 2,self_attn.k_proj,0.00125878,0.01000,0.437 | |
| 2,self_attn.v_proj,0.00020735,0.01000,0.269 | |
| 2,self_attn.q_proj,0.00295782,0.01000,0.638 | |
| 2,self_attn.o_proj,0.00098028,0.01000,0.810 | |
| 2,mlp.up_proj,0.00240148,0.01000,0.318 | |
| 2,mlp.gate_proj,0.00286920,0.01000,0.260 | |
| 2,mlp.down_proj,0.00500130,0.01000,6.505 | |
| 3,self_attn.k_proj,0.00188067,0.01000,1.197 | |
| 3,self_attn.v_proj,0.00074529,0.01000,0.289 | |
| 3,self_attn.q_proj,0.00454102,0.01000,0.292 | |
| 3,self_attn.o_proj,0.00114469,0.01000,0.283 | |
| 3,mlp.up_proj,0.00272536,0.01000,0.309 | |
| 3,mlp.gate_proj,0.00309045,0.01000,0.279 | |
| 3,mlp.down_proj,0.00337280,0.01000,0.736 | |
| 4,self_attn.k_proj,0.00178011,0.01000,0.471 | |
| 4,self_attn.v_proj,0.00069859,0.01000,0.149 | |
| 4,self_attn.q_proj,0.00427734,0.01000,0.145 | |
| 4,self_attn.o_proj,0.00194755,0.01000,1.499 | |
| 4,mlp.up_proj,0.00357304,0.01000,0.308 | |
| 4,mlp.gate_proj,0.00408032,0.01000,0.289 | |
| 4,mlp.down_proj,0.00474062,0.01000,0.744 | |
| 5,self_attn.k_proj,0.00194141,0.01000,0.269 | |
| 5,self_attn.v_proj,0.00072606,0.01000,0.919 | |
| 5,self_attn.q_proj,0.00453751,0.01000,1.476 | |
| 5,self_attn.o_proj,0.00234540,0.01000,0.281 | |
| 5,mlp.up_proj,0.00409303,0.01000,0.266 | |
| 5,mlp.gate_proj,0.00449629,0.01000,0.596 | |
| 5,mlp.down_proj,0.00556781,0.01000,6.516 | |
| 6,self_attn.k_proj,0.00163071,0.01000,0.275 | |
| 6,self_attn.v_proj,0.00068974,0.01000,0.287 | |
| 6,self_attn.q_proj,0.00406556,0.01000,0.276 | |
| 6,self_attn.o_proj,0.00182722,0.01000,0.284 | |
| 6,mlp.up_proj,0.00438432,0.01000,0.273 | |
| 6,mlp.gate_proj,0.00448065,0.01000,0.271 | |
| 6,mlp.down_proj,0.00687783,0.01000,0.819 | |
| 7,self_attn.k_proj,0.00229149,0.01000,0.366 | |
| 7,self_attn.v_proj,0.00139370,0.01000,0.148 | |
| 7,self_attn.q_proj,0.00637256,0.01000,0.142 | |
| 7,self_attn.o_proj,0.00216803,0.01000,1.421 | |
| 7,mlp.up_proj,0.00479016,0.01000,0.280 | |
| 7,mlp.gate_proj,0.00473948,0.01000,0.287 | |
| 7,mlp.down_proj,0.00823352,0.01000,0.831 | |
| 8,self_attn.k_proj,0.00214538,0.01000,1.666 | |
| 8,self_attn.v_proj,0.00103131,0.01000,1.952 | |
| 8,self_attn.q_proj,0.00540090,0.01000,1.636 | |
| 8,self_attn.o_proj,0.00283757,0.01000,0.303 | |
| 8,mlp.up_proj,0.00546549,0.01000,0.274 | |
| 8,mlp.gate_proj,0.00495393,0.01000,0.275 | |
| 8,mlp.down_proj,0.01154038,0.01000,6.464 | |
| 9,self_attn.k_proj,0.00147208,0.01000,1.818 | |
| 9,self_attn.v_proj,0.00058141,0.01000,1.731 | |
| 9,self_attn.q_proj,0.00394661,0.01000,1.675 | |
| 9,self_attn.o_proj,0.00251221,0.01000,0.324 | |
| 9,mlp.up_proj,0.00595842,0.01000,0.347 | |
| 9,mlp.gate_proj,0.00489875,0.01000,0.343 | |
| 9,mlp.down_proj,0.01428184,0.01000,0.904 | |
| 10,self_attn.k_proj,0.00132155,0.01000,2.685 | |
| 10,self_attn.v_proj,0.00068617,0.01000,2.503 | |
| 10,self_attn.q_proj,0.00363028,0.01000,1.752 | |
| 10,self_attn.o_proj,0.00545926,0.01000,0.408 | |
| 10,mlp.up_proj,0.00611763,0.01000,1.632 | |
| 10,mlp.gate_proj,0.00474317,0.01000,1.328 | |
| 10,mlp.down_proj,0.01347071,0.01000,2.937 | |
| 11,self_attn.k_proj,0.00115821,0.01000,3.339 | |
| 11,self_attn.v_proj,0.00065106,0.01000,2.422 | |
| 11,self_attn.q_proj,0.00344706,0.01000,2.382 | |
| 11,self_attn.o_proj,0.00740811,0.01000,2.400 | |
| 11,mlp.up_proj,0.00620620,0.01000,2.718 | |
| 11,mlp.gate_proj,0.00449832,0.01000,2.710 | |
| 11,mlp.down_proj,0.27257532,0.01000,5.754 | |
| 12,self_attn.k_proj,0.00163961,0.01000,0.344 | |
| 12,self_attn.v_proj,0.00094356,0.01000,0.337 | |
| 12,self_attn.q_proj,0.00456318,0.01000,0.338 | |
| 12,self_attn.o_proj,0.00419531,0.01000,1.311 | |
| 12,mlp.up_proj,0.00565002,0.01000,0.279 | |
| 12,mlp.gate_proj,0.00445975,0.01000,1.091 | |
| 12,mlp.down_proj,0.01192240,0.01000,4.327 | |
| 13,self_attn.k_proj,0.00174242,0.01000,0.339 | |
| 13,self_attn.v_proj,0.00083272,0.01000,0.344 | |
| 13,self_attn.q_proj,0.00502530,0.01000,0.395 | |
| 13,self_attn.o_proj,0.00500150,0.01000,0.343 | |
| 13,mlp.up_proj,0.00570113,0.01000,1.926 | |
| 13,mlp.gate_proj,0.00524486,0.01000,1.750 | |
| 13,mlp.down_proj,0.01178209,0.01000,2.821 | |
| 14,self_attn.k_proj,0.00200629,0.01000,0.361 | |
| 14,self_attn.v_proj,0.00157519,0.01000,0.359 | |
| 14,self_attn.q_proj,0.00566488,0.01000,0.366 | |
| 14,self_attn.o_proj,0.00620107,0.01000,2.248 | |
| 14,mlp.up_proj,0.00577955,0.01000,4.655 | |
| 14,mlp.gate_proj,0.00547774,0.01000,5.042 | |
| 14,mlp.down_proj,0.01469438,0.01000,8.832 | |
| 15,self_attn.k_proj,0.00194205,0.01000,0.349 | |
| 15,self_attn.v_proj,0.00151308,0.01000,0.345 | |
| 15,self_attn.q_proj,0.00563300,0.01000,0.342 | |
| 15,self_attn.o_proj,0.00601548,0.01000,0.344 | |
| 15,mlp.up_proj,0.00601284,0.01000,0.342 | |
| 15,mlp.gate_proj,0.00594717,0.01000,0.336 | |
| 15,mlp.down_proj,0.01753610,0.01000,5.689 | |
| 16,self_attn.k_proj,0.00155090,0.01000,1.763 | |
| 16,self_attn.v_proj,0.00110804,0.01000,0.365 | |
| 16,self_attn.q_proj,0.00422240,0.01000,0.357 | |
| 16,self_attn.o_proj,0.00903260,0.01000,0.345 | |
| 16,mlp.up_proj,0.00553630,0.01000,1.181 | |
| 16,mlp.gate_proj,0.00532908,0.01000,1.499 | |
| 16,mlp.down_proj,0.01532181,0.01000,5.315 | |
| 17,self_attn.k_proj,0.00241632,0.01000,0.830 | |
| 17,self_attn.v_proj,0.00194845,0.01000,2.641 | |
| 17,self_attn.q_proj,0.00834111,0.01000,4.413 | |
| 17,self_attn.o_proj,0.01061929,0.01000,2.746 | |
| 17,mlp.up_proj,0.00562216,0.01000,2.742 | |
| 17,mlp.gate_proj,0.00506327,0.01000,1.101 | |
| 17,mlp.down_proj,0.01818097,0.01000,4.789 | |
| 18,self_attn.k_proj,0.00273163,0.01000,2.613 | |
| 18,self_attn.v_proj,0.00311299,0.01000,1.891 | |
| 18,self_attn.q_proj,0.00828936,0.01000,0.344 | |
| 18,self_attn.o_proj,0.00938506,0.01000,0.345 | |
| 18,mlp.up_proj,0.00625932,0.01000,0.344 | |
| 18,mlp.gate_proj,0.00583430,0.01000,0.339 | |
| 18,mlp.down_proj,0.03318551,0.01000,2.234 | |
| 19,self_attn.k_proj,0.00133622,0.01000,0.326 | |
| 19,self_attn.v_proj,0.00225405,0.01000,0.800 | |
| 19,self_attn.q_proj,0.00550781,0.01000,1.800 | |
| 19,self_attn.o_proj,0.01567704,0.01000,0.449 | |
| 19,mlp.up_proj,0.00725614,0.01000,2.903 | |
| 19,mlp.gate_proj,0.00687203,0.01000,2.471 | |
| 19,mlp.down_proj,0.03395692,0.01000,2.946 | |
| 20,self_attn.k_proj,0.00182818,0.01000,0.388 | |
| 20,self_attn.v_proj,0.00369986,0.01000,1.045 | |
| 20,self_attn.q_proj,0.00668970,0.01000,3.772 | |
| 20,self_attn.o_proj,0.01447436,0.01000,3.580 | |
| 20,mlp.up_proj,0.00868652,0.01000,2.710 | |
| 20,mlp.gate_proj,0.00763109,0.01000,1.037 | |
| 20,mlp.down_proj,0.06614500,0.01000,3.153 | |
| 21,self_attn.k_proj,0.00169165,0.01000,0.353 | |
| 21,self_attn.v_proj,0.00278996,0.01000,1.556 | |
| 21,self_attn.q_proj,0.00603606,0.01000,2.608 | |
| 21,self_attn.o_proj,0.01160419,0.01000,2.633 | |
| 21,mlp.up_proj,0.00941546,0.01000,2.761 | |
| 21,mlp.gate_proj,0.00857336,0.01000,1.637 | |
| 21,mlp.down_proj,0.05236044,0.01000,3.023 | |
| 22,self_attn.k_proj,0.00173458,0.01000,0.340 | |
| 22,self_attn.v_proj,0.00304587,0.01000,0.335 | |
| 22,self_attn.q_proj,0.00609978,0.01000,1.500 | |
| 22,self_attn.o_proj,0.01699413,0.01000,0.329 | |
| 22,mlp.up_proj,0.01043702,0.01000,3.157 | |
| 22,mlp.gate_proj,0.00901166,0.01000,2.403 | |
| 22,mlp.down_proj,0.08635419,0.01000,2.277 | |
| 23,self_attn.k_proj,0.00235798,0.01000,2.724 | |
| 23,self_attn.v_proj,0.00853371,0.01000,2.700 | |
| 23,self_attn.q_proj,0.00731025,0.01000,2.679 | |
| 23,self_attn.o_proj,0.04595792,0.01000,0.347 | |
| 23,mlp.up_proj,0.01267573,0.01000,1.922 | |
| 23,mlp.gate_proj,0.00977481,0.01000,1.572 | |
| 23,mlp.down_proj,0.09878369,0.01000,1.992 | |
| 24,self_attn.k_proj,0.00193833,0.01000,0.352 | |
| 24,self_attn.v_proj,0.00926276,0.01000,0.343 | |
| 24,self_attn.q_proj,0.00732911,0.01000,0.354 | |
| 24,self_attn.o_proj,0.02490180,0.01000,0.294 | |
| 24,mlp.up_proj,0.01275103,0.01000,3.643 | |
| 24,mlp.gate_proj,0.00968059,0.01000,4.339 | |
| 24,mlp.down_proj,0.13135986,0.01000,6.748 | |
| 25,self_attn.k_proj,0.00188807,0.01000,1.592 | |
| 25,self_attn.v_proj,0.00410724,0.01000,1.087 | |
| 25,self_attn.q_proj,0.00648702,0.01000,0.338 | |
| 25,self_attn.o_proj,0.01829978,0.01000,1.828 | |
| 25,mlp.up_proj,0.01323432,0.01000,0.353 | |
| 25,mlp.gate_proj,0.01043347,0.01000,0.343 | |
| 25,mlp.down_proj,0.10982227,0.01000,6.597 | |
| 26,self_attn.k_proj,0.00186195,0.01000,3.885 | |
| 26,self_attn.v_proj,0.00593649,0.01000,2.686 | |
| 26,self_attn.q_proj,0.00663982,0.01000,0.818 | |
| 26,self_attn.o_proj,0.02385299,0.01000,0.346 | |
| 26,mlp.up_proj,0.01519259,0.01000,0.357 | |
| 26,mlp.gate_proj,0.01179895,0.01000,0.383 | |
| 26,mlp.down_proj,0.16240232,0.01000,2.805 | |
| 27,self_attn.k_proj,0.00188216,0.01000,0.753 | |
| 27,self_attn.v_proj,0.00480582,0.01000,2.568 | |
| 27,self_attn.q_proj,0.00687713,0.01000,3.243 | |
| 27,self_attn.o_proj,0.03130198,0.01000,1.944 | |
| 27,mlp.up_proj,0.01527163,0.01000,0.361 | |
| 27,mlp.gate_proj,0.01144433,0.01000,0.350 | |
| 27,mlp.down_proj,0.20937583,0.01000,6.981 | |
| 28,self_attn.k_proj,0.00163398,0.01000,2.274 | |
| 28,self_attn.v_proj,0.00619308,0.01000,0.347 | |
| 28,self_attn.q_proj,0.00561940,0.01000,1.200 | |
| 28,self_attn.o_proj,0.02704479,0.01000,0.391 | |
| 28,mlp.up_proj,0.01647252,0.01000,0.362 | |
| 28,mlp.gate_proj,0.01167521,0.01000,0.348 | |
| 28,mlp.down_proj,3.19434714,0.01000,7.166 | |
| 29,self_attn.k_proj,0.00153822,0.01000,1.574 | |
| 29,self_attn.v_proj,0.00717453,0.01000,0.978 | |
| 29,self_attn.q_proj,0.00649254,0.01000,1.795 | |
| 29,self_attn.o_proj,0.06275121,0.01000,0.949 | |
| 29,mlp.up_proj,0.02440672,0.01000,2.122 | |
| 29,mlp.gate_proj,0.01807862,0.01000,0.632 | |
| 29,mlp.down_proj,0.86159390,0.01000,0.909 | |