| layer,module,loss,samples,damp,time | |
| 0,self_attn.v_proj,0.0000003655,0.05000,6.135 | |
| 0,self_attn.q_proj,0.0000139163,0.05000,6.251 | |
| 0,self_attn.k_proj,0.0000070522,0.05000,6.287 | |
| 0,self_attn.o_proj,0.0000000161,0.05000,1.438 | |
| 0,mlp.up_proj,0.0000059081,0.05000,3.042 | |
| 0,mlp.gate_proj,0.0000067841,0.05000,3.079 | |
| 0,mlp.down_proj,0.0000000707,0.05000,3.574 | |
| 1,self_attn.q_proj,0.0000158107,0.05000,6.250 | |
| 1,self_attn.k_proj,0.0000093271,0.05000,6.342 | |
| 1,self_attn.v_proj,0.0000009569,0.05000,6.403 | |
| 1,self_attn.o_proj,0.0000000717,0.05000,1.268 | |
| 1,mlp.gate_proj,0.0000085050,0.05000,2.909 | |
| 1,mlp.up_proj,0.0000074407,0.05000,2.938 | |
| 1,mlp.down_proj,0.0000020780,0.05000,3.624 | |
| 2,self_attn.v_proj,0.0000035664,0.05000,6.128 | |
| 2,self_attn.k_proj,0.0000384627,0.05000,6.183 | |
| 2,self_attn.q_proj,0.0000636528,0.05000,6.217 | |
| 2,self_attn.o_proj,0.0000000483,0.05000,1.279 | |
| 2,mlp.gate_proj,0.0000133714,0.05000,2.891 | |
| 2,mlp.up_proj,0.0000112456,0.05000,2.918 | |
| 2,mlp.down_proj,0.0000001836,0.05000,3.592 | |
| 3,self_attn.k_proj,0.0000209325,0.05000,6.104 | |
| 3,self_attn.q_proj,0.0000374590,0.05000,6.210 | |
| 3,self_attn.v_proj,0.0000032397,0.05000,6.243 | |
| 3,self_attn.o_proj,0.0000000519,0.05000,1.242 | |
| 3,mlp.gate_proj,0.0000199032,0.05000,2.985 | |
| 3,mlp.up_proj,0.0000147765,0.05000,3.037 | |
| 3,mlp.down_proj,0.0000002623,0.05000,3.622 | |
| 4,self_attn.k_proj,0.0000209495,0.05000,6.247 | |
| 4,self_attn.v_proj,0.0000035178,0.05000,6.307 | |
| 4,self_attn.q_proj,0.0000402571,0.05000,6.356 | |
| 4,self_attn.o_proj,0.0000001683,0.05000,1.296 | |
| 4,mlp.gate_proj,0.0000267916,0.05000,3.001 | |
| 4,mlp.up_proj,0.0000176318,0.05000,3.032 | |
| 4,mlp.down_proj,0.0000004458,0.05000,3.538 | |
| 5,self_attn.q_proj,0.0000566906,0.05000,6.143 | |
| 5,self_attn.k_proj,0.0000350725,0.05000,6.192 | |
| 5,self_attn.v_proj,0.0000035867,0.05000,6.259 | |
| 5,self_attn.o_proj,0.0000002498,0.05000,1.254 | |
| 5,mlp.up_proj,0.0000200849,0.05000,2.861 | |
| 5,mlp.gate_proj,0.0000287105,0.05000,2.907 | |
| 5,mlp.down_proj,0.0000006270,0.05000,3.494 | |
| 6,self_attn.q_proj,0.0000456653,0.05000,6.164 | |
| 6,self_attn.k_proj,0.0000243565,0.05000,6.213 | |
| 6,self_attn.v_proj,0.0000032720,0.05000,6.258 | |
| 6,self_attn.o_proj,0.0000002966,0.05000,1.271 | |
| 6,mlp.gate_proj,0.0000316156,0.05000,2.851 | |
| 6,mlp.up_proj,0.0000221315,0.05000,2.875 | |
| 6,mlp.down_proj,0.0000007019,0.05000,3.596 | |
| 7,self_attn.k_proj,0.0000232553,0.05000,6.241 | |
| 7,self_attn.q_proj,0.0000390834,0.05000,6.349 | |
| 7,self_attn.v_proj,0.0000030140,0.05000,6.364 | |
| 7,self_attn.o_proj,0.0000005020,0.05000,1.230 | |
| 7,mlp.gate_proj,0.0000300552,0.05000,2.820 | |
| 7,mlp.up_proj,0.0000227827,0.05000,2.857 | |
| 7,mlp.down_proj,0.0000007818,0.05000,3.548 | |
| 8,self_attn.k_proj,0.0000296915,0.05000,6.160 | |
| 8,self_attn.q_proj,0.0000489327,0.05000,6.220 | |
| 8,self_attn.v_proj,0.0000035765,0.05000,6.250 | |
| 8,self_attn.o_proj,0.0000005180,0.05000,1.287 | |
| 8,mlp.gate_proj,0.0000325682,0.05000,3.116 | |
| 8,mlp.up_proj,0.0000241525,0.05000,3.147 | |
| 8,mlp.down_proj,0.0000007777,0.05000,3.697 | |
| 9,self_attn.k_proj,0.0000279815,0.05000,6.365 | |
| 9,self_attn.q_proj,0.0000470294,0.05000,6.415 | |
| 9,self_attn.v_proj,0.0000045795,0.05000,6.444 | |
| 9,self_attn.o_proj,0.0000005254,0.05000,1.274 | |
| 9,mlp.gate_proj,0.0000318904,0.05000,3.054 | |
| 9,mlp.up_proj,0.0000243400,0.05000,3.097 | |
| 9,mlp.down_proj,0.0000007917,0.05000,3.662 | |
| 10,self_attn.v_proj,0.0000035862,0.05000,6.390 | |
| 10,self_attn.k_proj,0.0000299603,0.05000,6.439 | |
| 10,self_attn.q_proj,0.0000476768,0.05000,6.472 | |
| 10,self_attn.o_proj,0.0000006423,0.05000,1.260 | |
| 10,mlp.gate_proj,0.0000323488,0.05000,3.004 | |
| 10,mlp.up_proj,0.0000264711,0.05000,3.029 | |
| 10,mlp.down_proj,0.0000009133,0.05000,3.569 | |
| 11,self_attn.v_proj,0.0000042222,0.05000,6.385 | |
| 11,self_attn.q_proj,0.0000389616,0.05000,6.432 | |
| 11,self_attn.k_proj,0.0000221590,0.05000,6.478 | |
| 11,self_attn.o_proj,0.0000007108,0.05000,1.303 | |
| 11,mlp.gate_proj,0.0000346920,0.05000,3.147 | |
| 11,mlp.up_proj,0.0000293260,0.05000,3.189 | |
| 11,mlp.down_proj,0.0000010680,0.05000,3.578 | |
| 12,self_attn.v_proj,0.0000049074,0.05000,6.397 | |
| 12,self_attn.q_proj,0.0000599314,0.05000,6.425 | |
| 12,self_attn.k_proj,0.0000360839,0.05000,6.448 | |
| 12,self_attn.o_proj,0.0000008251,0.05000,1.306 | |
| 12,mlp.up_proj,0.0000314120,0.05000,3.121 | |
| 12,mlp.gate_proj,0.0000372577,0.05000,3.155 | |
| 12,mlp.down_proj,0.0000012126,0.05000,3.640 | |
| 13,self_attn.k_proj,0.0000389678,0.05000,6.532 | |
| 13,self_attn.q_proj,0.0000606843,0.05000,6.581 | |
| 13,self_attn.v_proj,0.0000056146,0.05000,6.603 | |
| 13,self_attn.o_proj,0.0000009978,0.05000,1.232 | |
| 13,mlp.gate_proj,0.0000445419,0.05000,3.054 | |
| 13,mlp.up_proj,0.0000351055,0.05000,3.085 | |
| 13,mlp.down_proj,0.0000015760,0.05000,3.608 | |
| 14,self_attn.q_proj,0.0000686343,0.05000,6.346 | |
| 14,self_attn.k_proj,0.0000314004,0.05000,6.429 | |
| 14,self_attn.v_proj,0.0000066387,0.05000,6.455 | |
| 14,self_attn.o_proj,0.0000012561,0.05000,1.325 | |
| 14,mlp.up_proj,0.0000375102,0.05000,2.993 | |
| 14,mlp.gate_proj,0.0000478461,0.05000,3.019 | |
| 14,mlp.down_proj,0.0000019180,0.05000,3.639 | |
| 15,self_attn.v_proj,0.0000065177,0.05000,6.382 | |
| 15,self_attn.q_proj,0.0000684232,0.05000,6.478 | |
| 15,self_attn.k_proj,0.0000357806,0.05000,6.490 | |
| 15,self_attn.o_proj,0.0000009062,0.05000,1.253 | |
| 15,mlp.up_proj,0.0000374816,0.05000,3.019 | |
| 15,mlp.gate_proj,0.0000510690,0.05000,3.046 | |
| 15,mlp.down_proj,0.0000019322,0.05000,3.550 | |
| 16,self_attn.q_proj,0.0000697884,0.05000,6.246 | |
| 16,self_attn.v_proj,0.0000073443,0.05000,6.299 | |
| 16,self_attn.k_proj,0.0000398958,0.05000,6.347 | |
| 16,self_attn.o_proj,0.0000005650,0.05000,1.274 | |
| 16,mlp.up_proj,0.0000372290,0.05000,3.057 | |
| 16,mlp.gate_proj,0.0000518827,0.05000,3.110 | |
| 16,mlp.down_proj,0.0000018123,0.05000,3.574 | |
| 17,self_attn.v_proj,0.0000071509,0.05000,6.345 | |
| 17,self_attn.k_proj,0.0000360828,0.05000,6.390 | |
| 17,self_attn.q_proj,0.0000662234,0.05000,6.422 | |
| 17,self_attn.o_proj,0.0000005764,0.05000,1.277 | |
| 17,mlp.gate_proj,0.0000540872,0.05000,3.071 | |
| 17,mlp.up_proj,0.0000382789,0.05000,3.121 | |
| 17,mlp.down_proj,0.0000019723,0.05000,3.628 | |
| 18,self_attn.q_proj,0.0000768960,0.05000,6.232 | |
| 18,self_attn.v_proj,0.0000090087,0.05000,6.312 | |
| 18,self_attn.k_proj,0.0000426919,0.05000,6.348 | |
| 18,self_attn.o_proj,0.0000005129,0.05000,1.306 | |
| 18,mlp.up_proj,0.0000403784,0.05000,3.084 | |
| 18,mlp.gate_proj,0.0000557208,0.05000,3.102 | |
| 18,mlp.down_proj,0.0000020153,0.05000,3.576 | |
| 19,self_attn.k_proj,0.0000391191,0.05000,6.414 | |
| 19,self_attn.q_proj,0.0000672697,0.05000,6.462 | |
| 19,self_attn.v_proj,0.0000086852,0.05000,6.490 | |
| 19,self_attn.o_proj,0.0000007129,0.05000,1.348 | |
| 19,mlp.up_proj,0.0000428687,0.05000,3.091 | |
| 19,mlp.gate_proj,0.0000584434,0.05000,3.129 | |
| 19,mlp.down_proj,0.0000024692,0.05000,3.558 | |
| 20,self_attn.v_proj,0.0000102000,0.05000,6.572 | |
| 20,self_attn.k_proj,0.0000419316,0.05000,6.646 | |
| 20,self_attn.q_proj,0.0000693657,0.05000,6.679 | |
| 20,self_attn.o_proj,0.0000005730,0.05000,1.440 | |
| 20,mlp.up_proj,0.0000435856,0.05000,3.067 | |
| 20,mlp.gate_proj,0.0000564082,0.05000,3.126 | |
| 20,mlp.down_proj,0.0000023884,0.05000,3.670 | |
| 21,self_attn.k_proj,0.0000410597,0.05000,6.395 | |
| 21,self_attn.v_proj,0.0000134331,0.05000,6.524 | |
| 21,self_attn.q_proj,0.0000694150,0.05000,6.547 | |
| 21,self_attn.o_proj,0.0000006532,0.05000,1.324 | |
| 21,mlp.gate_proj,0.0000595703,0.05000,3.093 | |
| 21,mlp.up_proj,0.0000455969,0.05000,3.126 | |
| 21,mlp.down_proj,0.0000025119,0.05000,3.593 | |
| 22,self_attn.k_proj,0.0000379314,0.05000,6.376 | |
| 22,self_attn.q_proj,0.0000656641,0.05000,6.415 | |
| 22,self_attn.v_proj,0.0000129559,0.05000,6.437 | |
| 22,self_attn.o_proj,0.0000006026,0.05000,1.297 | |
| 22,mlp.up_proj,0.0000487634,0.05000,3.087 | |
| 22,mlp.gate_proj,0.0000640544,0.05000,3.115 | |
| 22,mlp.down_proj,0.0000028967,0.05000,3.652 | |
| 23,self_attn.q_proj,0.0000680379,0.05000,6.571 | |
| 23,self_attn.v_proj,0.0000125475,0.05000,6.652 | |
| 23,self_attn.k_proj,0.0000421066,0.05000,6.674 | |
| 23,self_attn.o_proj,0.0000008360,0.05000,1.300 | |
| 23,mlp.gate_proj,0.0000771958,0.05000,3.051 | |
| 23,mlp.up_proj,0.0000553964,0.05000,3.084 | |
| 23,mlp.down_proj,0.0000037663,0.05000,3.648 | |
| 24,self_attn.q_proj,0.0000738199,0.05000,6.379 | |
| 24,self_attn.v_proj,0.0000189734,0.05000,6.423 | |
| 24,self_attn.k_proj,0.0000465050,0.05000,6.477 | |
| 24,self_attn.o_proj,0.0000014266,0.05000,1.281 | |
| 24,mlp.up_proj,0.0000596369,0.05000,3.043 | |
| 24,mlp.gate_proj,0.0000848039,0.05000,3.081 | |
| 24,mlp.down_proj,0.0000043019,0.05000,3.599 | |
| 25,self_attn.k_proj,0.0000343078,0.05000,6.722 | |
| 25,self_attn.q_proj,0.0000664509,0.05000,6.772 | |
| 25,self_attn.v_proj,0.0000153221,0.05000,6.806 | |
| 25,self_attn.o_proj,0.0000016806,0.05000,1.262 | |
| 25,mlp.gate_proj,0.0000898007,0.05000,3.004 | |
| 25,mlp.up_proj,0.0000626860,0.05000,3.051 | |
| 25,mlp.down_proj,0.0000053409,0.05000,3.695 | |
| 26,self_attn.v_proj,0.0000210691,0.05000,6.411 | |
| 26,self_attn.q_proj,0.0000636958,0.05000,6.472 | |
| 26,self_attn.k_proj,0.0000403479,0.05000,6.524 | |
| 26,self_attn.o_proj,0.0000014542,0.05000,1.290 | |
| 26,mlp.up_proj,0.0000650641,0.05000,3.043 | |
| 26,mlp.gate_proj,0.0000945761,0.05000,3.087 | |
| 26,mlp.down_proj,0.0000081644,0.05000,3.669 | |
| 27,self_attn.v_proj,0.0000141159,0.05000,6.830 | |
| 27,self_attn.k_proj,0.0000273797,0.05000,6.913 | |
| 27,self_attn.q_proj,0.0000486121,0.05000,6.940 | |
| 27,self_attn.o_proj,0.0000070236,0.05000,1.345 | |
| 27,mlp.gate_proj,0.0000950958,0.05000,3.230 | |
| 27,mlp.up_proj,0.0000753671,0.05000,3.255 | |
| 27,mlp.down_proj,0.0000416984,0.05000,3.798 | |