| layer,module,loss,samples,damp,time | |
| 0,self_attn.v_proj,0.0000002875,0.05000,6.079 | |
| 0,self_attn.q_proj,0.0000129580,0.05000,6.072 | |
| 0,self_attn.k_proj,0.0000065541,0.05000,6.166 | |
| 0,self_attn.o_proj,0.0000000108,0.05000,1.322 | |
| 0,mlp.up_proj,0.0000042795,0.05000,2.767 | |
| 0,mlp.gate_proj,0.0000049425,0.05000,2.827 | |
| 0,mlp.down_proj,0.0000000314,0.05000,3.129 | |
| 1,self_attn.v_proj,0.0000006689,0.05000,5.451 | |
| 1,self_attn.q_proj,0.0000126307,0.05000,5.730 | |
| 1,self_attn.k_proj,0.0000075396,0.05000,5.728 | |
| 1,self_attn.o_proj,0.0000000542,0.05000,1.178 | |
| 1,mlp.up_proj,0.0000047425,0.05000,3.081 | |
| 1,mlp.gate_proj,0.0000054370,0.05000,3.112 | |
| 1,mlp.down_proj,0.0000014180,0.05000,3.606 | |
| 2,self_attn.q_proj,0.0000451748,0.05000,5.432 | |
| 2,self_attn.v_proj,0.0000023224,0.05000,5.532 | |
| 2,self_attn.k_proj,0.0000278147,0.05000,5.595 | |
| 2,self_attn.o_proj,0.0000000395,0.05000,1.582 | |
| 2,mlp.gate_proj,0.0000069938,0.05000,3.056 | |
| 2,mlp.up_proj,0.0000058359,0.05000,3.076 | |
| 2,mlp.down_proj,0.0000000593,0.05000,3.429 | |
| 3,self_attn.k_proj,0.0000122990,0.05000,5.539 | |
| 3,self_attn.q_proj,0.0000217445,0.05000,5.617 | |
| 3,self_attn.v_proj,0.0000017581,0.05000,5.651 | |
| 3,self_attn.o_proj,0.0000000203,0.05000,1.148 | |
| 3,mlp.up_proj,0.0000073834,0.05000,2.965 | |
| 3,mlp.gate_proj,0.0000100123,0.05000,3.005 | |
| 3,mlp.down_proj,0.0000000824,0.05000,3.236 | |
| 4,self_attn.v_proj,0.0000018723,0.05000,5.579 | |
| 4,self_attn.q_proj,0.0000233329,0.05000,5.656 | |
| 4,self_attn.k_proj,0.0000122032,0.05000,5.675 | |
| 4,self_attn.o_proj,0.0000000633,0.05000,1.160 | |
| 4,mlp.gate_proj,0.0000134069,0.05000,2.868 | |
| 4,mlp.up_proj,0.0000087210,0.05000,2.888 | |
| 4,mlp.down_proj,0.0000001386,0.05000,3.249 | |
| 5,self_attn.q_proj,0.0000320827,0.05000,5.716 | |
| 5,self_attn.v_proj,0.0000018635,0.05000,5.766 | |
| 5,self_attn.k_proj,0.0000201049,0.05000,5.805 | |
| 5,self_attn.o_proj,0.0000000861,0.05000,1.145 | |
| 5,mlp.up_proj,0.0000098045,0.05000,2.898 | |
| 5,mlp.gate_proj,0.0000141574,0.05000,2.948 | |
| 5,mlp.down_proj,0.0000001802,0.05000,3.211 | |
| 6,self_attn.v_proj,0.0000016420,0.05000,5.570 | |
| 6,self_attn.k_proj,0.0000132601,0.05000,5.575 | |
| 6,self_attn.q_proj,0.0000247839,0.05000,5.591 | |
| 6,self_attn.o_proj,0.0000001096,0.05000,1.109 | |
| 6,mlp.up_proj,0.0000105212,0.05000,2.988 | |
| 6,mlp.gate_proj,0.0000152134,0.05000,3.020 | |
| 6,mlp.down_proj,0.0000002012,0.05000,3.370 | |
| 7,self_attn.k_proj,0.0000120739,0.05000,5.535 | |
| 7,self_attn.v_proj,0.0000014840,0.05000,5.605 | |
| 7,self_attn.q_proj,0.0000204857,0.05000,5.640 | |
| 7,self_attn.o_proj,0.0000002358,0.05000,1.129 | |
| 7,mlp.gate_proj,0.0000128394,0.05000,3.091 | |
| 7,mlp.up_proj,0.0000096388,0.05000,3.129 | |
| 7,mlp.down_proj,0.0000002028,0.05000,3.140 | |
| 8,self_attn.v_proj,0.0000015355,0.05000,5.690 | |
| 8,self_attn.k_proj,0.0000140590,0.05000,5.747 | |
| 8,self_attn.q_proj,0.0000230355,0.05000,5.764 | |
| 8,self_attn.o_proj,0.0000001701,0.05000,1.138 | |
| 8,mlp.up_proj,0.0000097746,0.05000,2.718 | |
| 8,mlp.gate_proj,0.0000133103,0.05000,2.764 | |
| 8,mlp.down_proj,0.0000001912,0.05000,3.235 | |
| 9,self_attn.k_proj,0.0000125890,0.05000,5.656 | |
| 9,self_attn.v_proj,0.0000019354,0.05000,5.697 | |
| 9,self_attn.q_proj,0.0000210542,0.05000,5.709 | |
| 9,self_attn.o_proj,0.0000001880,0.05000,1.125 | |
| 9,mlp.gate_proj,0.0000120921,0.05000,2.345 | |
| 9,mlp.up_proj,0.0000091294,0.05000,2.378 | |
| 9,mlp.down_proj,0.0000001759,0.05000,3.018 | |
| 10,self_attn.k_proj,0.0000123705,0.05000,5.145 | |
| 10,self_attn.q_proj,0.0000194175,0.05000,5.205 | |
| 10,self_attn.v_proj,0.0000013578,0.05000,5.219 | |
| 10,self_attn.o_proj,0.0000001988,0.05000,1.069 | |
| 10,mlp.up_proj,0.0000093869,0.05000,2.431 | |
| 10,mlp.gate_proj,0.0000116347,0.05000,2.435 | |
| 10,mlp.down_proj,0.0000001812,0.05000,3.010 | |
| 11,self_attn.k_proj,0.0000083764,0.05000,5.029 | |
| 11,self_attn.v_proj,0.0000015281,0.05000,5.087 | |
| 11,self_attn.q_proj,0.0000145726,0.05000,5.109 | |
| 11,self_attn.o_proj,0.0000002144,0.05000,1.055 | |
| 11,mlp.gate_proj,0.0000117093,0.05000,2.358 | |
| 11,mlp.up_proj,0.0000097968,0.05000,2.368 | |
| 11,mlp.down_proj,0.0000001988,0.05000,3.045 | |
| 12,self_attn.k_proj,0.0000136289,0.05000,5.094 | |
| 12,self_attn.v_proj,0.0000016965,0.05000,5.144 | |
| 12,self_attn.q_proj,0.0000224206,0.05000,5.161 | |
| 12,self_attn.o_proj,0.0000002437,0.05000,1.047 | |
| 12,mlp.gate_proj,0.0000121265,0.05000,2.366 | |
| 12,mlp.up_proj,0.0000100321,0.05000,2.385 | |
| 12,mlp.down_proj,0.0000002146,0.05000,3.073 | |
| 13,self_attn.v_proj,0.0000018654,0.05000,5.003 | |
| 13,self_attn.q_proj,0.0000215060,0.05000,5.062 | |
| 13,self_attn.k_proj,0.0000140466,0.05000,5.070 | |
| 13,self_attn.o_proj,0.0000002475,0.05000,1.040 | |
| 13,mlp.gate_proj,0.0000145311,0.05000,2.448 | |
| 13,mlp.up_proj,0.0000111055,0.05000,2.464 | |
| 13,mlp.down_proj,0.0000002871,0.05000,2.965 | |
| 14,self_attn.q_proj,0.0000244416,0.05000,4.975 | |
| 14,self_attn.k_proj,0.0000109761,0.05000,5.087 | |
| 14,self_attn.v_proj,0.0000021334,0.05000,5.103 | |
| 14,self_attn.o_proj,0.0000004272,0.05000,1.061 | |
| 14,mlp.gate_proj,0.0000144053,0.05000,2.369 | |
| 14,mlp.up_proj,0.0000109751,0.05000,2.391 | |
| 14,mlp.down_proj,0.0000002757,0.05000,3.033 | |
| 15,self_attn.v_proj,0.0000019140,0.05000,5.057 | |
| 15,self_attn.k_proj,0.0000115560,0.05000,5.108 | |
| 15,self_attn.q_proj,0.0000219541,0.05000,5.133 | |
| 15,self_attn.o_proj,0.0000003740,0.05000,1.044 | |
| 15,mlp.gate_proj,0.0000141731,0.05000,2.447 | |
| 15,mlp.up_proj,0.0000101552,0.05000,2.471 | |
| 15,mlp.down_proj,0.0000002539,0.05000,3.024 | |
| 16,self_attn.q_proj,0.0000201770,0.05000,4.931 | |
| 16,self_attn.v_proj,0.0000019840,0.05000,5.031 | |
| 16,self_attn.k_proj,0.0000116480,0.05000,5.075 | |
| 16,self_attn.o_proj,0.0000002044,0.05000,1.058 | |
| 16,mlp.gate_proj,0.0000144537,0.05000,2.390 | |
| 16,mlp.up_proj,0.0000101879,0.05000,2.410 | |
| 16,mlp.down_proj,0.0000002548,0.05000,3.036 | |
| 17,self_attn.v_proj,0.0000019457,0.05000,5.025 | |
| 17,self_attn.k_proj,0.0000103892,0.05000,5.091 | |
| 17,self_attn.q_proj,0.0000190087,0.05000,5.127 | |
| 17,self_attn.o_proj,0.0000001803,0.05000,1.055 | |
| 17,mlp.up_proj,0.0000105910,0.05000,2.332 | |
| 17,mlp.gate_proj,0.0000151940,0.05000,2.350 | |
| 17,mlp.down_proj,0.0000002681,0.05000,3.039 | |
| 18,self_attn.k_proj,0.0000125478,0.05000,5.233 | |
| 18,self_attn.q_proj,0.0000225686,0.05000,5.229 | |
| 18,self_attn.v_proj,0.0000024447,0.05000,5.291 | |
| 18,self_attn.o_proj,0.0000000928,0.05000,1.089 | |
| 18,mlp.up_proj,0.0000113110,0.05000,2.333 | |
| 18,mlp.gate_proj,0.0000158267,0.05000,2.352 | |
| 18,mlp.down_proj,0.0000002841,0.05000,3.043 | |
| 19,self_attn.v_proj,0.0000024250,0.05000,5.080 | |
| 19,self_attn.q_proj,0.0000203657,0.05000,5.166 | |
| 19,self_attn.k_proj,0.0000117773,0.05000,5.181 | |
| 19,self_attn.o_proj,0.0000001395,0.05000,1.059 | |
| 19,mlp.up_proj,0.0000118265,0.05000,2.313 | |
| 19,mlp.gate_proj,0.0000163829,0.05000,2.330 | |
| 19,mlp.down_proj,0.0000003390,0.05000,3.025 | |
| 20,self_attn.k_proj,0.0000131098,0.05000,5.081 | |
| 20,self_attn.q_proj,0.0000216605,0.05000,5.130 | |
| 20,self_attn.v_proj,0.0000028895,0.05000,5.157 | |
| 20,self_attn.o_proj,0.0000000723,0.05000,1.023 | |
| 20,mlp.up_proj,0.0000114745,0.05000,2.554 | |
| 20,mlp.gate_proj,0.0000150741,0.05000,2.556 | |
| 20,mlp.down_proj,0.0000002896,0.05000,3.027 | |
| 21,self_attn.v_proj,0.0000038318,0.05000,5.045 | |
| 21,self_attn.k_proj,0.0000127311,0.05000,5.085 | |
| 21,self_attn.q_proj,0.0000215379,0.05000,5.122 | |
| 21,self_attn.o_proj,0.0000000909,0.05000,1.051 | |
| 21,mlp.up_proj,0.0000113903,0.05000,2.481 | |
| 21,mlp.gate_proj,0.0000150505,0.05000,2.496 | |
| 21,mlp.down_proj,0.0000002896,0.05000,3.067 | |
| 22,self_attn.v_proj,0.0000036099,0.05000,5.172 | |
| 22,self_attn.k_proj,0.0000112382,0.05000,5.192 | |
| 22,self_attn.q_proj,0.0000197390,0.05000,5.234 | |
| 22,self_attn.o_proj,0.0000000599,0.05000,1.053 | |
| 22,mlp.gate_proj,0.0000153890,0.05000,2.339 | |
| 22,mlp.up_proj,0.0000115268,0.05000,2.361 | |
| 22,mlp.down_proj,0.0000003044,0.05000,3.107 | |
| 23,self_attn.k_proj,0.0000127207,0.05000,5.052 | |
| 23,self_attn.v_proj,0.0000033499,0.05000,5.106 | |
| 23,self_attn.q_proj,0.0000205526,0.05000,5.127 | |
| 23,self_attn.o_proj,0.0000000568,0.05000,1.063 | |
| 23,mlp.up_proj,0.0000131494,0.05000,2.542 | |
| 23,mlp.gate_proj,0.0000187574,0.05000,2.560 | |
| 23,mlp.down_proj,0.0000004297,0.05000,3.052 | |
| 24,self_attn.v_proj,0.0000050478,0.05000,5.095 | |
| 24,self_attn.k_proj,0.0000132556,0.05000,5.190 | |
| 24,self_attn.q_proj,0.0000210217,0.05000,5.220 | |
| 24,self_attn.o_proj,0.0000002743,0.05000,1.064 | |
| 24,mlp.gate_proj,0.0000177907,0.05000,2.397 | |
| 24,mlp.up_proj,0.0000121369,0.05000,2.419 | |
| 24,mlp.down_proj,0.0000003998,0.05000,3.048 | |
| 25,self_attn.v_proj,0.0000035746,0.05000,5.082 | |
| 25,self_attn.k_proj,0.0000085866,0.05000,5.154 | |
| 25,self_attn.q_proj,0.0000167753,0.05000,5.200 | |
| 25,self_attn.o_proj,0.0000006733,0.05000,1.076 | |
| 25,mlp.up_proj,0.0000131685,0.05000,2.416 | |
| 25,mlp.gate_proj,0.0000198001,0.05000,2.429 | |
| 25,mlp.down_proj,0.0000007029,0.05000,3.048 | |
| 26,self_attn.v_proj,0.0000052315,0.05000,5.138 | |
| 26,self_attn.q_proj,0.0000171792,0.05000,5.155 | |
| 26,self_attn.k_proj,0.0000105835,0.05000,5.196 | |
| 26,self_attn.o_proj,0.0000003890,0.05000,1.061 | |
| 26,mlp.up_proj,0.0000142373,0.05000,2.443 | |
| 26,mlp.gate_proj,0.0000217037,0.05000,2.462 | |
| 26,mlp.down_proj,0.0000014717,0.05000,3.041 | |
| 27,self_attn.k_proj,0.0000074436,0.05000,5.060 | |
| 27,self_attn.q_proj,0.0000136104,0.05000,5.123 | |
| 27,self_attn.v_proj,0.0000038322,0.05000,5.142 | |
| 27,self_attn.o_proj,0.0000033302,0.05000,1.107 | |
| 27,mlp.up_proj,0.0000177582,0.05000,2.535 | |
| 27,mlp.gate_proj,0.0000236296,0.05000,2.561 | |
| 27,mlp.down_proj,0.0000210622,0.05000,3.164 | |