| layer,module,loss,samples,damp,time | |
| 0,mlp.shared_expert_gate,0.0000000001,0.05000,0.499 | |
| 0,linear_attn.conv1d,fallback(rtn): 0.0025482,0.00000,0.027 | |
| 0,linear_attn.in_proj_b,0.0000000155,0.05000,0.618 | |
| 0,linear_attn.in_proj_a,0.0000000626,0.05000,0.624 | |
| 1,mlp.shared_expert_gate,0.0000000002,0.05000,0.226 | |
| 1,linear_attn.conv1d,fallback(rtn): 0.0029144,0.00000,0.003 | |
| 1,linear_attn.in_proj_a,0.0000000509,0.05000,0.404 | |
| 1,linear_attn.in_proj_b,0.0000000246,0.05000,0.410 | |
| 2,mlp.shared_expert_gate,0.0000000002,0.05000,0.226 | |
| 2,linear_attn.conv1d,fallback(rtn): 0.0023651,0.00000,0.002 | |
| 2,linear_attn.in_proj_a,0.0000000371,0.05000,0.392 | |
| 2,linear_attn.in_proj_b,0.0000000259,0.05000,0.393 | |
| 3,mlp.shared_expert_gate,0.0000000002,0.05000,0.228 | |
| 4,mlp.shared_expert_gate,0.0000000003,0.05000,0.228 | |
| 4,linear_attn.conv1d,fallback(rtn): 0.0034332,0.00000,0.002 | |
| 4,linear_attn.in_proj_b,0.0000000275,0.05000,0.589 | |
| 4,linear_attn.in_proj_a,0.0000000457,0.05000,0.592 | |
| 5,mlp.shared_expert_gate,0.0000000004,0.05000,0.230 | |
| 5,linear_attn.conv1d,fallback(rtn): 0.0032959,0.00000,0.002 | |
| 5,linear_attn.in_proj_a,0.0000000540,0.05000,0.592 | |
| 5,linear_attn.in_proj_b,0.0000000330,0.05000,0.597 | |
| 6,mlp.shared_expert_gate,0.0000000004,0.05000,0.228 | |
| 6,linear_attn.conv1d,fallback(rtn): 0.0032501,0.00000,0.006 | |
| 6,linear_attn.in_proj_b,0.0000000372,0.05000,0.587 | |
| 6,linear_attn.in_proj_a,0.0000000537,0.05000,0.592 | |
| 7,mlp.shared_expert_gate,0.0000000004,0.05000,0.226 | |
| 8,mlp.shared_expert_gate,0.0000000004,0.05000,0.226 | |
| 8,linear_attn.conv1d,fallback(rtn): 0.0051270,0.00000,0.003 | |
| 8,linear_attn.in_proj_b,0.0000000398,0.05000,0.592 | |
| 8,linear_attn.in_proj_a,0.0000000837,0.05000,0.596 | |
| 9,mlp.shared_expert_gate,0.0000000003,0.05000,0.226 | |
| 9,linear_attn.conv1d,fallback(rtn): 0.0042419,0.00000,0.003 | |
| 9,linear_attn.in_proj_a,0.0000000661,0.05000,0.592 | |
| 9,linear_attn.in_proj_b,0.0000000469,0.05000,0.598 | |
| 10,mlp.shared_expert_gate,0.0000000002,0.05000,0.227 | |
| 10,linear_attn.conv1d,fallback(rtn): 0.0034790,0.00000,0.007 | |
| 10,linear_attn.in_proj_a,0.0000000523,0.05000,0.392 | |
| 10,linear_attn.in_proj_b,0.0000000358,0.05000,0.395 | |
| 11,mlp.shared_expert_gate,0.0000000003,0.05000,0.226 | |
| 12,mlp.shared_expert_gate,0.0000000004,0.05000,0.227 | |
| 12,linear_attn.conv1d,fallback(rtn): 0.0037537,0.00000,0.004 | |
| 12,linear_attn.in_proj_a,0.0000000525,0.05000,0.467 | |
| 12,linear_attn.in_proj_b,0.0000000359,0.05000,0.473 | |
| 13,mlp.shared_expert_gate,0.0000000004,0.05000,0.227 | |
| 13,linear_attn.conv1d,fallback(rtn): 0.0045166,0.00000,0.003 | |
| 13,linear_attn.in_proj_a,0.0000000676,0.05000,0.429 | |
| 13,linear_attn.in_proj_b,0.0000000426,0.05000,0.433 | |
| 14,mlp.shared_expert_gate,0.0000000004,0.05000,0.227 | |
| 14,linear_attn.conv1d,fallback(rtn): 0.0046387,0.00000,0.003 | |
| 14,linear_attn.in_proj_a,0.0000000660,0.05000,0.428 | |
| 14,linear_attn.in_proj_b,0.0000000472,0.05000,0.438 | |
| 15,mlp.shared_expert_gate,0.0000000005,0.05000,0.226 | |
| 16,mlp.shared_expert_gate,0.0000000005,0.05000,0.227 | |
| 16,linear_attn.conv1d,fallback(rtn): 0.0041809,0.00000,0.011 | |
| 16,linear_attn.in_proj_a,0.0000000582,0.05000,0.631 | |
| 16,linear_attn.in_proj_b,0.0000000415,0.05000,0.630 | |
| 17,mlp.shared_expert_gate,0.0000000005,0.05000,0.228 | |
| 17,linear_attn.conv1d,fallback(rtn): 0.0041809,0.00000,0.002 | |
| 17,linear_attn.in_proj_b,0.0000000446,0.05000,0.462 | |
| 17,linear_attn.in_proj_a,0.0000000589,0.05000,0.468 | |
| 18,mlp.shared_expert_gate,0.0000000004,0.05000,0.229 | |
| 18,linear_attn.conv1d,fallback(rtn): 0.0042725,0.00000,0.005 | |
| 18,linear_attn.in_proj_b,0.0000000463,0.05000,0.451 | |
| 18,linear_attn.in_proj_a,0.0000000575,0.05000,0.452 | |
| 19,mlp.shared_expert_gate,0.0000000005,0.05000,0.229 | |
| 20,mlp.shared_expert_gate,0.0000000006,0.05000,0.227 | |
| 20,linear_attn.conv1d,fallback(rtn): 0.0056458,0.00000,0.004 | |
| 20,linear_attn.in_proj_a,0.0000000815,0.05000,0.609 | |
| 20,linear_attn.in_proj_b,0.0000000489,0.05000,0.614 | |
| 21,mlp.shared_expert_gate,0.0000000005,0.05000,0.227 | |
| 21,linear_attn.conv1d,fallback(rtn): 0.0043335,0.00000,0.002 | |
| 21,linear_attn.in_proj_b,0.0000000441,0.05000,0.606 | |
| 21,linear_attn.in_proj_a,0.0000000643,0.05000,0.613 | |
| 22,mlp.shared_expert_gate,0.0000000003,0.05000,0.228 | |
| 22,linear_attn.conv1d,fallback(rtn): 0.0036469,0.00000,0.011 | |
| 22,linear_attn.in_proj_a,0.0000000598,0.05000,0.407 | |
| 22,linear_attn.in_proj_b,0.0000000453,0.05000,0.406 | |
| 23,mlp.shared_expert_gate,0.0000000004,0.05000,0.230 | |
| 24,mlp.shared_expert_gate,0.0000000006,0.05000,0.227 | |
| 24,linear_attn.conv1d,fallback(rtn): 0.0038605,0.00000,0.006 | |
| 24,linear_attn.in_proj_b,0.0000000423,0.05000,0.613 | |
| 24,linear_attn.in_proj_a,0.0000000583,0.05000,0.620 | |
| 25,mlp.shared_expert_gate,0.0000000005,0.05000,0.228 | |
| 25,linear_attn.conv1d,fallback(rtn): 0.0043945,0.00000,0.006 | |
| 25,linear_attn.in_proj_a,0.0000000718,0.05000,0.611 | |
| 25,linear_attn.in_proj_b,0.0000000451,0.05000,0.617 | |
| 26,mlp.shared_expert_gate,0.0000000004,0.05000,0.230 | |
| 26,linear_attn.conv1d,fallback(rtn): 0.0047913,0.00000,0.011 | |
| 26,linear_attn.in_proj_a,0.0000000673,0.05000,0.440 | |
| 26,linear_attn.in_proj_b,0.0000000510,0.05000,0.446 | |
| 27,mlp.shared_expert_gate,0.0000000005,0.05000,0.227 | |
| 28,mlp.shared_expert_gate,0.0000000005,0.05000,0.227 | |
| 28,linear_attn.conv1d,fallback(rtn): 0.0040283,0.00000,0.005 | |
| 28,linear_attn.in_proj_a,0.0000000644,0.05000,0.400 | |
| 28,linear_attn.in_proj_b,0.0000000472,0.05000,0.403 | |
| 29,mlp.shared_expert_gate,0.0000000005,0.05000,0.226 | |
| 29,linear_attn.conv1d,fallback(rtn): 0.0042725,0.00000,0.010 | |
| 29,linear_attn.in_proj_b,0.0000000466,0.05000,0.440 | |
| 29,linear_attn.in_proj_a,0.0000000594,0.05000,0.447 | |
| 30,mlp.shared_expert_gate,0.0000000005,0.05000,0.226 | |
| 30,linear_attn.conv1d,fallback(rtn): 0.0045471,0.00000,0.002 | |
| 30,linear_attn.in_proj_a,0.0000000686,0.05000,0.610 | |
| 30,linear_attn.in_proj_b,0.0000000572,0.05000,0.618 | |
| 31,mlp.shared_expert_gate,0.0000000005,0.05000,0.225 | |
| 32,mlp.shared_expert_gate,0.0000000004,0.05000,0.228 | |
| 32,linear_attn.conv1d,fallback(rtn): 0.0040588,0.00000,0.011 | |
| 32,linear_attn.in_proj_b,0.0000000539,0.05000,0.606 | |
| 32,linear_attn.in_proj_a,0.0000000782,0.05000,0.616 | |
| 33,mlp.shared_expert_gate,0.0000000004,0.05000,0.227 | |
| 33,linear_attn.conv1d,fallback(rtn): 0.0041504,0.00000,0.006 | |
| 33,linear_attn.in_proj_a,0.0000000806,0.05000,0.615 | |
| 33,linear_attn.in_proj_b,0.0000000507,0.05000,0.621 | |
| 34,mlp.shared_expert_gate,0.0000000004,0.05000,0.228 | |
| 34,linear_attn.conv1d,fallback(rtn): 0.0044861,0.00000,0.005 | |
| 34,linear_attn.in_proj_b,0.0000000513,0.05000,0.620 | |
| 34,linear_attn.in_proj_a,0.0000000973,0.05000,0.628 | |
| 35,mlp.shared_expert_gate,0.0000000004,0.05000,0.225 | |
| 36,mlp.shared_expert_gate,0.0000000003,0.05000,0.228 | |
| 36,linear_attn.conv1d,fallback(rtn): 0.0070496,0.00000,0.003 | |
| 36,linear_attn.in_proj_b,0.0000000560,0.05000,0.618 | |
| 36,linear_attn.in_proj_a,0.0000001325,0.05000,0.622 | |
| 37,mlp.shared_expert_gate,0.0000000003,0.05000,0.227 | |
| 37,linear_attn.conv1d,fallback(rtn): 0.0072632,0.00000,0.004 | |
| 37,linear_attn.in_proj_a,0.0000001435,0.05000,0.431 | |
| 37,linear_attn.in_proj_b,0.0000000616,0.05000,0.438 | |
| 38,mlp.shared_expert_gate,0.0000000002,0.05000,0.226 | |
| 38,linear_attn.conv1d,fallback(rtn): 0.0062561,0.00000,0.003 | |
| 38,linear_attn.in_proj_b,0.0000000656,0.05000,0.398 | |
| 38,linear_attn.in_proj_a,0.0000001249,0.05000,0.403 | |
| 39,mlp.shared_expert_gate,0.0000000002,0.05000,0.231 | |