{ "model.layers.1.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 154, "reason": "mean activation magnitude=0.5228", "mean_activation_magnitude": 0.522780179977417 }, "model.layers.2.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 97, "reason": "mean activation magnitude=0.7987", "mean_activation_magnitude": 0.7986612915992737 }, "model.layers.3.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 213, "reason": "mean activation magnitude=1.4180", "mean_activation_magnitude": 1.41801917552948 }, "model.layers.4.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 226, "reason": "mean activation magnitude=1.9387", "mean_activation_magnitude": 1.9387125968933105 }, "model.layers.5.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 8, "reason": "mean activation magnitude=2.6871", "mean_activation_magnitude": 2.687067747116089 }, "model.layers.6.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 7, "reason": "mean activation magnitude=4.3966", "mean_activation_magnitude": 4.396553039550781 }, "model.layers.7.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 15, "reason": "mean activation magnitude=5.1095", "mean_activation_magnitude": 5.109454154968262 }, "model.layers.8.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 29, "reason": "mean activation magnitude=6.9894", "mean_activation_magnitude": 6.989428997039795 }, "model.layers.9.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 169, "reason": "mean activation magnitude=5.9495", "mean_activation_magnitude": 5.949464321136475 }, "model.layers.10.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 175, "reason": "mean activation magnitude=8.8505", "mean_activation_magnitude": 8.850502014160156 }, "model.layers.11.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 55, "reason": "mean activation magnitude=9.3091", "mean_activation_magnitude": 9.309072494506836 }, "model.layers.12.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 154, "reason": "mean activation magnitude=14.2129", "mean_activation_magnitude": 14.212921142578125 }, "model.layers.13.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 245, "reason": "mean activation magnitude=8.2107", "mean_activation_magnitude": 8.210664749145508 }, "model.layers.14.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 55, "reason": "mean activation magnitude=18.4452", "mean_activation_magnitude": 18.445188522338867 }, "model.layers.15.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 4, "reason": "mean activation magnitude=18.9182", "mean_activation_magnitude": 18.91815948486328 }, "model.layers.16.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 115, "reason": "mean activation magnitude=0.0000", "mean_activation_magnitude": 0.0 }, "model.layers.17.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 200, "reason": "mean activation magnitude=13.2505", "mean_activation_magnitude": 13.250476837158203 }, "model.layers.18.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 168, "reason": "mean activation magnitude=12.8750", "mean_activation_magnitude": 12.874970436096191 }, "model.layers.19.mlp": { "method": "activation_magnitude", "merge": "replace", "target_expert_idx": 142, "reason": "mean activation magnitude=0.0000", "mean_activation_magnitude": 0.0 } }