MiniMax-M2.5-tiny-24e / expert_prune_plan.json
morriszjm's picture
training-free expert prune K=24/32 (PR=25%) via routing-mass calibration
51d7883 verified
{
"src_model": "morriszjm/MiniMax-M2.5-tiny",
"src_inventory": "artifacts/tiny_inventory.json",
"src_importance": "artifacts/tiny_importance.json",
"method": "routing_softmax_topk_mass + per-layer uniform top-K, drop-the-rest",
"K": 24,
"L": 8,
"E_orig": 32,
"n_dropped": 8,
"pruning_rate": 0.25,
"ep_size_check": 8,
"top_k": 8,
"kept_per_layer_old_indices": [
[
0,
1,
2,
4,
5,
6,
7,
10,
12,
13,
14,
15,
17,
18,
19,
20,
21,
22,
23,
25,
26,
27,
30,
31
],
[
0,
1,
2,
3,
4,
6,
7,
8,
9,
11,
12,
13,
14,
16,
17,
18,
19,
23,
24,
27,
28,
29,
30,
31
],
[
0,
1,
2,
3,
4,
6,
7,
8,
9,
10,
12,
14,
16,
17,
19,
20,
22,
23,
24,
26,
27,
28,
29,
30
],
[
0,
2,
3,
5,
6,
7,
8,
9,
11,
15,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30
],
[
0,
1,
2,
3,
4,
5,
7,
8,
9,
10,
12,
14,
16,
17,
18,
21,
22,
23,
24,
25,
26,
27,
28,
30
],
[
1,
2,
3,
7,
8,
10,
11,
12,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
26,
28,
29,
30,
31
],
[
0,
1,
2,
4,
5,
6,
7,
8,
9,
10,
12,
16,
17,
19,
21,
22,
23,
25,
26,
27,
28,
29,
30,
31
],
[
0,
1,
3,
6,
7,
9,
10,
11,
12,
13,
14,
15,
16,
17,
19,
22,
24,
25,
26,
27,
28,
29,
30,
31
]
],
"kept_score_min_per_layer": [
5.091672860085964,
14.596360385417938,
33.47318064421415,
8.822094783186913,
12.742229215800762,
19.971908435225487,
0.0,
5.011361248791218
],
"drop_score_max_per_layer": [
4.3719402849674225,
14.47503225505352,
30.457208454608917,
8.272616788744926,
11.775540083646774,
15.646341614425182,
0.0,
4.902323044836521
],
"kept_dropped_score_gap_per_layer": [
0.7197325751185417,
0.12132813036441803,
3.015972189605236,
0.5494779944419861,
0.9666891321539879,
4.325566820800304,
0.0,
0.10903820395469666
],
"calibration_meta": {
"n_prompts_used": 64,
"tokens_per_layer": 1851,
"tokens_per_bucket": {
"ai4code": 1008,
"general_en": 416,
"reasoning": 257,
"multilingual": 170
}
}
}