File size: 646 Bytes
a7e09b2 | 1 2 3 4 5 6 7 8 9 10 | {
"rationale": "From head_ablation.py sweep on 1000 COCO val images: 10 heads produced the largest individual F1 drops when ablated. Cumulative pruning of those 10 yields peak F1=0.9159 (vs baseline 0.8939); K=20 cumulative still ahead at F1=0.8971; K=30+ cliff-drops below 0.35. Peak pruning point is K=10.",
"peak_K": 10,
"baseline_F1": 0.8939,
"pruned_K10_F1": 0.9159,
"pruned_K20_F1": 0.8971,
"heads_pruned_K10": "top 10 of ranked_most_prunable_first from head_importance.json",
"how_to_apply": "At load time, for each (block, head) in the pruned list, zero block.attn.proj.weight[:, head*64:(head+1)*64]. See apply_mask.py."
}
|