{ "method": "sensitivity_threshold_auto", "description": "7% target pruning (actual 6.39%). Auto-generated via sensitivity threshold=0.0876. Attention hardcoded (per-head). down_blocks.0/up_blocks.3 (D0/U3) protected for INT8.", "total_params_M": 746.32, "threshold": 0.0876, "configs": { "7%": { "target": 0.07, "actual": 0.0639, "params_removed_M": 47.7, "strategy": "sensitivity_threshold_auto", "sensitivity_threshold": 0.0876, "attention_config": "hardcoded_per_head", "protected_blocks": [ "up_blocks.3", "down_blocks.0" ], "per_block": { "down_blocks.0": { "cross_attn": 0.125 }, "down_blocks.1": { "cross_attn": 0.125 }, "down_blocks.2": { "self_attn": 0.125, "cross_attn": 0.25 }, "down_blocks.3": { "resnet": 0.25 }, "up_blocks.0": { "resnet": 0.15 }, "up_blocks.1": { "self_attn": 0.125, "cross_attn": 0.25 }, "up_blocks.2": { "cross_attn": 0.125 }, "up_blocks.3": { "cross_attn": 0.125 }, "mid_block": { "self_attn": 0.25, "cross_attn": 0.25, "ffn": 0.6, "resnet": 0.2 } } } } }