{ "method": "sensitivity_threshold_auto", "description": "7% target pruning (actual 7.53%). Auto-generated via sensitivity threshold=0.0864. Attention config hardcoded (per-head). down_blocks.0 and up_blocks.3 (D0/U3) protected for INT8.", "total_params_M": 809.45, "threshold": 0.0864, "configs": { "7%": { "target": 0.07, "actual": 0.0753, "params_removed_M": 61.0, "strategy": "sensitivity_threshold_auto", "sensitivity_threshold": 0.0864, "attention_config": "hardcoded_per_head", "protected_blocks": [ "up_blocks.3", "down_blocks.0" ], "per_block": { "down_blocks.0": { "cross_attn": 0.125 }, "down_blocks.1": { "cross_attn": 0.125 }, "down_blocks.2": { "self_attn": 0.125, "cross_attn": 0.25 }, "down_blocks.3": { "resnet": 0.3 }, "up_blocks.0": { "resnet": 0.1 }, "up_blocks.1": { "self_attn": 0.125, "cross_attn": 0.25 }, "up_blocks.2": { "cross_attn": 0.125 }, "up_blocks.3": { "cross_attn": 0.125 }, "mid_block": { "self_attn": 0.25, "cross_attn": 0.25, "ffn": 0.6, "resnet": 0.25 } } } } }