EdgeDiffusion_r3 / pruning_config.json
ChenHe727's picture
Upload pruning_config.json with huggingface_hub
2c4c1a8 verified
{
"method": "sensitivity_threshold_auto",
"description": "7% target pruning (6.39% actual). Auto-generated via sensitivity threshold=0.0876. Attention config hardcoded (per-head). down_blocks.0 (D0) and up_blocks.3 (U3) protected for INT8.",
"total_params_M": 746.32,
"threshold": 0.0876,
"configs": {
"7%": {
"target": 0.07,
"actual": 0.0639,
"params_removed_M": 47.7,
"strategy": "sensitivity_threshold_auto",
"sensitivity_threshold": 0.0876,
"attention_config": "hardcoded_per_head",
"protected_blocks": [
"up_blocks.3",
"down_blocks.0"
],
"per_block": {
"down_blocks.0": {
"cross_attn": 0.125
},
"down_blocks.1": {
"cross_attn": 0.125
},
"down_blocks.2": {
"self_attn": 0.125,
"cross_attn": 0.25
},
"down_blocks.3": {
"resnet": 0.25
},
"up_blocks.0": {
"resnet": 0.15
},
"up_blocks.1": {
"self_attn": 0.125,
"cross_attn": 0.25
},
"up_blocks.2": {
"cross_attn": 0.125
},
"up_blocks.3": {
"cross_attn": 0.125
},
"mid_block": {
"self_attn": 0.25,
"cross_attn": 0.25,
"ffn": 0.6,
"resnet": 0.2
}
}
}
}
}