File size: 1,320 Bytes
2c4c1a8 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 | {
"method": "sensitivity_threshold_auto",
"description": "7% target pruning (6.39% actual). Auto-generated via sensitivity threshold=0.0876. Attention hardcoded (per-head). down_blocks.0 and up_blocks.3 (D0/U3) protected for INT8.",
"total_params_M": 746.32,
"threshold": 0.0876,
"configs": {
"7%": {
"target": 0.07,
"actual": 0.0639,
"params_removed_M": 47.7,
"strategy": "sensitivity_threshold_auto",
"sensitivity_threshold": 0.0876,
"attention_config": "hardcoded_per_head",
"protected_blocks": [
"up_blocks.3",
"down_blocks.0"
],
"per_block": {
"down_blocks.0": {
"cross_attn": 0.125
},
"down_blocks.1": {
"cross_attn": 0.125
},
"down_blocks.2": {
"self_attn": 0.125,
"cross_attn": 0.25
},
"down_blocks.3": {
"resnet": 0.25
},
"up_blocks.0": {
"resnet": 0.15
},
"up_blocks.1": {
"self_attn": 0.125,
"cross_attn": 0.25
},
"up_blocks.2": {
"cross_attn": 0.125
},
"up_blocks.3": {
"cross_attn": 0.125
},
"mid_block": {
"self_attn": 0.25,
"cross_attn": 0.25,
"ffn": 0.6,
"resnet": 0.2
}
}
}
}
} |