{
"method": "sensitivity_threshold_auto",
"description": "7% pruning. Auto-generated via sensitivity threshold=0.1328. Attention hardcoded (per-head). D0/U3 protected for INT8.",
"total_params_M": 695.07,
"threshold": 0.1328,
"configs": {
"7%": {
"target": 0.07,
"actual": 0.0655,
"params_removed_M": 45.5,
"strategy": "sensitivity_threshold_auto",
"sensitivity_threshold": 0.1328,
"attention_config": "hardcoded_per_head",
"protected_blocks": [
"up_blocks.3",
"down_blocks.0"
],
"per_block": {
"down_blocks.0": {
"cross_attn": 0.125
},
"down_blocks.1": {
"cross_attn": 0.125
},
"down_blocks.2": {
"self_attn": 0.125,
"cross_attn": 0.125,
"ffn": 0.05
},
"down_blocks.3": {
"resnet": 0.35
},
"up_blocks.0": {
"resnet": 0.15
},
"up_blocks.1": {
"self_attn": 0.125,
"cross_attn": 0.125
},
"up_blocks.2": {
"cross_attn": 0.125
},
"up_blocks.3": {
"cross_attn": 0.125
},
"mid_block": {
"self_attn": 0.125,
"cross_attn": 0.125,
"ffn": 0.6,
"resnet": 0.4
}
}
}
}
}