ChenHe727 commited on
Commit
79a75e0
·
verified ·
1 Parent(s): 2d635d9

Upload pruning_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. pruning_config.json +51 -0
pruning_config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "method": "sensitivity_threshold_auto",
3
+ "description": "7% pruning. Auto-generated via sensitivity threshold=0.0674. Attention hardcoded (per-head). D0/U3 protected for INT8.",
4
+ "total_params_M": 858.49,
5
+ "threshold": 0.0674,
6
+ "configs": {
7
+ "7%": {
8
+ "target": 0.07,
9
+ "actual": 0.07,
10
+ "params_removed_M": 60.1,
11
+ "strategy": "sensitivity_threshold_auto",
12
+ "sensitivity_threshold": 0.0674,
13
+ "attention_config": "hardcoded_per_head",
14
+ "protected_blocks": [
15
+ "down_blocks.0",
16
+ "up_blocks.3"
17
+ ],
18
+ "per_block": {
19
+ "down_blocks.0": {
20
+ "cross_attn": 0.125
21
+ },
22
+ "down_blocks.1": {
23
+ "cross_attn": 0.125
24
+ },
25
+ "down_blocks.2": {
26
+ "self_attn": 0.125,
27
+ "cross_attn": 0.25
28
+ },
29
+ "down_blocks.3": {
30
+ "resnet": 0.25
31
+ },
32
+ "mid_block": {
33
+ "resnet": 0.2,
34
+ "self_attn": 0.25,
35
+ "cross_attn": 0.25,
36
+ "ffn": 0.35
37
+ },
38
+ "up_blocks.1": {
39
+ "self_attn": 0.125,
40
+ "cross_attn": 0.25
41
+ },
42
+ "up_blocks.2": {
43
+ "cross_attn": 0.125
44
+ },
45
+ "up_blocks.3": {
46
+ "cross_attn": 0.125
47
+ }
48
+ }
49
+ }
50
+ }
51
+ }