YiYiXu HF Staff committed on
Commit
4124d91
·
verified ·
1 Parent(s): 0e07219

Update mellon_pipeline_config.json

Browse files
Files changed (1) hide show
  1. mellon_pipeline_config.json +45 -16
mellon_pipeline_config.json CHANGED
@@ -17,53 +17,82 @@
17
  "label": "Quant Type",
18
  "type": "string",
19
  "options": [
20
- "bnb_4bit"
 
21
  ],
22
- "value": "bnb_4bit"
 
 
 
 
 
 
 
 
 
 
 
23
  },
24
  "bnb_4bit_quant_type": {
25
- "label": "Bnb 4Bit Quant Type",
26
  "type": "string",
27
  "options": [
28
- "nf4"
 
29
  ],
30
  "value": "nf4"
31
  },
32
  "bnb_4bit_compute_dtype": {
33
- "label": "Bnb 4Bit Compute Dtype",
34
  "type": "string",
35
  "options": [
36
- ""
 
 
 
37
  ],
38
  "value": ""
39
  },
40
  "bnb_4bit_use_double_quant": {
41
- "label": "Bnb 4Bit Use Double Quant",
42
  "type": "boolean",
43
  "default": false
44
  },
45
  "llm_int8_threshold": {
46
- "label": "Llm Int8 Threshold",
47
  "type": "float",
48
  "display": "slider",
49
  "default": 6.0,
50
- "min": 6.0,
51
- "max": 6.0,
52
- "step": 0.01
53
  },
54
  "llm_int8_has_fp16_weight": {
55
- "label": "Llm Int8 Has Fp16 Weight",
56
  "type": "boolean",
57
  "default": false
58
  },
59
  "llm_int8_skip_modules": {
60
- "label": "Llm Int8 Skip Modules",
61
- "type": "custom",
62
- "display": "input"
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  },
64
  "quantization_config": {
65
  "label": "Quantization Config",
66
- "type": "custom",
67
  "display": "output"
68
  },
69
  "doc": {
 
17
  "label": "Quant Type",
18
  "type": "string",
19
  "options": [
20
+ "bnb_4bit",
21
+ "bnb_8bit"
22
  ],
23
+ "value": "bnb_4bit",
24
+ "onChange": {
25
+ "bnb_4bit": [
26
+ "bnb_4bit_quant_type",
27
+ "bnb_4bit_compute_dtype",
28
+ "bnb_4bit_use_double_quant"
29
+ ],
30
+ "bnb_8bit": [
31
+ "llm_int8_threshold",
32
+ "llm_int8_has_fp16_weight"
33
+ ]
34
+ }
35
  },
36
  "bnb_4bit_quant_type": {
37
+ "label": "4-bit Quant Type",
38
  "type": "string",
39
  "options": [
40
+ "nf4",
41
+ "fp4"
42
  ],
43
  "value": "nf4"
44
  },
45
  "bnb_4bit_compute_dtype": {
46
+ "label": "Compute Dtype",
47
  "type": "string",
48
  "options": [
49
+ "",
50
+ "float32",
51
+ "float16",
52
+ "bfloat16"
53
  ],
54
  "value": ""
55
  },
56
  "bnb_4bit_use_double_quant": {
57
+ "label": "Double Quant",
58
  "type": "boolean",
59
  "default": false
60
  },
61
  "llm_int8_threshold": {
62
+ "label": "Int8 Threshold",
63
  "type": "float",
64
  "display": "slider",
65
  "default": 6.0,
66
+ "min": 0.0,
67
+ "max": 10.0,
68
+ "step": 0.5
69
  },
70
  "llm_int8_has_fp16_weight": {
71
+ "label": "Has FP16 Weight",
72
  "type": "boolean",
73
  "default": false
74
  },
75
  "llm_int8_skip_modules": {
76
+ "label": "Skip Modules",
77
+ "type": "string",
78
+ "display": "select",
79
+ "options": [
80
+ "transformer_blocks.0.img_mod",
81
+ "transformer_blocks.33.img_mod",
82
+ "transformer_blocks.58.attn.to_k",
83
+ "transformer_blocks.59.attn.to_out",
84
+ "time_text_embed",
85
+ "img_in",
86
+ "txt_in"
87
+ ],
88
+ "fieldOptions": {
89
+ "multiple": true
90
+ },
91
+ "value": []
92
  },
93
  "quantization_config": {
94
  "label": "Quantization Config",
95
+ "type": "quant_config",
96
  "display": "output"
97
  },
98
  "doc": {