Update mellon_pipeline_config.json
Browse files- mellon_pipeline_config.json +45 -16
mellon_pipeline_config.json
CHANGED
|
@@ -17,53 +17,82 @@
|
|
| 17 |
"label": "Quant Type",
|
| 18 |
"type": "string",
|
| 19 |
"options": [
|
| 20 |
-
"bnb_4bit"
|
|
|
|
| 21 |
],
|
| 22 |
-
"value": "bnb_4bit"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 23 |
},
|
| 24 |
"bnb_4bit_quant_type": {
|
| 25 |
-
"label": "
|
| 26 |
"type": "string",
|
| 27 |
"options": [
|
| 28 |
-
"nf4"
|
|
|
|
| 29 |
],
|
| 30 |
"value": "nf4"
|
| 31 |
},
|
| 32 |
"bnb_4bit_compute_dtype": {
|
| 33 |
-
"label": "
|
| 34 |
"type": "string",
|
| 35 |
"options": [
|
| 36 |
-
""
|
|
|
|
|
|
|
|
|
|
| 37 |
],
|
| 38 |
"value": ""
|
| 39 |
},
|
| 40 |
"bnb_4bit_use_double_quant": {
|
| 41 |
-
"label": "
|
| 42 |
"type": "boolean",
|
| 43 |
"default": false
|
| 44 |
},
|
| 45 |
"llm_int8_threshold": {
|
| 46 |
-
"label": "
|
| 47 |
"type": "float",
|
| 48 |
"display": "slider",
|
| 49 |
"default": 6.0,
|
| 50 |
-
"min":
|
| 51 |
-
"max":
|
| 52 |
-
"step": 0.
|
| 53 |
},
|
| 54 |
"llm_int8_has_fp16_weight": {
|
| 55 |
-
"label": "
|
| 56 |
"type": "boolean",
|
| 57 |
"default": false
|
| 58 |
},
|
| 59 |
"llm_int8_skip_modules": {
|
| 60 |
-
"label": "
|
| 61 |
-
"type": "
|
| 62 |
-
"display": "
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 63 |
},
|
| 64 |
"quantization_config": {
|
| 65 |
"label": "Quantization Config",
|
| 66 |
-
"type": "
|
| 67 |
"display": "output"
|
| 68 |
},
|
| 69 |
"doc": {
|
|
|
|
| 17 |
"label": "Quant Type",
|
| 18 |
"type": "string",
|
| 19 |
"options": [
|
| 20 |
+
"bnb_4bit",
|
| 21 |
+
"bnb_8bit"
|
| 22 |
],
|
| 23 |
+
"value": "bnb_4bit",
|
| 24 |
+
"onChange": {
|
| 25 |
+
"bnb_4bit": [
|
| 26 |
+
"bnb_4bit_quant_type",
|
| 27 |
+
"bnb_4bit_compute_dtype",
|
| 28 |
+
"bnb_4bit_use_double_quant"
|
| 29 |
+
],
|
| 30 |
+
"bnb_8bit": [
|
| 31 |
+
"llm_int8_threshold",
|
| 32 |
+
"llm_int8_has_fp16_weight"
|
| 33 |
+
]
|
| 34 |
+
}
|
| 35 |
},
|
| 36 |
"bnb_4bit_quant_type": {
|
| 37 |
+
"label": "4-bit Quant Type",
|
| 38 |
"type": "string",
|
| 39 |
"options": [
|
| 40 |
+
"nf4",
|
| 41 |
+
"fp4"
|
| 42 |
],
|
| 43 |
"value": "nf4"
|
| 44 |
},
|
| 45 |
"bnb_4bit_compute_dtype": {
|
| 46 |
+
"label": "Compute Dtype",
|
| 47 |
"type": "string",
|
| 48 |
"options": [
|
| 49 |
+
"",
|
| 50 |
+
"float32",
|
| 51 |
+
"float16",
|
| 52 |
+
"bfloat16"
|
| 53 |
],
|
| 54 |
"value": ""
|
| 55 |
},
|
| 56 |
"bnb_4bit_use_double_quant": {
|
| 57 |
+
"label": "Double Quant",
|
| 58 |
"type": "boolean",
|
| 59 |
"default": false
|
| 60 |
},
|
| 61 |
"llm_int8_threshold": {
|
| 62 |
+
"label": "Int8 Threshold",
|
| 63 |
"type": "float",
|
| 64 |
"display": "slider",
|
| 65 |
"default": 6.0,
|
| 66 |
+
"min": 0.0,
|
| 67 |
+
"max": 10.0,
|
| 68 |
+
"step": 0.5
|
| 69 |
},
|
| 70 |
"llm_int8_has_fp16_weight": {
|
| 71 |
+
"label": "Has FP16 Weight",
|
| 72 |
"type": "boolean",
|
| 73 |
"default": false
|
| 74 |
},
|
| 75 |
"llm_int8_skip_modules": {
|
| 76 |
+
"label": "Skip Modules",
|
| 77 |
+
"type": "string",
|
| 78 |
+
"display": "select",
|
| 79 |
+
"options": [
|
| 80 |
+
"transformer_blocks.0.img_mod",
|
| 81 |
+
"transformer_blocks.33.img_mod",
|
| 82 |
+
"transformer_blocks.58.attn.to_k",
|
| 83 |
+
"transformer_blocks.59.attn.to_out",
|
| 84 |
+
"time_text_embed",
|
| 85 |
+
"img_in",
|
| 86 |
+
"txt_in"
|
| 87 |
+
],
|
| 88 |
+
"fieldOptions": {
|
| 89 |
+
"multiple": true
|
| 90 |
+
},
|
| 91 |
+
"value": []
|
| 92 |
},
|
| 93 |
"quantization_config": {
|
| 94 |
"label": "Quantization Config",
|
| 95 |
+
"type": "quant_config",
|
| 96 |
"display": "output"
|
| 97 |
},
|
| 98 |
"doc": {
|