Update config.json

Remove "scale_dtype" and "zp_dtype" from config.json. These fields are not currently supported in vLLM, and there is an open issue tracking this:
https://github.com/vllm-project/llm-compressor/issues/2057

Files changed (1) hide show

config.json +2 -6

config.json CHANGED Viewed

@@ -62,11 +62,9 @@
           "num_bits": 4,
           "observer": "static_minmax",
           "observer_kwargs": {},
-          "scale_dtype": "torch.float8_e4m3fn",
           "strategy": "tensor_group",
           "symmetric": true,
-          "type": "float",
-          "zp_dtype": null
         },
         "output_activations": null,
         "targets": [
@@ -80,11 +78,9 @@
           "num_bits": 4,
           "observer": "static_minmax",
           "observer_kwargs": {},
-          "scale_dtype": "torch.float8_e4m3fn",
           "strategy": "tensor_group",
           "symmetric": true,
-          "type": "float",
-          "zp_dtype": null
         }
       }
     },

           "num_bits": 4,
           "observer": "static_minmax",
           "observer_kwargs": {},
           "strategy": "tensor_group",
           "symmetric": true,
+          "type": "float"
         },
         "output_activations": null,
         "targets": [
           "num_bits": 4,
           "observer": "static_minmax",
           "observer_kwargs": {},
           "strategy": "tensor_group",
           "symmetric": true,
+          "type": "float"
         }
       }
     },