Update README.md
Browse files
README.md
CHANGED
|
@@ -68,7 +68,7 @@ This model was created with [llm-compressor](https://github.com/vllm-project/llm
|
|
| 68 |
|
| 69 |
|
| 70 |
```bash
|
| 71 |
-
python quantize.py --model_path ibm-granite/granite-3.1-8b-instruct --quant_path "output_dir/granite-3.1-8b-instruct-quantized.w8a8" --calib_size 3072 --dampening_frac 0.1 --observer mse
|
| 72 |
```
|
| 73 |
|
| 74 |
|
|
@@ -137,7 +137,6 @@ recipe = [
|
|
| 137 |
scheme="W8A8",
|
| 138 |
dampening_frac=args.dampening_frac,
|
| 139 |
observer=args.observer,
|
| 140 |
-
actorder=args.actorder,
|
| 141 |
)
|
| 142 |
]
|
| 143 |
oneshot(
|
|
|
|
| 68 |
|
| 69 |
|
| 70 |
```bash
|
| 71 |
+
python quantize.py --model_path ibm-granite/granite-3.1-8b-instruct --quant_path "output_dir/granite-3.1-8b-instruct-quantized.w8a8" --calib_size 3072 --dampening_frac 0.1 --observer mse
|
| 72 |
```
|
| 73 |
|
| 74 |
|
|
|
|
| 137 |
scheme="W8A8",
|
| 138 |
dampening_frac=args.dampening_frac,
|
| 139 |
observer=args.observer,
|
|
|
|
| 140 |
)
|
| 141 |
]
|
| 142 |
oneshot(
|