sitatech
/

VisualQuality-R1-7B-GPTQ-Int4

4-bit precision

Model card Files Files and versions

sitatech committed on Feb 6

Commit

8e94048

·

verified ·

1 Parent(s): 09a9a08

Update config.json

Files changed (1) hide show

config.json +1 -11

config.json CHANGED Viewed

@@ -21,23 +21,14 @@
     "backend": "auto",
     "batch_size": 1,
     "bits": 4,
-    "block_name_to_quantize": null,
     "cache_block_outputs": true,
     "checkpoint_format": "gptq",
     "damp_percent": 0.1,
     "dataset": "c4",
     "desc_act": false,
-    "exllama_config": {
-      "version": 1
-    },
     "group_size": 128,
     "max_input_length": null,
-    "meta": {
-      "quantizer": [
-        "optimum:2.1.0",
-        "gptqmodel:5.6.12"
-      ]
-    },
     "model_seqlen": null,
     "module_name_preceding_first_block": null,
     "modules_in_block_to_quantize": null,
@@ -47,7 +38,6 @@
     "tokenizer": null,
     "true_sequential": true,
     "use_cuda_fp16": false,
-    "use_exllama": true
   },
   "rms_norm_eps": 1e-06,
   "rope_scaling": {

     "backend": "auto",
     "batch_size": 1,
     "bits": 4,
+    "block_name_to_quantize": "model.language_model.layers",
     "cache_block_outputs": true,
     "checkpoint_format": "gptq",
     "damp_percent": 0.1,
     "dataset": "c4",
     "desc_act": false,
     "group_size": 128,
     "max_input_length": null,
     "model_seqlen": null,
     "module_name_preceding_first_block": null,
     "modules_in_block_to_quantize": null,
     "tokenizer": null,
     "true_sequential": true,
     "use_cuda_fp16": false,
   },
   "rms_norm_eps": 1e-06,
   "rope_scaling": {