kaitchup
/

Qwen2.5-7B-Instruct-gptqmodel-2bit

Text Generation

text-generation-inference

Model card Files and versions

bnjmnmarie committed on Feb 4, 2025

Commit

b6cf883

·

verified ·

1 Parent(s): c519ad0

Update config.json

Files changed (1) hide show

config.json +20 -0

config.json CHANGED Viewed

@@ -3,6 +3,26 @@
   "architectures": [
     "Qwen2ForCausalLM"
   ],
   "attention_dropout": 0.0,
   "bos_token_id": 151643,
   "eos_token_id": 151645,

   "architectures": [
     "Qwen2ForCausalLM"
   ],
+  "quantization_config": {
+    "bits": 2,
+    "dynamic": null,
+    "group_size": 128,
+    "desc_act": true,
+    "sym": true,
+    "lm_head": false,
+    "quant_method": "gptq",
+    "checkpoint_format": "gptq",
+    "meta": {
+      "quantizer": [
+        "gptqmodel:1.7.4"
+      ],
+      "uri": "https://github.com/modelcloud/gptqmodel",
+      "damp_percent": 0.01,
+      "damp_auto_increment": 0.0025,
+      "static_groups": false,
+      "true_sequential": true
+    }
+  },
   "attention_dropout": 0.0,
   "bos_token_id": 151643,
   "eos_token_id": 151645,