EXAONE-4.0-1.2B-GPTQ / recipe.yaml
MangoLab's picture
Add GPTQ-quantized EXAONE-4.0-1.2B
68933f7
raw
history blame contribute delete
238 Bytes
# Quantization recipe: a single stage holding one GPTQ modifier.
# Nesting is stage -> modifiers -> modifier name -> modifier arguments.
default_stage:
  default_modifiers:
    GPTQModifier:
      # Module types selected for quantization.
      targets: [Linear]
      # Modules excluded from quantization, matched by name.
      ignore: [embed_tokens, lm_head]
      # Preset scheme name; presumably 4-bit weights with 16-bit
      # activations -- confirm against the quantization library's presets.
      scheme: W4A16
      # GPTQ solver settings. NOTE(review): exact semantics are defined by
      # the GPTQModifier implementation, not by this file -- verify there
      # before changing any of these values.
      block_size: 128
      dampening_frac: 0.01
      actorder: static
      offload_hessians: false