my-quant-model / model /recipe.yaml
whitiger's picture
Upload folder using huggingface_hub
034b1c0 verified
raw
history blame contribute delete
237 Bytes
# Quantization recipe: one stage (`default_stage`) containing one modifier
# group (`default_modifiers`) that configures a single `GPTQModifier`.
# Nesting is significant: every option below must sit under `GPTQModifier`,
# otherwise the stage/modifier keys parse as null and the options become
# unrelated top-level keys.
# NOTE(review): option meanings below are taken from the key names and the
# usual llm-compressor GPTQModifier options -- confirm against the library
# version that consumes this file.
default_stage:
  default_modifiers:
    GPTQModifier:
      # Which modules the modifier is applied to.
      targets: [Linear]
      # Modules excluded from `targets` (presumably matched by name).
      ignore: [embed_tokens, lm_head]
      # Preset scheme name; presumably 8-bit weights / 16-bit activations.
      scheme: W8A16
      # Presumably the number of columns processed per GPTQ block -- TODO confirm.
      block_size: 128
      # Presumably the Hessian dampening fraction -- TODO confirm.
      dampening_frac: 0.1
      # Activation-ordering strategy; a plain string, not a boolean.
      actorder: static
      # Real boolean (not a quoted string).
      offload_hessians: false