convert_ct_dequant-e2e / recipe.yaml
nm-autobot's picture
Upload folder using huggingface_hub
d88c6c9 verified
Raw
History Blame Contribute Delete
223 Bytes
# Quantization recipe: one stage (`quant_stage`) holding one modifier
# (`GPTQModifier`). Nesting is significant -- each level below must stay
# indented under its parent, otherwise the keys collapse into a flat
# top-level mapping with null values.
quant_stage:
  quant_modifiers:
    GPTQModifier:
      # Entries listed here are excluded from the modifier.
      # NOTE(review): presumably matched by module name -- confirm against
      # the consuming tool.
      ignore: [lm_head]
      config_groups:
        group_0:
          # Weight settings for this group: 4 bits, `group` strategy with a
          # group size of 128, and `dynamic` turned off.
          weights: {num_bits: 4, strategy: group, group_size: 128, dynamic: false}
          # Entries this group's settings apply to.
          targets: [Linear]