# Quantization recipe: a single stage holding one GPTQModifier.
# NOTE(review): the nesting below was reconstructed from a flattened copy of
# this file (keys with empty values are taken to be parents of the keys that
# follow) — confirm against the original recipe.
default_stage:
  default_modifiers:
    GPTQModifier:
      # Module selector the modifier is applied to.
      targets: [Linear]
      # Entries excluded from the modifier; each carries an 're:' prefix
      # (presumably marking a regular-expression match on module names —
      # verify against the library's matching rules).
      ignore: ['re:.*lm_head$', 're:.*qkv$', 're:.*fc1$', 're:.*fc2$', 're:.*attn.proj$',
        're:.*up_proj$', 're:.*gate_proj$', 're:.*down_proj$', 're:.*router.query_key_value$']
      # Preset scheme name (presumably 4-bit weights / 16-bit activations — TODO confirm).
      scheme: W4A16
      sequential_update: true
      block_size: 128
      dampening_frac: 0.01
      offload_hessians: false