# Hugging Face file-viewer header captured with this file (not recipe content):
#   jpodivin's picture
#   Upload folder using huggingface_hub
#   184b190 verified
#   raw
#   history blame contribute delete
#   200 Bytes
# Quantization recipe: a single stage (`default_stage`) whose modifier group
# (`default_modifiers`) contains one `QuantizationModifier` entry.
# The nesting is significant: `targets`, `ignore` and `scheme` are arguments of
# the modifier, not top-level keys.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # Names the modifier is applied to.
      # NOTE(review): presumably module class names — confirm against the
      # consumer's schema.
      targets:
        - Linear
        - GraniteMoeHybridParallelExpertsLinear
      # Entries excluded from the modifier.
      # NOTE(review): the `re:` prefix presumably marks a regular expression
      # matched against module names; the `.` before `router` is unescaped and
      # so would match any character — confirm this is intended.
      ignore:
        - lm_head
        - 're:.*block_sparse_moe.router'
      # Preset scheme name.
      # NOTE(review): presumably 8-bit weights / 8-bit activations — confirm
      # against the quantization library's preset list.
      scheme: W8A8