HunyuanImage-3.0-Instruct-NF4 / quantization_metadata.json
EricRollei's picture
Upload folder using huggingface_hub
41ba802 verified
{
"model_type": "HunyuanImage-3.0-Instruct",
"quantization_method": "bitsandbytes_nf4",
"load_in_4bit": true,
"bnb_4bit_quant_type": "nf4",
"bnb_4bit_use_double_quant": true,
"bnb_4bit_compute_dtype": "torch.bfloat16",
"expected_vram_gb": 45,
"modules_kept_bf16": [
"vae",
"vision_model",
"vision_aligner",
"patch_embed",
"final_layer",
"time_embed",
"time_embed_2",
"timestep_emb",
"attention_projections"
],
"notes": "Instruct model with the vision encoder kept at BF16 for image understanding quality; see modules_kept_bf16 for the full list of modules left unquantized.",
"attention_layers_quantized": false
}