{
  "model_type": "HunyuanImage-3.0-Instruct",
  "quantization_method": "bitsandbytes_int8",
  "load_in_8bit": true,
  "llm_int8_threshold": 6.0,
  "expected_vram_gb": 95,
  "expected_total_memory_gb": 100,
  "modules_kept_bf16": [
    "vae",
    "vision_model",
    "vision_aligner",
    "patch_embed",
    "final_layer",
    "time_embed",
    "time_embed_2",
    "timestep_emb",
    "attention_projections"
  ],
  "notes": "Instruct model with vision encoder kept at BF16 for image understanding quality.",
  "attention_layers_quantized": false,
  "quality_vs_nf4": "Significantly better - approximately 2x memory for ~98% quality retention"
}