{
  "model_type": "HunyuanImage-3.0-Instruct",
  "quantization_method": "bitsandbytes_int8",
  "load_in_8bit": true,
  "llm_int8_threshold": 6.0,
  "expected_vram_gb": 95,
  "expected_total_memory_gb": 100,
  "modules_kept_bf16": [
    "vae",
    "vision_model",
    "vision_aligner",
    "patch_embed",
    "final_layer",
    "time_embed",
    "time_embed_2",
    "timestep_emb",
    "attention_projections"
  ],
  "notes": "Instruct model with vision encoder kept at BF16 for image understanding quality.",
  "attention_layers_quantized": false,
  "quality_vs_nf4": "Significantly better - approximately 2x memory for ~98% quality retention"
}