HunyuanImage-3.0-Instruct-NF4 / quantization_metadata.json

Upload folder using huggingface_hub

41ba802 verified 5 days ago

619 Bytes

	{
	"model_type": "HunyuanImage-3.0-Instruct",
	"quantization_method": "bitsandbytes_nf4",
	"load_in_4bit": true,
	"bnb_4bit_quant_type": "nf4",
	"bnb_4bit_use_double_quant": true,
	"bnb_4bit_compute_dtype": "torch.bfloat16",
	"expected_vram_gb": 45,
	"modules_kept_bf16": [
	"vae",
	"vision_model",
	"vision_aligner",
	"patch_embed",
	"final_layer",
	"time_embed",
	"time_embed_2",
	"timestep_emb",
	"attention_projections"
	],
	"notes": "Instruct model with vision encoder kept at BF16 for image understanding quality.",
	"attention_layers_quantized": false
	}