{ "method": "bitsandbytes", "bits": 4, "quant_type": "nf4", "double_quant": true, "compute_dtype": "bfloat16", "vram_gb": 2.44, "load_time_s": 11.0 }