{ "quantization_stats": { "original_size_mb": 6362.53515625, "quantized_size_mb": 2223.747215270996, "size_reduction_mb": 4138.787940979004, "size_reduction_percent": 65.04935280260761, "compression_ratio": 2.8611773463085064, "n_quantized_layers": 2342 }, "safetensors_size_mb": 3352.126941680908, "mbq_config": { "w_bit": 4, "a_bit": 8, "mixed_precision": true, "sensitivity_metric": "hessian", "calibration_samples": 128, "preserve_ratio": 0.15 }, "model_info": { "base_model": "deepseek-ai/DeepSeek-OCR", "total_params": 3336106240, "quantized_layers": 2342 }, "bit_allocation_summary": { "8-bit": 351, "4-bit": 1991 }, "files": { "model.safetensors": "3352.13 MB", "quantized_weights.pt": "Compressed quantized weights", "config.json": "Model configuration", "tokenizer files": "Tokenizer configuration" } }