DJLougen's picture
Upload NV_FP4 quantized model
086284e verified
{
"model_id": "deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct",
"format": "NV_FP4",
"block_size": 32,
"stats": {
"quantized_count": 5207,
"skipped_count": 84,
"original_bytes": 31412968448,
"quantized_bytes": 9438010368
},
"compression_ratio": 3.32834646532145
}