{ "model": "tabnet", "subset": "PE", "quant": "fp32", "model_size_mb": 140.154, "original_size_mb": 7.43, "size_reduction_pct": -1786.3, "latency_ms": { "cold_batch1": 5.664, "warm_batch1": 4.402, "warm_batch16": 10.607, "warm_batch256": 156.092, "throughput_batch1": 227.2, "ms_per_sample_batch1": 4.402, "throughput_batch16": 1508.4, "ms_per_sample_batch16": 0.6629, "throughput_batch256": 1640.1, "ms_per_sample_batch256": 0.6097 }, "original_latency_ms": { "cold_batch1": 10.918, "warm_batch1": 10.183, "warm_batch16": 21.887, "warm_batch256": 111.527, "throughput_batch1": 98.2, "ms_per_sample_batch1": 10.183, "throughput_batch16": 731.0, "ms_per_sample_batch16": 1.3679, "throughput_batch256": 2295.4, "ms_per_sample_batch256": 0.4357 }, "test_metrics": { "roc_auc": 0.9948456613505301, "pr_auc": 0.9951360774507333, "tpr_at_1pct_fpr": 0.9194977105036892, "n_samples": 100000, "n_positive": 50011, "auc_delta_vs_original": -0.00027 }, "peak_rss_delta_mb": 0.3, "platform": "macOS-15.7.7-arm64-arm-64bit", "platform_short": "darwin-arm64" }