{ "model": "tabnet", "subset": "all", "quant": "fp32", "model_size_mb": 140.154, "original_size_mb": 7.433, "size_reduction_pct": -1785.6, "latency_ms": { "cold_batch1": 5.73, "warm_batch1": 4.788, "warm_batch16": 13.262, "warm_batch256": 181.755, "throughput_batch1": 208.9, "ms_per_sample_batch1": 4.788, "throughput_batch16": 1206.5, "ms_per_sample_batch16": 0.8289, "throughput_batch256": 1408.5, "ms_per_sample_batch256": 0.71 }, "original_latency_ms": { "cold_batch1": 8.63, "warm_batch1": 10.467, "warm_batch16": 22.009, "warm_batch256": 106.04, "throughput_batch1": 95.5, "ms_per_sample_batch1": 10.467, "throughput_batch16": 727.0, "ms_per_sample_batch16": 1.3756, "throughput_batch256": 2414.2, "ms_per_sample_batch256": 0.4142 }, "test_metrics": { "roc_auc": 0.9922211951695316, "pr_auc": 0.9915223853617919, "tpr_at_1pct_fpr": 0.8911692412221978, "n_samples": 100000, "n_positive": 50041, "auc_delta_vs_original": 6.7e-05 }, "peak_rss_delta_mb": 7.9, "platform": "macOS-15.7.7-arm64-arm-64bit", "platform_short": "darwin-arm64" }