{ "model": "tabnet", "subset": "APK", "quant": "fp32", "model_size_mb": 13.457, "original_size_mb": 3.25, "size_reduction_pct": -314.1, "latency_ms": { "cold_batch1": 0.765, "warm_batch1": 0.846, "warm_batch16": 2.56, "warm_batch256": 39.071, "throughput_batch1": 1182.0, "ms_per_sample_batch1": 0.846, "throughput_batch16": 6250.0, "ms_per_sample_batch16": 0.16, "throughput_batch256": 6552.2, "ms_per_sample_batch256": 0.1526 }, "original_latency_ms": { "cold_batch1": 2.01, "warm_batch1": 1.776, "warm_batch16": 6.445, "warm_batch256": 24.723, "throughput_batch1": 563.1, "ms_per_sample_batch1": 1.776, "throughput_batch16": 2482.5, "ms_per_sample_batch16": 0.4028, "throughput_batch256": 10354.7, "ms_per_sample_batch256": 0.0966 }, "test_metrics": { "roc_auc": 0.9741325381944445, "pr_auc": 0.9752553810358323, "tpr_at_1pct_fpr": 0.7027916666666667, "n_samples": 96000, "n_positive": 48000, "auc_delta_vs_original": 0.0 }, "peak_rss_delta_mb": 0.0, "platform": "macOS-15.7.7-arm64-arm-64bit", "platform_short": "darwin-arm64" }