{ "model": "tabnet", "subset": ".NET", "quant": "fp32", "model_size_mb": 140.154, "original_size_mb": 7.422, "size_reduction_pct": -1788.4, "latency_ms": { "cold_batch1": 5.084, "warm_batch1": 5.465, "warm_batch16": 13.02, "warm_batch256": 176.076, "throughput_batch1": 183.0, "ms_per_sample_batch1": 5.465, "throughput_batch16": 1228.9, "ms_per_sample_batch16": 0.8137, "throughput_batch256": 1453.9, "ms_per_sample_batch256": 0.6878 }, "original_latency_ms": { "cold_batch1": 9.044, "warm_batch1": 9.268, "warm_batch16": 25.687, "warm_batch256": 111.125, "throughput_batch1": 107.9, "ms_per_sample_batch1": 9.268, "throughput_batch16": 622.9, "ms_per_sample_batch16": 1.6054, "throughput_batch256": 2303.7, "ms_per_sample_batch256": 0.4341 }, "test_metrics": { "roc_auc": 0.9923499432769739, "pr_auc": 0.9916205586874096, "tpr_at_1pct_fpr": 0.8700196211908862, "n_samples": 100000, "n_positive": 49946, "auc_delta_vs_original": -0.000126 }, "peak_rss_delta_mb": 5.3, "platform": "macOS-15.7.7-arm64-arm-64bit", "platform_short": "darwin-arm64" }