| {"ts": "2025-12-19T19:41:40Z", "run": "e6f28dfc458847cc825acfc40a1937dc", "impl": "torch_eager", "tags": {"family": "pytorch", "backend": "eager"}, "wl": {"name": "cuda_B1_Q100_H8_E256_L4_P4", "batch_size": 1, "num_queries": 100, "num_heads": 8, "embed_dim": 256, "num_levels": 4, "num_points": 4, "spatial_shapes": [[32, 32], [16, 16], [8, 8], [4, 4]], "dtype": "float32", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-6.12.58-82.121.amzn2023.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 3.4261789999732173, "p50": 3.457469000011315, "p90": 3.459429999963959, "mean": 3.4539671999937127, "iqr": 0.0022309999962999427, "raw_times": [3.459429999963959, 3.4695590000524135, 3.457469000011315, 3.457198999967659, 3.4261789999732173], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 3.4921710000048733, "peak_bytes": 5929472, "ok": true, "absmax": 0.0, "corr": {"ok": true, "rtol": 1e-05, "atol": 1e-05, "absmax": 0.0, "mae": 0.0, "mse": 0.0, "ref": "deformable_detr_torch"}, "err": null} | |
| {"ts": "2025-12-19T19:41:40Z", "run": "e6f28dfc458847cc825acfc40a1937dc", "impl": "torch_eager", "tags": {"family": "pytorch", "backend": "eager"}, "wl": {"name": "cuda_B1_Q300_H8_E256_L4_P4", "batch_size": 1, "num_queries": 300, "num_heads": 8, "embed_dim": 256, "num_levels": 4, "num_points": 4, "spatial_shapes": [[32, 32], [16, 16], [8, 8], [4, 4]], "dtype": "float32", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-6.12.58-82.121.amzn2023.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 4.229746999953932, "p50": 4.235096999991583, "p90": 4.236528000035378, "mean": 4.242877599995154, "iqr": 0.0027010000280824897, "raw_times": [4.236528000035378, 4.235096999991583, 4.279188999987582, 4.233827000007295, 4.229746999953932], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 4.256637999958457, "peak_bytes": 15161856, "ok": true, "absmax": 0.0, "corr": {"ok": true, "rtol": 1e-05, "atol": 1e-05, "absmax": 0.0, "mae": 0.0, "mse": 0.0, "ref": "deformable_detr_torch"}, "err": null} | |
| {"ts": "2025-12-19T19:41:41Z", "run": "e6f28dfc458847cc825acfc40a1937dc", "impl": "torch_eager", "tags": {"family": "pytorch", "backend": "eager"}, "wl": {"name": "cuda_B2_Q100_H8_E256_L4_P4", "batch_size": 2, "num_queries": 100, "num_heads": 8, "embed_dim": 256, "num_levels": 4, "num_points": 4, "spatial_shapes": [[32, 32], [16, 16], [8, 8], [4, 4]], "dtype": "float32", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-6.12.58-82.121.amzn2023.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 4.2112570000085725, "p50": 4.251798000041163, "p90": 4.262317999973675, "mean": 4.247635800004446, "iqr": 0.04195999997591571, "raw_times": [4.2112570000085725, 4.262317999973675, 4.220357999997759, 4.251798000041163, 4.292448000001059], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 4.28278900000123, "peak_bytes": 11958784, "ok": true, "absmax": 0.0, "corr": {"ok": true, "rtol": 1e-05, "atol": 1e-05, "absmax": 0.0, "mae": 0.0, "mse": 0.0, "ref": "deformable_detr_torch"}, "err": null} | |
| {"ts": "2025-12-19T19:41:41Z", "run": "e6f28dfc458847cc825acfc40a1937dc", "impl": "torch_eager", "tags": {"family": "pytorch", "backend": "eager"}, "wl": {"name": "cuda_B2_Q300_H8_E256_L4_P4", "batch_size": 2, "num_queries": 300, "num_heads": 8, "embed_dim": 256, "num_levels": 4, "num_points": 4, "spatial_shapes": [[32, 32], [16, 16], [8, 8], [4, 4]], "dtype": "float32", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-6.12.58-82.121.amzn2023.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 4.324839999981123, "p50": 4.342328999996425, "p90": 4.349751000006563, "mean": 4.3508561999942685, "iqr": 0.022982000018600957, "raw_times": [4.326768999987962, 4.410591999999269, 4.342328999996425, 4.324839999981123, 4.349751000006563], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 4.316158999984054, "peak_bytes": 30977024, "ok": true, "absmax": 0.0, "corr": {"ok": true, "rtol": 1e-05, "atol": 1e-05, "absmax": 0.0, "mae": 0.0, "mse": 0.0, "ref": "deformable_detr_torch"}, "err": null} | |