{"ts": "2025-10-31T20:00:11Z", "run": "f2cf664f6646484f88815be637f5bc9d", "impl": "torch_layer_norm", "tags": {"family": "torch", "op": "layer_norm"}, "wl": {"name": "LN_B16_S2048_D4096", "batch": 16, "seq_len": 2048, "hidden_dim": 4096, "dtype": "bfloat16", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-5.10.244-240.970.amzn2.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 0.807951000012963, "p50": 0.8174310000299556, "p90": 0.8198709999760467, "mean": 0.8162470000002031, "iqr": 0.0038399999766625115, "raw_times": [0.8160309999993842, 0.8198709999760467, 0.8174310000299556, 0.807951000012963, 0.819950999982666], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 0.8318710000025931, "peak_bytes": 2415935488, "ok": true, "absmax": 0.03125, "corr": {"ok": true, "rtol": 0.001, "atol": 0.03125, "absmax": 0.03125, "mae": 0.0015411376953125, "mse": 1.1205673217773438e-05, "ref": "layer_norm_ref"}, "err": null} {"ts": "2025-10-31T20:00:11Z", "run": "f2cf664f6646484f88815be637f5bc9d", "impl": "torch_layer_norm", "tags": {"family": "torch", "op": "layer_norm"}, "wl": {"name": "LN_B16_S2048_D8192", "batch": 16, "seq_len": 2048, "hidden_dim": 8192, "dtype": "bfloat16", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-5.10.244-240.970.amzn2.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 1.6729929999996784, "p50": 1.6790130000003956, "p90": 1.685203000022284, "mean": 1.6802827999867986, "iqr": 0.007120000077520672, "raw_times": [1.685203000022284, 1.6790130000003956, 1.6729929999996784, 1.686121999966872, 1.6780829999447633], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 1.6821429999822612, "peak_bytes": 4831870976, "ok": true, "absmax": 0.03125, "corr": {"ok": true, "rtol": 0.001, "atol": 0.03125, "absmax": 0.03125, "mae": 0.0015106201171875, "mse": 1.1086463928222656e-05, "ref": "layer_norm_ref"}, "err": null} {"ts": "2025-10-31T20:00:12Z", "run": "f2cf664f6646484f88815be637f5bc9d", "impl": "torch_layer_norm", "tags": {"family": "torch", "op": "layer_norm"}, "wl": {"name": "LN_B16_S4096_D4096", "batch": 16, "seq_len": 4096, "hidden_dim": 4096, "dtype": "bfloat16", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-5.10.244-240.970.amzn2.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 1.6009309999844845, "p50": 1.6056009999942944, "p90": 1.611341000000266, "mean": 1.606853000009778, "iqr": 0.008409999963987502, "raw_times": [1.6009309999844845, 1.6056009999942944, 1.613461000033567, 1.6029310000362784, 1.611341000000266], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 1.6386120000220217, "peak_bytes": 4831854592, "ok": true, "absmax": 0.03125, "corr": {"ok": true, "rtol": 0.001, "atol": 0.03125, "absmax": 0.03125, "mae": 0.0015411376953125, "mse": 1.1205673217773438e-05, "ref": "layer_norm_ref"}, "err": null} {"ts": "2025-10-31T20:00:12Z", "run": "f2cf664f6646484f88815be637f5bc9d", "impl": "torch_layer_norm", "tags": {"family": "torch", "op": "layer_norm"}, "wl": {"name": "LN_B16_S4096_D8192", "batch": 16, "seq_len": 4096, "hidden_dim": 8192, "dtype": "bfloat16", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-5.10.244-240.970.amzn2.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 3.3123249999675863, "p50": 3.327974000001177, "p90": 3.3289149999973233, "mean": 3.3240905999946335, "iqr": 0.010180999993281148, "raw_times": [3.3325050000030387, 3.3289149999973233, 3.3123249999675863, 3.318734000004042, 3.327974000001177], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 3.335275000040383, "peak_bytes": 9663709184, "ok": true, "absmax": 0.03125, "corr": {"ok": true, "rtol": 0.001, "atol": 0.03125, "absmax": 0.03125, "mae": 0.0015106201171875, "mse": 1.1026859283447266e-05, "ref": "layer_norm_ref"}, "err": null}