{ "n_samples": 800, "wall_time_s": 10.670467825140804, "throughput_samples_per_s": 74.9732826254451, "gpu_total_kernel_ms": 30.791999965906143, "gpu_ms_per_sample": 0.03848999995738268, "gpu_avg_ms_per_batch": 0.6158399993181228, "gpu_peak_mem_MB": 132.611328125, "telemetry_pre": { "cpu_freq_current_MHz": 2122.2947857142844, "cpu_freq_max_MHz": 4000.0, "cpu_util_pct": 9.3, "cpu_count_logical": 224, "cpu_count_physical": 112, "gpu_util_pct": 0, "gpu_mem_util_pct": 0, "gpu_mem_used_MB": 1777.0625, "gpu_mem_total_MB": 183359.0, "gpu_sm_clock_MHz": 1965, "gpu_mem_clock_MHz": 3996, "gpu_power_W": 188.923, "gpu_temp_C": 30 }, "telemetry_post": { "cpu_freq_current_MHz": 2181.8124866071416, "cpu_freq_max_MHz": 4000.0, "cpu_util_pct": 30.9, "cpu_count_logical": 224, "cpu_count_physical": 112, "gpu_util_pct": 1, "gpu_mem_util_pct": 0, "gpu_mem_used_MB": 1777.0625, "gpu_mem_total_MB": 183359.0, "gpu_sm_clock_MHz": 1965, "gpu_mem_clock_MHz": 3996, "gpu_power_W": 189.44, "gpu_temp_C": 30 } }