{ "n_samples": 800, "wall_time_s": 2.795652147033252, "throughput_samples_per_s": 286.15863416661495, "gpu_total_kernel_ms": 20.907391980290413, "gpu_ms_per_sample": 0.026134239975363016, "gpu_avg_ms_per_batch": 0.41814783960580826, "gpu_peak_mem_MB": 91.32421875, "telemetry_pre": { "cpu_freq_current_MHz": 1212.3605714285716, "cpu_freq_max_MHz": 4000.0, "cpu_util_pct": 10.1, "cpu_count_logical": 224, "cpu_count_physical": 112, "gpu_util_pct": 1, "gpu_mem_util_pct": 0, "gpu_mem_used_MB": 1679.0625, "gpu_mem_total_MB": 183359.0, "gpu_sm_clock_MHz": 1965, "gpu_mem_clock_MHz": 3996, "gpu_power_W": 198.236, "gpu_temp_C": 34 }, "telemetry_post": { "cpu_freq_current_MHz": 1199.1929687499999, "cpu_freq_max_MHz": 4000.0, "cpu_util_pct": 5.7, "cpu_count_logical": 224, "cpu_count_physical": 112, "gpu_util_pct": 0, "gpu_mem_util_pct": 0, "gpu_mem_used_MB": 1717.0625, "gpu_mem_total_MB": 183359.0, "gpu_sm_clock_MHz": 1965, "gpu_mem_clock_MHz": 3996, "gpu_power_W": 197.954, "gpu_temp_C": 34 } }