{ "n_samples": 800, "wall_time_s": 10.56016085902229, "throughput_samples_per_s": 75.7564217704604, "gpu_total_kernel_ms": 89.66230404376984, "gpu_ms_per_sample": 0.1120778800547123, "gpu_avg_ms_per_batch": 1.7932460808753967, "gpu_peak_mem_MB": 73.56640625, "telemetry_pre": { "cpu_freq_current_MHz": 2012.8739955357153, "cpu_freq_max_MHz": 4000.0, "cpu_util_pct": 17.5, "cpu_count_logical": 224, "cpu_count_physical": 112, "gpu_util_pct": 0, "gpu_mem_util_pct": 0, "gpu_mem_used_MB": 1679.0625, "gpu_mem_total_MB": 183359.0, "gpu_sm_clock_MHz": 1965, "gpu_mem_clock_MHz": 3996, "gpu_power_W": 190.437, "gpu_temp_C": 31 }, "telemetry_post": { "cpu_freq_current_MHz": 1862.516486607143, "cpu_freq_max_MHz": 4000.0, "cpu_util_pct": 20.3, "cpu_count_logical": 224, "cpu_count_physical": 112, "gpu_util_pct": 1, "gpu_mem_util_pct": 0, "gpu_mem_used_MB": 1679.0625, "gpu_mem_total_MB": 183359.0, "gpu_sm_clock_MHz": 1965, "gpu_mem_clock_MHz": 3996, "gpu_power_W": 190.592, "gpu_temp_C": 31 } }