{ "n_samples": 1600, "wall_time_s": 17.874322760966606, "throughput_samples_per_s": 89.51388096750891, "gpu_total_kernel_ms": 95.65203130245209, "gpu_ms_per_sample": 0.059782519564032556, "gpu_avg_ms_per_batch": 1.9130406260490418, "gpu_peak_mem_MB": 141.931640625, "telemetry_pre": { "cpu_freq_current_MHz": 1611.7592142857138, "cpu_freq_max_MHz": 4000.0, "cpu_util_pct": 11.8, "cpu_count_logical": 224, "cpu_count_physical": 112, "gpu_util_pct": 0, "gpu_mem_util_pct": 0, "gpu_mem_used_MB": 1707.0625, "gpu_mem_total_MB": 183359.0, "gpu_sm_clock_MHz": 1965, "gpu_mem_clock_MHz": 3996, "gpu_power_W": 193.651, "gpu_temp_C": 34 }, "telemetry_post": { "cpu_freq_current_MHz": 1583.5828526785713, "cpu_freq_max_MHz": 4000.0, "cpu_util_pct": 13.6, "cpu_count_logical": 224, "cpu_count_physical": 112, "gpu_util_pct": 0, "gpu_mem_util_pct": 0, "gpu_mem_used_MB": 1801.0625, "gpu_mem_total_MB": 183359.0, "gpu_sm_clock_MHz": 1965, "gpu_mem_clock_MHz": 3996, "gpu_power_W": 193.197, "gpu_temp_C": 34 } }