{ "benchmark": "model_cpu_offload_cold_warm", "hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)", "mode": "Diffusers enable_model_cpu_offload()", "cache_state": "warm local HF cache; no download time included", "process_isolation": "single model per fresh Python process", "base_resolution": 1024, "aspect_ratio": "1:1", "num_inference_steps": 4, "guidance_scale": 1.0, "dtype": "torch.bfloat16", "definitions": { "load_time_s": "Pipeline load plus enable_model_cpu_offload setup from warm local HF cache; download time excluded.", "cold_generation": "P01, first generation immediately after fresh process load/offload setup.", "warm_generation": "P02-P10 after the cold P01 generation." }, "models": { "base": { "hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)", "mode": "Diffusers enable_model_cpu_offload()", "cache_state": "warm local HF cache; no download time included", "process_isolation": "single model per fresh Python process", "base_resolution": 1024, "aspect_ratio": "1:1", "num_inference_steps": 4, "guidance_scale": 1.0, "dtype": "torch.bfloat16", "kind": "base", "load": { "load_time_s": 15.411, "peak_allocated_gb": 12.582, "peak_reserved_gb": 13.881, "end_allocated_gb": 10.185, "end_reserved_gb": 10.679 }, "summary": { "cold_time_s": 8.434, "cold_peak_allocated_gb": 18.945, "cold_peak_reserved_gb": 19.262, "warm_avg_time_s": 5.731, "warm_median_time_s": 5.141, "warm_avg_peak_allocated_gb": 18.945, "warm_avg_peak_reserved_gb": 19.267, "warm_max_peak_allocated_gb": 18.968, "warm_max_peak_reserved_gb": 19.29 }, "prompts": [ { "id": "P01", "title": "Orbital Night Market", "seed": 101, "time_s": 8.434, "peak_allocated_gb": 18.945, "peak_reserved_gb": 19.262, "end_allocated_gb": 10.221, "end_reserved_gb": 10.895 }, { "id": "P02", "title": "Arctic Research Desk", "seed": 102, "time_s": 5.613, "peak_allocated_gb": 18.949, "peak_reserved_gb": 19.258, "end_allocated_gb": 10.221, "end_reserved_gb": 10.893 }, { "id": "P03", "title": "Victorian Automaton Repair", "seed": 103, "time_s": 4.006, "peak_allocated_gb": 18.944, "peak_reserved_gb": 19.271, "end_allocated_gb": 10.221, "end_reserved_gb": 10.792 }, { "id": "P04", "title": "Mars Greenhouse Control Room", "seed": 104, "time_s": 7.509, "peak_allocated_gb": 18.938, "peak_reserved_gb": 19.258, "end_allocated_gb": 10.221, "end_reserved_gb": 10.872 }, { "id": "P05", "title": "Lost Railway Poster Wall", "seed": 105, "time_s": 4.658, "peak_allocated_gb": 18.939, "peak_reserved_gb": 19.258, "end_allocated_gb": 10.221, "end_reserved_gb": 10.872 }, { "id": "P06", "title": "Miniature Courtroom Diorama", "seed": 106, "time_s": 5.141, "peak_allocated_gb": 18.942, "peak_reserved_gb": 19.271, "end_allocated_gb": 10.221, "end_reserved_gb": 10.792 }, { "id": "P07", "title": "Rainy Seoul Book Cafe", "seed": 107, "time_s": 5.134, "peak_allocated_gb": 18.942, "peak_reserved_gb": 19.271, "end_allocated_gb": 10.221, "end_reserved_gb": 10.792 }, { "id": "P08", "title": "Oceanographic Expedition Map", "seed": 108, "time_s": 4.657, "peak_allocated_gb": 18.942, "peak_reserved_gb": 19.271, "end_allocated_gb": 10.221, "end_reserved_gb": 10.792 }, { "id": "P09", "title": "Renaissance Lab Notebook", "seed": 109, "time_s": 5.944, "peak_allocated_gb": 18.939, "peak_reserved_gb": 19.258, "end_allocated_gb": 10.221, "end_reserved_gb": 10.872 }, { "id": "P10", "title": "Russian Provincial Print Shop", "seed": 110, "time_s": 8.916, "peak_allocated_gb": 18.968, "peak_reserved_gb": 19.29, "end_allocated_gb": 10.221, "end_reserved_gb": 10.798 } ] }, "quant": { "hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)", "mode": "Diffusers enable_model_cpu_offload()", "cache_state": "warm local HF cache; no download time included", "process_isolation": "single model per fresh Python process", "base_resolution": 1024, "aspect_ratio": "1:1", "num_inference_steps": 4, "guidance_scale": 1.0, "dtype": "torch.bfloat16", "kind": "quant", "load": { "load_time_s": 12.371, "peak_allocated_gb": 12.582, "peak_reserved_gb": 13.881, "end_allocated_gb": 10.185, "end_reserved_gb": 10.679 }, "summary": { "cold_time_s": 8.44, "cold_peak_allocated_gb": 15.085, "cold_peak_reserved_gb": 15.238, "warm_avg_time_s": 4.976, "warm_median_time_s": 3.855, "warm_avg_peak_allocated_gb": 15.084, "warm_avg_peak_reserved_gb": 15.249, "warm_max_peak_allocated_gb": 15.104, "warm_max_peak_reserved_gb": 15.28 }, "prompts": [ { "id": "P01", "title": "Orbital Night Market", "seed": 101, "time_s": 8.44, "peak_allocated_gb": 15.085, "peak_reserved_gb": 15.238, "end_allocated_gb": 10.221, "end_reserved_gb": 10.872 }, { "id": "P02", "title": "Arctic Research Desk", "seed": 102, "time_s": 6.726, "peak_allocated_gb": 15.089, "peak_reserved_gb": 15.261, "end_allocated_gb": 10.221, "end_reserved_gb": 10.878 }, { "id": "P03", "title": "Victorian Automaton Repair", "seed": 103, "time_s": 8.244, "peak_allocated_gb": 15.081, "peak_reserved_gb": 15.246, "end_allocated_gb": 10.221, "end_reserved_gb": 10.775 }, { "id": "P04", "title": "Mars Greenhouse Control Room", "seed": 104, "time_s": 4.033, "peak_allocated_gb": 15.079, "peak_reserved_gb": 15.238, "end_allocated_gb": 10.221, "end_reserved_gb": 10.874 }, { "id": "P05", "title": "Lost Railway Poster Wall", "seed": 105, "time_s": 3.836, "peak_allocated_gb": 15.08, "peak_reserved_gb": 15.238, "end_allocated_gb": 10.221, "end_reserved_gb": 10.876 }, { "id": "P06", "title": "Miniature Courtroom Diorama", "seed": 106, "time_s": 3.845, "peak_allocated_gb": 15.08, "peak_reserved_gb": 15.246, "end_allocated_gb": 10.221, "end_reserved_gb": 10.775 }, { "id": "P07", "title": "Rainy Seoul Book Cafe", "seed": 107, "time_s": 3.855, "peak_allocated_gb": 15.08, "peak_reserved_gb": 15.246, "end_allocated_gb": 10.221, "end_reserved_gb": 10.773 }, { "id": "P08", "title": "Oceanographic Expedition Map", "seed": 108, "time_s": 3.841, "peak_allocated_gb": 15.08, "peak_reserved_gb": 15.246, "end_allocated_gb": 10.221, "end_reserved_gb": 10.773 }, { "id": "P09", "title": "Renaissance Lab Notebook", "seed": 109, "time_s": 3.852, "peak_allocated_gb": 15.08, "peak_reserved_gb": 15.238, "end_allocated_gb": 10.221, "end_reserved_gb": 10.876 }, { "id": "P10", "title": "Russian Provincial Print Shop", "seed": 110, "time_s": 6.556, "peak_allocated_gb": 15.104, "peak_reserved_gb": 15.28, "end_allocated_gb": 10.221, "end_reserved_gb": 10.781 } ] } } }