FORGE-Nano-Benchmark / benchmarks /bench_02_student_build.json
ilessio-aiflowlab's picture
Upload benchmarks/bench_02_student_build.json with huggingface_hub
aa55379 verified
{
"benchmark": "student_build",
"timestamp": "2026-03-19T11:53:02.682225+00:00",
"variant": "nano",
"device": "NVIDIA L4",
"build_time_cpu_s": 5.32,
"build_time_gpu_s": 1.22,
"params": {
"total": 967930567,
"total_m": 967.9,
"trainable": 495637127,
"trainable_m": 495.6,
"frozen": 472293440,
"frozen_m": 472.3,
"trainable_pct": 51.2
},
"components": {
"vision_m": 428.2,
"bridge_m": 39.7,
"language_m": 498.4,
"action_head_m": 1.7
},
"memory": {
"loaded_gb": 3.87,
"peak_gb": 4.65
},
"output_shapes": {
"actions": [
1,
7
],
"vision_features": [
1,
64,
896
]
},
"latency_fp32_b1": {
"mean_ms": 131.57,
"std_ms": 2.77,
"p50_ms": 131.85,
"p95_ms": 135.09,
"p99_ms": 135.68,
"min_ms": 118.81,
"max_ms": 135.89,
"fps": 7.6,
"n_samples": 50
},
"latency_fp32_b2": {
"mean_ms": 230.66,
"std_ms": 9.28,
"p50_ms": 227.98,
"p95_ms": 238.16,
"p99_ms": 263.46,
"min_ms": 222.53,
"max_ms": 271.12,
"fps": 4.3,
"n_samples": 25
},
"latency_fp32_b4": {
"mean_ms": 444.77,
"std_ms": 7.73,
"p50_ms": 442.78,
"p95_ms": 455.93,
"p99_ms": 457.17,
"min_ms": 429.48,
"max_ms": 457.52,
"fps": 2.2,
"n_samples": 25
},
"latency_fp16_b1": {
"mean_ms": 87.35,
"std_ms": 1.89,
"p50_ms": 86.74,
"p95_ms": 91.94,
"p99_ms": 94.54,
"min_ms": 86.27,
"max_ms": 94.88,
"fps": 11.4,
"n_samples": 50
},
"fp16_speedup": 1.51,
"batch_scaling": {
"b1_fps": 7.6,
"b2_fps": 8.7,
"b4_fps": 9.0
}
}