| { | |
| "baseline_gb": 10.78, | |
| "results": [ | |
| { | |
| "phase": "Phase 1a", | |
| "method": "FP8 (float8_e4m3fn)", | |
| "model_MB": 5219, | |
| "total_MB": 6919, | |
| "total_GB": 6.76, | |
| "compression": 1.6 | |
| }, | |
| { | |
| "phase": "Phase 2b", | |
| "method": "INT8", | |
| "model_MB": 5219, | |
| "total_MB": 6919, | |
| "total_GB": 6.76, | |
| "compression": 1.6 | |
| }, | |
| { | |
| "phase": "Phase 1b/2a", | |
| "method": "INT4", | |
| "model_MB": 3229, | |
| "total_MB": 4929, | |
| "total_GB": 4.81, | |
| "compression": 2.24 | |
| }, | |
| { | |
| "phase": "Phase 2c", | |
| "method": "INT3", | |
| "model_MB": 2685, | |
| "total_MB": 4385, | |
| "total_GB": 4.28, | |
| "compression": 2.52 | |
| }, | |
| { | |
| "phase": "Phase 3", | |
| "method": "INT2", | |
| "model_MB": 2141, | |
| "total_MB": 3841, | |
| "total_GB": 3.75, | |
| "compression": 2.88 | |
| } | |
| ], | |
| "hybrid_gb": 4.91, | |
| "hybrid_ratio": 2.19 | |
| } |