| { | |
| "base_model": "apple/FastVLM-1.5B", | |
| "method": "layer_pruning_shortgpt_bi_score", | |
| "layers_removed": [ | |
| 11, | |
| 12, | |
| 13, | |
| 14 | |
| ], | |
| "n_layers_original": 28, | |
| "n_layers_remaining": 24, | |
| "params_before_M": 1909.2, | |
| "params_after_M": 1722.1, | |
| "param_reduction_pct": 9.8, | |
| "benchmarks": { | |
| "vqav2": { | |
| "accuracy": 0.0, | |
| "avg_latency_s": 0.6425, | |
| "peak_memory_mb": 4825.1, | |
| "avg_memory_mb": 4782.0, | |
| "throughput_sps": 1.555, | |
| "avg_power_w": 144.4, | |
| "avg_gpu_util_pct": 37.2, | |
| "n_samples": 50, | |
| "n_evaluated": 50, | |
| "n_skipped": 0, | |
| "all_failed": false, | |
| "zero_accuracy_warning": true, | |
| "metrics": { | |
| "exact_match": 0.0, | |
| "contains": 0.54, | |
| "token_f1": 0.1875, | |
| "bleu": 0.1296, | |
| "rouge_l": 0.1875 | |
| } | |
| } | |
| } | |
| } |