FastVLM-1.5B-LAYER-PRUNED / pruning_info.json
Azaz666's picture
Upload layer-pruned FastVLM-1.5B (ShortGPT, removed 4 layers)
4bb529f verified
{
"base_model": "apple/FastVLM-1.5B",
"method": "layer_pruning_shortgpt_bi_score",
"layers_removed": [
11,
12,
13,
14
],
"n_layers_original": 28,
"n_layers_remaining": 24,
"params_before_M": 1909.2,
"params_after_M": 1722.1,
"param_reduction_pct": 9.8,
"benchmarks": {
"vqav2": {
"accuracy": 0.0,
"avg_latency_s": 0.6425,
"peak_memory_mb": 4825.1,
"avg_memory_mb": 4782.0,
"throughput_sps": 1.555,
"avg_power_w": 144.4,
"avg_gpu_util_pct": 37.2,
"n_samples": 50,
"n_evaluated": 50,
"n_skipped": 0,
"all_failed": false,
"zero_accuracy_warning": true,
"metrics": {
"exact_match": 0.0,
"contains": 0.54,
"token_f1": 0.1875,
"bleu": 0.1296,
"rouge_l": 0.1875
}
}
}
}