File size: 911 Bytes
1cea584
 
 
 
 
 
 
 
 
 
 
 
 
6825dd9
563aa1a
1cea584
 
563aa1a
1cea584
563aa1a
 
1cea584
 
563aa1a
 
 
 
 
 
 
1cea584
 
 
 
563aa1a
1cea584
563aa1a
 
 
 
 
1cea584
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
{
  "base_model": "AIDC-AI/Ovis2-4B",
  "method": "layer_pruning_ppl",
  "method_name": "PPL-based (Shortened LLaMA)",
  "layers_removed": [
    3,
    4,
    5,
    6,
    7,
    8,
    10,
    11,
    18,
    19
  ],
  "n_layers_original": 36,
  "n_layers_remaining": 26,
  "params_before_M": 4304.9,
  "params_after_M": 3534.2,
  "param_reduction_pct": 17.9,
  "benchmarks": {
    "vqav2": {
      "accuracy": 0.06,
      "avg_latency_s": 0.5029,
      "peak_memory_mb": 15235.1,
      "avg_memory_mb": 15230.8,
      "throughput_sps": 1.987,
      "avg_power_w": 236.7,
      "avg_gpu_util_pct": 69.1,
      "n_samples": 50,
      "n_evaluated": 50,
      "n_skipped": 0,
      "all_failed": false,
      "zero_accuracy_warning": false,
      "metrics": {
        "exact_match": 0.06,
        "contains": 0.42,
        "token_f1": 0.1762,
        "bleu": 0.135,
        "rouge_l": 0.1762
      }
    }
  }
}