File size: 1,319 Bytes
2edd871
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
{
  "developer": "AGI-0",
  "models": [
    {
      "id": "AGI-0/Art-v0-3B",
      "name": "Art-v0-3B",
      "developer": "AGI-0",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "hfopenllm_v2/IFEval": 0.3192,
        "hfopenllm_v2/BBH": 0.3401,
        "hfopenllm_v2/MATH Level 5": 0.2462,
        "hfopenllm_v2/GPQA": 0.2592,
        "hfopenllm_v2/MUSR": 0.3768,
        "hfopenllm_v2/MMLU-PRO": 0.1179
      }
    },
    {
      "id": "AGI-0/Artificium-llama3.1-8B-001",
      "name": "Artificium-llama3.1-8B-001",
      "developer": "AGI-0",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "hfopenllm_v2/IFEval": 0.5248,
        "hfopenllm_v2/BBH": 0.4256,
        "hfopenllm_v2/MATH Level 5": 0.136,
        "hfopenllm_v2/GPQA": 0.2659,
        "hfopenllm_v2/MUSR": 0.3795,
        "hfopenllm_v2/MMLU-PRO": 0.3182
      }
    },
    {
      "id": "AGI-0/smartllama3.1-8B-001",
      "name": "smartllama3.1-8B-001",
      "developer": "AGI-0",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "hfopenllm_v2/IFEval": 0.3518,
        "hfopenllm_v2/BBH": 0.467,
        "hfopenllm_v2/MATH Level 5": 0.1299,
        "hfopenllm_v2/GPQA": 0.3062,
        "hfopenllm_v2/MUSR": 0.4386,
        "hfopenllm_v2/MMLU-PRO": 0.3487
      }
    }
  ]
}