File size: 2,693 Bytes
2edd871
aa3daac
2edd871
 
 
 
d91b463
2edd871
 
 
 
 
 
 
 
 
 
 
d91b463
2edd871
 
 
 
 
 
 
 
 
 
 
d91b463
2edd871
 
 
 
 
 
 
 
 
 
 
d91b463
2edd871
 
ddebd57
969ee51
ddebd57
 
2edd871
 
 
 
 
d91b463
2edd871
 
 
 
 
 
 
 
 
 
 
d91b463
2edd871
 
 
 
 
 
 
 
 
 
 
d91b463
2edd871
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
{
  "developer": "AI2",
  "models": [
    {
      "id": "ai2/llama-2-chat-7b-nectar-3.8m.json",
      "name": "ai2/llama-2-chat-7b-nectar-3.8m.json",
      "developer": "AI2",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "reward-bench/Score": 0.5843,
        "reward-bench/Chat": 0.8631,
        "reward-bench/Chat Hard": 0.2654,
        "reward-bench/Safety": 0.6243
      }
    },
    {
      "id": "ai2/llama-2-chat-nectar-180k.json",
      "name": "ai2/llama-2-chat-nectar-180k.json",
      "developer": "AI2",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "reward-bench/Score": 0.5235,
        "reward-bench/Chat": 0.8827,
        "reward-bench/Chat Hard": 0.2851,
        "reward-bench/Safety": 0.4027
      }
    },
    {
      "id": "ai2/llama-2-chat-ultrafeedback-60k.jsonl",
      "name": "ai2/llama-2-chat-ultrafeedback-60k.jsonl",
      "developer": "AI2",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "reward-bench/Score": 0.644,
        "reward-bench/Chat": 0.9441,
        "reward-bench/Chat Hard": 0.4539,
        "reward-bench/Safety": 0.5338
      }
    },
    {
      "id": "ai2/tulu-2-7b-rm-v0-nectar-binarized-3.8m-check...",
      "name": "ai2/tulu-2-7b-rm-v0-nectar-binarized-3.8m-check...",
      "developer": "AI2",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "reward-bench/Score": 0.7008,
        "reward-bench/Chat": 0.9385,
        "reward-bench/Chat Hard": 0.3882,
        "reward-bench/Safety": 0.7757
      }
    },
    {
      "id": "ai2/tulu-2-7b-rm-v0-nectar-binarized-700k.json",
      "name": "ai2/tulu-2-7b-rm-v0-nectar-binarized-700k.json",
      "developer": "AI2",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "reward-bench/Score": 0.7127,
        "reward-bench/Chat": 0.9358,
        "reward-bench/Chat Hard": 0.4079,
        "reward-bench/Safety": 0.7946
      }
    },
    {
      "id": "ai2/tulu-2-7b-rm-v0-nectar-binarized.json",
      "name": "ai2/tulu-2-7b-rm-v0-nectar-binarized.json",
      "developer": "AI2",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "reward-bench/Score": 0.6756,
        "reward-bench/Chat": 0.9134,
        "reward-bench/Chat Hard": 0.3904,
        "reward-bench/Safety": 0.723
      }
    },
    {
      "id": "ai2/tulu-2-7b-rm-v0.json",
      "name": "ai2/tulu-2-7b-rm-v0.json",
      "developer": "AI2",
      "evaluator_relationship": null,
      "benchmark_scores": {
        "reward-bench/Score": 0.6655,
        "reward-bench/Chat": 0.933,
        "reward-bench/Chat Hard": 0.4539,
        "reward-bench/Safety": 0.6095
      }
    }
  ]
}