Spaces:
Running
Running
File size: 2,693 Bytes
2edd871 aa3daac 2edd871 d91b463 2edd871 d91b463 2edd871 d91b463 2edd871 d91b463 2edd871 ddebd57 969ee51 ddebd57 2edd871 d91b463 2edd871 d91b463 2edd871 d91b463 2edd871 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 | {
"developer": "AI2",
"models": [
{
"id": "ai2/llama-2-chat-7b-nectar-3.8m.json",
"name": "ai2/llama-2-chat-7b-nectar-3.8m.json",
"developer": "AI2",
"evaluator_relationship": null,
"benchmark_scores": {
"reward-bench/Score": 0.5843,
"reward-bench/Chat": 0.8631,
"reward-bench/Chat Hard": 0.2654,
"reward-bench/Safety": 0.6243
}
},
{
"id": "ai2/llama-2-chat-nectar-180k.json",
"name": "ai2/llama-2-chat-nectar-180k.json",
"developer": "AI2",
"evaluator_relationship": null,
"benchmark_scores": {
"reward-bench/Score": 0.5235,
"reward-bench/Chat": 0.8827,
"reward-bench/Chat Hard": 0.2851,
"reward-bench/Safety": 0.4027
}
},
{
"id": "ai2/llama-2-chat-ultrafeedback-60k.jsonl",
"name": "ai2/llama-2-chat-ultrafeedback-60k.jsonl",
"developer": "AI2",
"evaluator_relationship": null,
"benchmark_scores": {
"reward-bench/Score": 0.644,
"reward-bench/Chat": 0.9441,
"reward-bench/Chat Hard": 0.4539,
"reward-bench/Safety": 0.5338
}
},
{
"id": "ai2/tulu-2-7b-rm-v0-nectar-binarized-3.8m-check...",
"name": "ai2/tulu-2-7b-rm-v0-nectar-binarized-3.8m-check...",
"developer": "AI2",
"evaluator_relationship": null,
"benchmark_scores": {
"reward-bench/Score": 0.7008,
"reward-bench/Chat": 0.9385,
"reward-bench/Chat Hard": 0.3882,
"reward-bench/Safety": 0.7757
}
},
{
"id": "ai2/tulu-2-7b-rm-v0-nectar-binarized-700k.json",
"name": "ai2/tulu-2-7b-rm-v0-nectar-binarized-700k.json",
"developer": "AI2",
"evaluator_relationship": null,
"benchmark_scores": {
"reward-bench/Score": 0.7127,
"reward-bench/Chat": 0.9358,
"reward-bench/Chat Hard": 0.4079,
"reward-bench/Safety": 0.7946
}
},
{
"id": "ai2/tulu-2-7b-rm-v0-nectar-binarized.json",
"name": "ai2/tulu-2-7b-rm-v0-nectar-binarized.json",
"developer": "AI2",
"evaluator_relationship": null,
"benchmark_scores": {
"reward-bench/Score": 0.6756,
"reward-bench/Chat": 0.9134,
"reward-bench/Chat Hard": 0.3904,
"reward-bench/Safety": 0.723
}
},
{
"id": "ai2/tulu-2-7b-rm-v0.json",
"name": "ai2/tulu-2-7b-rm-v0.json",
"developer": "AI2",
"evaluator_relationship": null,
"benchmark_scores": {
"reward-bench/Score": 0.6655,
"reward-bench/Chat": 0.933,
"reward-bench/Chat Hard": 0.4539,
"reward-bench/Safety": 0.6095
}
}
]
} |