RightNow-Arabic-0.5B-Turbo / benchmarks.json
Jr23xd23's picture
Upload benchmarks.json with huggingface_hub
47b66db verified
{
"final": {
"copa_ar": {
"alias": "copa_ar",
"acc,none": 0.5280898876404494,
"acc_stderr,none": 0.05321600047878916,
"acc_norm,none": 0.5842696629213483,
"acc_norm_stderr,none": 0.05253771631269923
},
"arabic_mt_hellaswag": {
"alias": "arabic_mt_hellaswag",
"acc,none": 0.195,
"acc_stderr,none": 0.028085923439997246,
"acc_norm,none": 0.26,
"acc_norm_stderr,none": 0.031093957143700304
},
"arabic_leaderboard_arabic_mmlu": {
"acc,none": 0.23238593052379397,
"acc_stderr,none": 0.0043980977605237925,
"acc_norm,none": 0.23238593052379397,
"acc_norm_stderr,none": 0.0043980977605237925,
"alias": "arabic_leaderboard_arabic_mmlu"
}
},
"baseline": {
"copa_ar": {
"alias": "copa_ar",
"acc,none": 0.5617977528089888,
"acc_stderr,none": 0.05289150964557706,
"acc_norm,none": 0.5393258426966292,
"acc_norm_stderr,none": 0.05313506354909072
},
"arabic_mt_hellaswag": {
"alias": "arabic_mt_hellaswag",
"acc,none": 0.225,
"acc_stderr,none": 0.029601626330440618,
"acc_norm,none": 0.225,
"acc_norm_stderr,none": 0.029601626330440618
},
"arabic_leaderboard_arabic_mmlu": {
"acc,none": 0.2598279429380377,
"acc_stderr,none": 0.004566720578133093,
"acc_norm,none": 0.2598279429380377,
"acc_norm_stderr,none": 0.004566720578133093,
"alias": "arabic_leaderboard_arabic_mmlu"
}
}
}