File size: 1,440 Bytes
bf80d19 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 |
Task , Accuracy , Centered
hellaswag_zeroshot , 0.451504 , 0.268672
jeopardy , 0.121398 , 0.121398
bigbench_qa_wikidata , 0.527828 , 0.527828
arc_easy , 0.648569 , 0.531425
arc_challenge , 0.343857 , 0.125142
copa , 0.680000 , 0.360000
commonsense_qa , 0.291564 , 0.114455
piqa , 0.695865 , 0.391730
openbook_qa , 0.352000 , 0.136000
lambada_openai , 0.354939 , 0.354939
hellaswag , 0.447520 , 0.263361
winograd , 0.630037 , 0.260073
winogrande , 0.550908 , 0.101815
bigbench_dyck_languages , 0.108000 , 0.108000
agi_eval_lsat_ar , 0.308696 , 0.135870
bigbench_cs_algorithms , 0.371970 , 0.371970
bigbench_operators , 0.142857 , 0.142857
bigbench_repeat_copy_logic , 0.000000 , 0.000000
squad , 0.252791 , 0.252791
coqa , 0.193160 , 0.193160
boolq , 0.529969 , -0.236923
bigbench_language_identification , 0.251200 , 0.176238
CORE , , 0.213673
|