Update README.md
Browse files
README.md
CHANGED
|
@@ -23,4 +23,12 @@ Benchmark Scores
|
|
| 23 |
| Tasks |Version|Filter|n-shot| Metric |Value | |Stderr|
|
| 24 |
|---------|------:|------|-----:|--------|-----:|---|-----:|
|
| 25 |
|hellaswag| 1|none | 0|acc |0.6270|± |0.0048|
|
| 26 |
-
| | |none | 0|acc_norm|0.8228|± |0.0038|
|
| 23 |
| Tasks |Version|Filter|n-shot| Metric |Value | |Stderr|
|
| 24 |
|---------|------:|------|-----:|--------|-----:|---|-----:|
|
| 25 |
|hellaswag| 1|none | 0|acc |0.6270|± |0.0048|
|
| 26 |
+
| | |none | 0|acc_norm|0.8228|± |0.0038|
|
| 27 |
+
|
| 28 |
+
| Groups |Version|Filter|n-shot|Metric|Value | |Stderr|
|
| 29 |
+
|------------------|-------|------|-----:|------|-----:|---|-----:|
|
| 30 |
+
|mmlu |N/A |none | 0|acc |0.6243|± |0.1341|
|
| 31 |
+
| - humanities |N/A |none | 0|acc |0.5717|± |0.1400|
|
| 32 |
+
| - other |N/A |none | 0|acc |0.7016|± |0.1143|
|
| 33 |
+
| - social_sciences|N/A |none | 0|acc |0.7342|± |0.0753|
|
| 34 |
+
| - stem |N/A |none | 0|acc |0.5192|± |0.1257|
|