Update README.md
Browse files
README.md
CHANGED
|
@@ -190,9 +190,9 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
| 190 |
</td>
|
| 191 |
<td>80.47
|
| 192 |
</td>
|
| 193 |
-
<td>
|
| 194 |
</td>
|
| 195 |
-
<td>
|
| 196 |
</td>
|
| 197 |
</tr>
|
| 198 |
<tr>
|
|
@@ -220,9 +220,9 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
| 220 |
</td>
|
| 221 |
<td><strong>74.25</strong>
|
| 222 |
</td>
|
| 223 |
-
<td><strong>73.
|
| 224 |
</td>
|
| 225 |
-
<td><strong>98.
|
| 226 |
</td>
|
| 227 |
</tr>
|
| 228 |
</table>
|
|
|
|
| 190 |
</td>
|
| 191 |
<td>80.47
|
| 192 |
</td>
|
| 193 |
+
<td>79.87
|
| 194 |
</td>
|
| 195 |
+
<td>99.3%
|
| 196 |
</td>
|
| 197 |
</tr>
|
| 198 |
<tr>
|
|
|
|
| 220 |
</td>
|
| 221 |
<td><strong>74.25</strong>
|
| 222 |
</td>
|
| 223 |
+
<td><strong>73.45</strong>
|
| 224 |
</td>
|
| 225 |
+
<td><strong>98.9%</strong>
|
| 226 |
</td>
|
| 227 |
</tr>
|
| 228 |
</table>
|