Update README.md
Browse files
README.md
CHANGED
|
@@ -202,9 +202,9 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
| 202 |
</td>
|
| 203 |
<td>78.06
|
| 204 |
</td>
|
| 205 |
-
<td>77.
|
| 206 |
</td>
|
| 207 |
-
<td>99.
|
| 208 |
</td>
|
| 209 |
</tr>
|
| 210 |
<tr>
|
|
@@ -212,9 +212,9 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
| 212 |
</td>
|
| 213 |
<td>54.48
|
| 214 |
</td>
|
| 215 |
-
<td>54.
|
| 216 |
</td>
|
| 217 |
-
<td>99.
|
| 218 |
</td>
|
| 219 |
</tr>
|
| 220 |
<tr>
|
|
@@ -222,7 +222,7 @@ This version of the lm-evaluation-harness includes versions of MMLU, ARC-Challen
|
|
| 222 |
</td>
|
| 223 |
<td><strong>74.05</strong>
|
| 224 |
</td>
|
| 225 |
-
<td><strong>74.
|
| 226 |
</td>
|
| 227 |
<td><strong>100.0%</strong>
|
| 228 |
</td>
|
|
|
|
| 202 |
</td>
|
| 203 |
<td>78.06
|
| 204 |
</td>
|
| 205 |
+
<td>77.51
|
| 206 |
</td>
|
| 207 |
+
<td>99.3%
|
| 208 |
</td>
|
| 209 |
</tr>
|
| 210 |
<tr>
|
|
|
|
| 212 |
</td>
|
| 213 |
<td>54.48
|
| 214 |
</td>
|
| 215 |
+
<td>54.41
|
| 216 |
</td>
|
| 217 |
+
<td>99.9%
|
| 218 |
</td>
|
| 219 |
</tr>
|
| 220 |
<tr>
|
|
|
|
| 222 |
</td>
|
| 223 |
<td><strong>74.05</strong>
|
| 224 |
</td>
|
| 225 |
+
<td><strong>74.06</strong>
|
| 226 |
</td>
|
| 227 |
<td><strong>100.0%</strong>
|
| 228 |
</td>
|