Update README.md
Browse files
README.md
CHANGED
|
@@ -253,26 +253,26 @@ lm_eval \
|
|
| 253 |
<td rowspan="4"><b>Coding</b></td>
|
| 254 |
<td>HumanEval (pass@1)</td>
|
| 255 |
<td>37.90</td>
|
| 256 |
-
<td></td>
|
| 257 |
-
<td><b>%</b></td>
|
| 258 |
</tr>
|
| 259 |
<tr>
|
| 260 |
<td>HumanEval (pass@10)</td>
|
| 261 |
<td>61.30</td>
|
| 262 |
-
<td></td>
|
| 263 |
-
<td>%</td>
|
| 264 |
</tr>
|
| 265 |
<tr>
|
| 266 |
<td>HumanEval+ (pass@1)</td>
|
| 267 |
<td>33.00</td>
|
| 268 |
-
<td></td>
|
| 269 |
-
<td>%</td>
|
| 270 |
</tr>
|
| 271 |
<tr>
|
| 272 |
<td>HumanEval+ (pass@10)</td>
|
| 273 |
<td>55.90</td>
|
| 274 |
-
<td></td>
|
| 275 |
-
<td>%</td>
|
| 276 |
</tr>
|
| 277 |
</tbody>
|
| 278 |
</table>
|
|
|
|
| 253 |
<td rowspan="4"><b>Coding</b></td>
|
| 254 |
<td>HumanEval (pass@1)</td>
|
| 255 |
<td>37.90</td>
|
| 256 |
+
<td>35.70</td>
|
| 257 |
+
<td><b>94.2%</b></td>
|
| 258 |
</tr>
|
| 259 |
<tr>
|
| 260 |
<td>HumanEval (pass@10)</td>
|
| 261 |
<td>61.30</td>
|
| 262 |
+
<td>61.40</td>
|
| 263 |
+
<td>100.2%</td>
|
| 264 |
</tr>
|
| 265 |
<tr>
|
| 266 |
<td>HumanEval+ (pass@1)</td>
|
| 267 |
<td>33.00</td>
|
| 268 |
+
<td>31.90</td>
|
| 269 |
+
<td>96.7%</td>
|
| 270 |
</tr>
|
| 271 |
<tr>
|
| 272 |
<td>HumanEval+ (pass@10)</td>
|
| 273 |
<td>55.90</td>
|
| 274 |
+
<td>55.50</td>
|
| 275 |
+
<td>99.3%</td>
|
| 276 |
</tr>
|
| 277 |
</tbody>
|
| 278 |
</table>
|