Update README.md
Browse files
README.md
CHANGED
|
@@ -253,26 +253,26 @@ lm_eval \
|
|
| 253 |
<td rowspan="4"><b>Coding</b></td>
|
| 254 |
<td>HumanEval (pass@1)</td>
|
| 255 |
<td>40.80</td>
|
| 256 |
-
<td
|
| 257 |
-
<td><b
|
| 258 |
</tr>
|
| 259 |
<tr>
|
| 260 |
<td>HumanEval (pass@10)</td>
|
| 261 |
<td>64.40</td>
|
| 262 |
-
<td
|
| 263 |
-
<td
|
| 264 |
</tr>
|
| 265 |
<tr>
|
| 266 |
<td>HumanEval+ (pass@1)</td>
|
| 267 |
<td>38.50</td>
|
| 268 |
-
<td
|
| 269 |
-
<td
|
| 270 |
</tr>
|
| 271 |
<tr>
|
| 272 |
<td>HumanEval+ (pass@10)</td>
|
| 273 |
<td>60.40</td>
|
| 274 |
-
<td
|
| 275 |
-
<td
|
| 276 |
</tr>
|
| 277 |
</tbody>
|
| 278 |
</table>
|
|
|
|
| 253 |
<td rowspan="4"><b>Coding</b></td>
|
| 254 |
<td>HumanEval (pass@1)</td>
|
| 255 |
<td>40.80</td>
|
| 256 |
+
<td>48.50</td>
|
| 257 |
+
<td><b>118.9%</b></td>
|
| 258 |
</tr>
|
| 259 |
<tr>
|
| 260 |
<td>HumanEval (pass@10)</td>
|
| 261 |
<td>64.40</td>
|
| 262 |
+
<td>67.10</td>
|
| 263 |
+
<td>104.2%</td>
|
| 264 |
</tr>
|
| 265 |
<tr>
|
| 266 |
<td>HumanEval+ (pass@1)</td>
|
| 267 |
<td>38.50</td>
|
| 268 |
+
<td>45.00</td>
|
| 269 |
+
<td>116.9%</td>
|
| 270 |
</tr>
|
| 271 |
<tr>
|
| 272 |
<td>HumanEval+ (pass@10)</td>
|
| 273 |
<td>60.40</td>
|
| 274 |
+
<td>64.10</td>
|
| 275 |
+
<td>106.1%</td>
|
| 276 |
</tr>
|
| 277 |
</tbody>
|
| 278 |
</table>
|