| episode,difficulty,reward_mean,reward_max,success_rate,steps_mean | |
| 25,hard,-10.124,-8.4,0.0,58.0 | |
| 50,hard,-11.184,-9.0,0.0,58.4 | |
| 75,hard,-11.468,-9.38,0.0,35.6 | |
| 100,hard,-9.827,-7.945,0.0,74.0 | |
| 125,hard,-7.792,16.02,0.2,25.0 | |
| 150,hard,-4.2375,13.16,0.4,28.0 | |
| 175,hard,-6.674,10.925,0.2,35.2 | |
| 200,hard,-12.304,-9.13,0.0,74.6 | |
| 225,hard,-11.08,-8.5,0.0,100.0 | |
| 250,hard,-5.648,14.56,0.2,38.4 | |
| 275,hard,-10.368,-6.63,0.0,76.2 | |
| 300,hard,-4.421,14.16,0.2,72.8 | |
| 325,hard,-11.18,-8.89,0.0,48.2 | |
| 350,hard,-9.845,-7.48,0.0,74.0 | |
| 375,hard,-11.32,-10.4,0.0,26.4 | |
| 400,hard,-12.256,-11.49,0.0,34.0 | |
| 425,hard,-7.024,13.05,0.2,36.4 | |
| 450,hard,-10.726,-8.5,0.0,56.4 | |
| 475,hard,-9.072,-6.7,0.0,88.6 | |
| 500,hard,-12.05,-9.91,0.0,66.6 | |
| 525,hard,-5.528,13.05,0.2,41.6 | |
| 550,hard,-11.274,-8.5,0.0,52.4 | |
| 575,hard,-10.578,-8.5,0.0,58.4 | |
| 600,hard,-12.068,-7.86,0.0,36.6 | |