episode,difficulty,reward_mean,reward_max,success_rate,steps_mean 25,hard,-10.124,-8.4,0.0,58.0 50,hard,-11.184,-9.0,0.0,58.4 75,hard,-11.468,-9.38,0.0,35.6 100,hard,-9.827,-7.945,0.0,74.0 125,hard,-7.792,16.02,0.2,25.0 150,hard,-4.2375,13.16,0.4,28.0 175,hard,-6.674,10.925,0.2,35.2 200,hard,-12.304,-9.13,0.0,74.6 225,hard,-11.08,-8.5,0.0,100.0 250,hard,-5.648,14.56,0.2,38.4 275,hard,-10.368,-6.63,0.0,76.2 300,hard,-4.421,14.16,0.2,72.8 325,hard,-11.18,-8.89,0.0,48.2 350,hard,-9.845,-7.48,0.0,74.0 375,hard,-11.32,-10.4,0.0,26.4 400,hard,-12.256,-11.49,0.0,34.0 425,hard,-7.024,13.05,0.2,36.4 450,hard,-10.726,-8.5,0.0,56.4 475,hard,-9.072,-6.7,0.0,88.6 500,hard,-12.05,-9.91,0.0,66.6 525,hard,-5.528,13.05,0.2,41.6 550,hard,-11.274,-8.5,0.0,52.4 575,hard,-10.578,-8.5,0.0,58.4 600,hard,-12.068,-7.86,0.0,36.6