step,training/mean_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward 500,-1.2638757228851318,8.506467935562133,, 1000,-1.2918249368667603,8.534417217254639,, 1500,-1.2429440021514893,8.485536410331726,, 2000,-1.2318264245986938,8.474418429851532,, 2500,-1.204951286315918,8.447543182849884,, 3000,-1.231319546699524,8.473911806106567,, 3500,-1.1939345598220825,8.43652674293518,, 4000,-1.3139466047286987,8.556538533210754,, 4500,-1.269408941268921,8.512001159191131,, 5000,-1.2420543432235718,8.48464625263214,, 5000,,,8.004975762367248,-0.7623839044570923 5500,-1.2467498779296875,8.489342157363891,, 6000,-1.229374885559082,8.471966935157775,, 6500,-1.2253780364990234,8.467969826221466,, 7000,-1.2468763589859009,8.489468628406525,, 7500,-1.2224012613296509,8.464993106365204,, 8000,-1.2332895994186401,8.475881048679351,, 8500,-1.2292163372039795,8.471808386325836,, 9000,-1.2435085773468018,8.48609997367859,, 9500,-1.2183769941329956,8.460968848228454,, 10000,-1.2307666540145874,8.473358258724213,, 10000,,,7.960881587266922,-0.7182897293567657 10500,-1.2136406898498535,8.456233565330505,, 11000,-1.2244008779525757,8.466992930173873,, 11500,-1.233966588973999,8.476557076931,, 12000,-1.1903570890426636,8.432948615074158,, 12500,-1.1589231491088867,8.401514246940613,, 13000,-1.2377092838287354,8.480301039218903,, 13500,-1.1781790256500244,8.420771000385285,, 14000,-1.1713075637817383,8.413900054216384,, 14500,-1.2514299154281616,8.494021889686584,, 15000,-1.1581870317459106,8.400779174804688,, 15000,,,7.956232913732529,-0.7136410558223725 15500,-1.206253170967102,8.448844613552094,, 16000,-1.2153222560882568,8.457913551807403,, 16500,-1.1572656631469727,8.39985796546936,, 17000,-1.162837028503418,8.405428987503052,, 17500,-1.1196784973144531,8.362270884990693,, 18000,-1.1976488828659058,8.440240446090698,, 18500,-1.1802736520767212,8.422865752220154,, 19000,-1.1861079931259155,8.428699759483337,, 19500,-1.175835132598877,8.41842696762085,, 20000,-1.2100130319595337,8.45260515499115,, 20000,,,7.909002994298935,-0.6664111363887787 20500,-1.0803356170654297,8.32292752456665,, 21000,-1.0614991188049316,8.304090758800507,, 21500,-1.1110498905181885,8.353641838073731,, 22000,-1.1087592840194702,8.351351665496827,, 22500,-1.0825586318969727,8.325150571346283,, 23000,-1.1428171396255493,8.385409548282624,, 23500,-1.0502127408981323,8.292804786205291,, 24000,-1.1211448907852173,8.363737188339233,, 24500,-1.0986582040786743,8.341250121593475,, 25000,-1.1315317153930664,8.374123731136322,, 25000,,,7.9271217215061185,-0.6845298635959626 25500,-1.2225385904312134,8.465130236148834,, 26000,-1.2542667388916016,8.49685870552063,, 26500,-1.1935598850250244,8.436151297092438,, 27000,-1.1482439041137695,8.390835689544678,, 27500,-1.0486449003219604,8.291237101078034,, 28000,-1.0865131616592407,8.329105385780334,, 28500,-1.1382107734680176,8.380802344799042,, 29000,-1.143283486366272,8.385874795913697,, 29500,-1.125913143157959,8.368504550933839,, 30000,-1.1172559261322021,8.359847628593444,, 30000,,,7.847749240398407,-0.6051573836803437 30500,-1.0235986709594727,8.266190693378448,, 31000,-1.1044046878814697,8.346997009277343,, 31500,-1.0924290418624878,8.335021157264709,, 32000,-0.9471048712730408,8.189696428775788,, 32500,-0.9405381083488464,8.183129636764527,, 33000,-1.0239322185516357,8.266523794651032,, 33500,-1.0145606994628906,8.25715268421173,, 34000,-1.0216234922409058,8.26421560716629,, 34500,-1.007668375968933,8.250259715557098,, 35000,-1.0353662967681885,8.277958436489104,, 35000,,,7.874070560932159,-0.6314787030220032 35500,-1.0075114965438843,8.250103253364562,, 36000,-0.9544050693511963,8.196997289657594,, 36500,-0.9406864643096924,8.18327812051773,, 37000,-1.033657431602478,8.276249062538147,, 37500,-0.9497969150543213,8.192388789653778,, 38000,-1.0068761110305786,8.249468105793,, 38500,-0.9298377633094788,8.172429467201233,, 39000,-1.035007119178772,8.277599180221557,, 39500,-0.8599153757095337,8.102507478713989,, 40000,-0.9653960466384888,8.207987933158874,, 40000,,,7.793733333349228,-0.5511414742469788 40500,-1.0321928262710571,8.274784571647643,, 41000,-0.9808789491653442,8.223470498085023,, 41500,-0.9243172407150269,8.166909071445465,, 42000,-0.9609916806221008,8.20358335494995,, 42500,-0.9696775078773499,8.21226980304718,, 43000,-0.903010368347168,8.145602182865144,, 43500,-0.9372181296348572,8.179809857845306,, 44000,-0.9655391573905945,8.208130515575409,, 44500,-0.9357297420501709,8.178321737766266,, 45000,-0.9281056523323059,8.170697585105897,, 45000,,,7.64711929321289,-0.4045274353027344 45500,-0.8526376485824585,8.095229726314544,, 46000,-0.8664577603340149,8.109049812316895,, 46500,-0.9083737134933472,8.15096590089798,, 47000,-0.9521086812019348,8.19470103406906,, 47500,-0.9567602872848511,8.199352354049683,, 48000,-0.8979848623275757,8.140576687812805,, 48500,-0.8833582401275635,8.125949962615966,, 49000,-0.9552427530288696,8.197834327220917,, 49500,-0.865196704864502,8.107788438796996,, 50000,-1.066251277923584,8.308843178749084,, 50000,,,7.612463876008987,-0.3698720180988312 50500,-0.8959355354309082,8.138526679992676,, 51000,-0.9262123703956604,8.168804445743561,,