step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward 500,-1.0333396196365356,-1.0333393983840942,8.27593122625351,, 1000,-1.1147913932800293,-1.114791325211525,8.357383209705352,, 1500,-1.3842886686325073,-1.3842888238430022,8.626880667209626,, 2000,-1.510918378829956,-1.5109185495376587,8.753510362625121,, 2500,-1.3396002054214478,-1.3396003789901734,8.582192204475403,, 3000,-1.5393997430801392,-1.539399187207222,8.781991057157516,, 3500,-1.2377198934555054,-1.2377199754714965,8.48031182050705,, 4000,-1.6279903650283813,-1.6279903903007507,8.870582232952119,, 4500,-1.2016804218292236,-1.201680270433426,8.444272145748139,, 5000,-1.2525445222854614,-1.2525446290969848,8.495136489391326,, 5000,,,,8.469941500425339,-1.2273502349853516 5500,-1.0881956815719604,-1.0881956911087036,8.330787517070771,, 6000,-1.2716963291168213,-1.2716965979337693,8.514288442134857,, 6500,-1.548081874847412,-1.548082523226738,8.790674429416656,, 7000,-1.3961704969406128,-1.3961704987287522,8.63876235628128,, 7500,-1.2453620433807373,-1.2453617267608643,8.487953588485718,, 8000,-1.272199273109436,-1.2721994853019714,8.514791397571564,, 8500,-1.2269935607910156,-1.2269939534664154,8.469585789680481,, 9000,-1.2251864671707153,-1.2251866664886475,8.467778541564941,, 9500,-1.0945039987564087,-1.094503772854805,8.337095606327058,, 10000,-1.136132001876831,-1.1361322355270387,8.378724110126495,, 10000,,,,8.156898256540298,-0.9143070578575134 10500,-1.2261931896209717,-1.2261939319372177,8.468785812377929,, 11000,-1.1737016439437866,-1.1737016307115555,8.416293475151061,, 11500,-1.2375633716583252,-1.2375632519721984,8.480155145168304,, 12000,-1.1694486141204834,-1.1694486948251723,8.412040555477143,, 12500,-1.1194995641708374,-1.1194994893074035,8.362091318130494,, 13000,-1.0721402168273926,-1.0721402674913407,8.314732061862946,, 13500,-1.0604079961776733,-1.060407979130745,8.30299983048439,, 14000,-1.0712811946868896,-1.0712814021110535,8.313873225688935,, 14500,-1.1024411916732788,-1.1024406924247743,8.34503256368637,, 15000,-1.102455735206604,-1.1024556616544723,8.345047529220581,, 15000,,,,7.915521247386932,-0.6729300618171692 15500,-1.0382559299468994,-1.0382560498714446,8.280847877502442,, 16000,-1.011733055114746,-1.0117327505350113,8.254324578762054,, 16500,-0.9720138311386108,-0.9720139161348343,8.214605789661407,, 17000,-0.953220784664154,-0.9532204986810684,8.195812367916107,, 17500,-0.9294365048408508,-0.9294367592334747,8.172028653621673,, 18000,-1.0571727752685547,-1.0571724177598953,8.299764328479768,, 18500,-1.0814855098724365,-1.0814852863550186,8.324077178955077,, 19000,-0.9929147362709045,-0.9929148820638657,8.235506742954254,, 19500,-1.0142344236373901,-1.0142343562841416,8.256826230049134,, 20000,-0.9489594101905823,-0.9489594011306762,8.191551280021667,, 20000,,,,8.191939379572869,-0.9493479132652283 20500,-0.9560054540634155,-0.9560053623914718,8.198597234249116,, 21000,-0.9867598414421082,-0.9867599339485168,8.229351812839509,, 21500,-0.9448781609535217,-0.9448782132863999,8.18747004365921,, 22000,-1.0801842212677002,-1.0801836135387421,8.32277545452118,, 22500,-1.087973713874817,-1.0879735567569733,8.330565376281738,, 23000,-1.083853840827942,-1.0838538007736207,8.326445681214333,, 23500,-1.05361807346344,-1.05361832344532,8.29621017408371,, 24000,-1.1522955894470215,-1.1522958492040634,8.394887712955475,, 24500,-1.0659173727035522,-1.0659167734384536,8.30850860619545,, 25000,-0.9780071377754211,-0.9780068607330322,8.220598705768586,, 25000,,,,8.289103412628174,-1.0465120077133179 25500,-0.9732199907302856,-0.9732204055786133,8.215812181472778,, 26000,-0.9292873740196228,-0.9292878185510636,8.171879682540894,, 26500,-1.0054179430007935,-1.0054180960655212,8.24800999879837,, 27000,-1.0687543153762817,-1.0687541034221648,8.311345941543578,, 27500,-1.2876758575439453,-1.2876755746603012,8.530267407417297,, 28000,-0.9462146162986755,-0.9462148092985153,8.188806668281556,, 28500,-1.0014841556549072,-1.001484165072441,8.244075979709626,, 29000,-1.0888694524765015,-1.0888699032068252,8.331461735486984,, 29500,-1.0750365257263184,-1.0750363266468048,8.317628167629241,, 30000,-1.0585095882415771,-1.0585093554258347,8.301101179361343,, 30000,,,,8.179764051437378,-0.9371725916862488 30500,-1.0126644372940063,-1.012663877248764,8.255255708813667,, 31000,-0.9699079394340515,-0.9699079889059067,8.21249983024597,, 31500,-0.9691269397735596,-0.9691276327371597,8.211719492197037,, 32000,-1.0364586114883423,-1.0364589270353317,8.279050760507584,, 32500,-0.9513350129127502,-0.9513349124193191,8.193926766395569,, 33000,-0.9922336339950562,-0.9922331893444061,8.234825077295303,, 33500,-0.9909980893135071,-0.9909984081983566,8.233590279340744,, 34000,-0.9443930387496948,-0.9443930275440217,8.186984880328179,, 34500,-0.9778696298599243,-0.9778697415590286,8.220461508750915,, 35000,-0.965343713760376,-0.965343610048294,8.20793542122841,, 35000,,,,8.341607853770256,-1.099016547203064 35500,-1.1027952432632446,-1.1027950239181519,8.345386881232262,, 36000,-1.001489281654358,-1.0014897187948226,8.244081593036652,, 36500,-1.0018385648727417,-1.0018385891914368,8.244430401086808,, 37000,-0.9757014513015747,-0.9757015175819397,8.218293369293212,, 37500,-1.0115289688110352,-1.0115288578271866,8.25412075662613,, 38000,-0.9523683190345764,-0.9523681931495667,8.194960072755814,, 38500,-1.0045222043991089,-1.0045221866369247,8.247114100694656,, 39000,-0.9730554223060608,-0.9730555921792984,8.215647486686706,, 39500,-0.9448816776275635,-0.9448815714120865,8.187473417639733,, 40000,-0.9437248110771179,-0.9437247395515442,8.186316621303558,, 40000,,,,8.114778230190277,-0.8721867203712463 40500,-0.9231025576591492,-0.9231023691892624,8.165694209814072,, 41000,-0.9852995872497559,-0.9853001909255982,8.227892057418824,, 41500,-0.9821887612342834,-0.9821888897418976,8.224780777215958,, 42000,-0.9859462976455688,-0.9859464155435562,8.2285383374691,, 42500,-0.8936163783073425,-0.8936165065765381,8.136208342075347,, 43000,-0.8970760107040405,-0.8970760304927826,8.139667902946472,, 43500,-1.0576006174087524,-1.0576005789041518,8.30019246697426,, 44000,-0.863156795501709,-0.8631569511890411,8.10574879181385,, 44500,-1.0010710954666138,-1.0010713574886323,8.243663263082505,, 45000,-0.8999436497688293,-0.8999437763690948,8.14253559923172,, 45000,,,,8.056672455072404,-0.8140811920166016 45500,-0.9060203433036804,-0.906020339012146,8.148612174510955,, 46000,-0.9517828822135925,-0.951782767534256,8.194374623775483,, 46500,-0.9139706492424011,-0.9139708330631257,8.156562676906585,, 47000,-0.9804315567016602,-0.9804319001436234,8.223023738384247,, 47500,-1.0324673652648926,-1.0324676105976105,8.27505951666832,, 48000,-0.9349365830421448,-0.9349361239671707,8.17752802991867,, 48500,-0.8992148041725159,-0.8992151494026184,8.141807067394257,, 49000,-0.905844509601593,-0.9058441953659058,8.148436007022857,, 49500,-0.8817610144615173,-0.881761567234993,8.12435345029831,, 50000,-0.9140812754631042,-0.9140814354419708,8.156673292160034,, 50000,,,,8.088772453069687,-0.8461809158325195