step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward 500,-0.8826730847358704,-0.8826732580661774,7.311425181865692,, 1000,-0.9284907579421997,-0.9284906779527664,7.357242681503296,, 1500,-0.9413836002349854,-0.9413833718299865,7.3701353573799135,, 2000,-0.8876110911369324,-0.8876111769676208,7.316363128185272,, 2500,-0.8920140862464905,-0.8920139619112015,7.320765913963318,, 3000,-0.8712360858917236,-0.8712356203794479,7.2999875807762145,, 3500,-0.780922532081604,-0.7809225877523422,7.209674529075622,, 4000,-0.8254739046096802,-0.8254740749597549,7.254226001262665,, 4500,-0.8058051466941833,-0.8058052015304565,7.234557147979737,, 5000,-0.8291323781013489,-0.8291328233480454,7.257884776592254,, 5000,,,,6.861614124774933,-0.4328625202178955 5500,-0.8767406940460205,-0.876740443944931,7.305492392539978,, 6000,-0.9004652500152588,-0.9004655361175538,7.329217529296875,, 6500,-0.8630251884460449,-0.863025498509407,7.291777424812317,, 7000,-0.8769917488098145,-0.8769918146133423,7.305743744373322,, 7500,-0.8004758954048157,-0.8004756615161895,7.229227619171143,, 8000,-0.7848508358001709,-0.7848511632680893,7.213603147983551,, 8500,-0.795461893081665,-0.7954619688987732,7.2242139081954955,, 9000,-0.7548400163650513,-0.7548398860692977,7.183591797828674,, 9500,-0.8628402948379517,-0.8628399702310562,7.291591897010803,, 10000,-0.8437224626541138,-0.8437225048542023,7.272474479198456,, 10000,,,,6.9028217768669125,-0.4740701913833618 10500,-0.7787937521934509,-0.778793981552124,7.207545894622803,, 11000,-0.7654660940170288,-0.7654660601615906,7.194218005657196,, 11500,-0.7723984122276306,-0.7723980704545975,7.201150014400482,, 12000,-0.8093675971031189,-0.8093676044940948,7.238119514942169,, 12500,-0.7434836626052856,-0.7434836536645889,7.172235576629639,, 13000,-0.7665942907333374,-0.7665944067239762,7.195346395492554,, 13500,-0.7432683110237122,-0.7432683602571487,7.1720202641487125,, 14000,-0.7712634205818176,-0.7712638155221939,7.200015776157379,, 14500,-0.7248842120170593,-0.724884193778038,7.153636140346527,, 15000,-0.7476820945739746,-0.7476818935871125,7.176433812141418,, 15000,,,,6.852291383743286,-0.4235397279262543 15500,-0.7236352562904358,-0.7236351323127747,7.152387015342712,, 16000,-0.7481348514556885,-0.7481345603466034,7.17688654756546,, 16500,-0.7173243761062622,-0.7173243901729583,7.146076310157776,, 17000,-0.7788547873497009,-0.7788549395799637,7.207606853485108,, 17500,-0.7863595485687256,-0.7863600237369537,7.215111975669861,, 18000,-0.7383527159690857,-0.7383525381088257,7.167104551792145,, 18500,-0.728952169418335,-0.7289518727064133,7.157703801631928,, 19000,-0.7425087690353394,-0.742508964061737,7.171260910511017,, 19500,-0.8011206388473511,-0.8011208035945893,7.229872732162476,, 20000,-0.7472761869430542,-0.7472763383388519,7.176028297424317,, 20000,,,,6.839366140365601,-0.4106145203113556 20500,-0.7046987414360046,-0.7046986881494522,7.133450669765472,, 21000,-0.8178074359893799,-0.8178075740337372,7.246559473514557,, 21500,-0.7686999440193176,-0.7687001008987426,7.19745206785202,, 22000,-0.7661362290382385,-0.7661362112760544,7.194888129711151,, 22500,-0.7793014645576477,-0.7793010162115097,7.208052957057953,, 23000,-0.7992753386497498,-0.7992751265764236,7.228027068138123,, 23500,-0.7859545946121216,-0.7859546879529953,7.214706622600556,, 24000,-0.7832127213478088,-0.7832125641107559,7.211964526176453,, 24500,-0.6932947039604187,-0.6932941027879715,7.122046052455902,, 25000,-0.7835465669631958,-0.7835461578369141,7.212298062801361,, 25000,,,,6.890855712890625,-0.46210411190986633 25500,-0.777839183807373,-0.7778393992185593,7.206591365337371,, 26000,-0.7468874454498291,-0.7468876587152481,7.175639589309692,, 26500,-0.7492902874946594,-0.7492901644706726,7.178042087554932,, 27000,-0.7073883414268494,-0.7073881895542145,7.1361401119232175,, 27500,-0.7066628932952881,-0.7066625741720199,7.135414509296417,, 28000,-0.7268471121788025,-0.7268472735881806,7.15559920501709,, 28500,-0.7251179218292236,-0.7251179388761521,7.153869863033295,, 29000,-0.702258825302124,-0.7022590751647949,7.131011020183563,, 29500,-0.6992601752281189,-0.6992600899934769,7.1280120530128475,, 30000,-0.6678677201271057,-0.6678676178455353,7.0966195402145384,, 30000,,,,6.7769669151306156,-0.348215252161026 30500,-0.6847480535507202,-0.6847479559183121,7.11349991607666,, 31000,-0.7489768266677856,-0.7489767132997512,7.177728651046753,, 31500,-0.7182478904724121,-0.7182482964992524,7.14700022649765,, 32000,-0.7094802856445312,-0.7094804768562317,7.138232446670532,, 32500,-0.7382886409759521,-0.7382885050773621,7.1670404448509215,, 33000,-0.721687912940979,-0.7216876924037934,7.150439610481262,, 33500,-0.7175383567810059,-0.7175384365320205,7.146290393352508,, 34000,-0.6790506839752197,-0.6790505423545837,7.1078025002479555,, 34500,-0.7429975271224976,-0.742997468829155,7.171749427318573,, 35000,-0.6631206274032593,-0.6631209506988526,7.091872889518738,, 35000,,,,6.712763073444367,-0.2840113341808319 35500,-0.684292733669281,-0.6842925347089768,7.113044474601746,, 36000,-0.6424563527107239,-0.6424564929008484,7.0712084398269655,, 36500,-0.6602780222892761,-0.6602781997919083,7.089030111789703,, 37000,-0.7141735553741455,-0.7141733988523483,7.1429253334999085,, 37500,-0.6882449388504028,-0.6882449839115142,7.116996971130371,, 38000,-0.6786583662033081,-0.6786587404012681,7.107410663604736,, 38500,-0.6644042730331421,-0.6644042220115661,7.093156174182892,, 39000,-0.6893898844718933,-0.6893900538682938,7.11814199924469,, 39500,-0.5794962644577026,-0.5794962276220321,7.008248146533966,, 40000,-0.6019691824913025,-0.601969076871872,7.030721040248871,, 40000,,,,6.652243111133576,-0.22349125146865845 40500,-0.6204452514648438,-0.6204452128410339,7.049197129249572,, 41000,-0.617691695690155,-0.6176921542882919,7.046444096565247,, 41500,-0.6357026100158691,-0.6357026252746582,7.0644545378684995,, 42000,-0.647706151008606,-0.6477065340280533,7.0764584879875185,, 42500,-0.6417402029037476,-0.6417399222850799,7.07049191904068,, 43000,-0.6547427773475647,-0.65474296438694,7.083494876384735,, 43500,-0.5488666296005249,-0.548866616487503,6.977618634223938,, 44000,-0.614368736743927,-0.6143688627481461,7.043120757102966,, 44500,-0.5749431252479553,-0.5749431991577149,7.003695136547089,, 45000,-0.6003791093826294,-0.6003791679143906,7.029131123065948,, 45000,,,,6.637366664409638,-0.20861470699310303 45500,-0.5592147707939148,-0.5592146394252777,6.98796658039093,, 46000,-0.6086897850036621,-0.6086898032426834,7.037441752433777,, 46500,-0.6404269337654114,-0.6404269716739655,7.069178932666778,, 47000,-0.5092765092849731,-0.5092767432928086,6.9380287199020385,, 47500,-0.5683140158653259,-0.5683140224218368,6.997065979480744,, 48000,-0.5337614417076111,-0.533761144042015,6.962513059139252,, 48500,-0.5660397410392761,-0.5660399318933487,6.994791905879975,, 49000,-0.5313796997070312,-0.5313794008493423,6.9601313309669495,, 49500,-0.5021033883094788,-0.5021037582159043,6.930855696201324,, 50000,-0.49182212352752686,-0.49182199692726136,6.92057394361496,, 50000,,,,6.593718408346176,-0.16496641933918 50500,-0.48866650462150574,-0.4886664980649948,6.917418461799621,, 51000,-0.49768272042274475,-0.4976825814247131,6.926434514522552,,