| step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward | |
| 500,-1.270065426826477,-1.2700653417110443,8.512657225131989,, | |
| 1000,-1.2864986658096313,-1.2864983192682267,8.529090170383453,, | |
| 1500,-1.2869242429733276,-1.286924661040306,8.529516491889954,, | |
| 2000,-1.288193702697754,-1.288193546295166,8.530785451412202,, | |
| 2500,-1.2747048139572144,-1.2747046627998353,8.51729649591446,, | |
| 3000,-1.239412546157837,-1.2394124809503555,8.482004292011261,, | |
| 3500,-1.2432786226272583,-1.243278668999672,8.485870545864104,, | |
| 4000,-1.2654087543487549,-1.2654089294672013,8.508000810146331,, | |
| 4500,-1.2173118591308594,-1.2173114240169525,8.45990328502655,, | |
| 5000,-1.2068599462509155,-1.206859837770462,8.449451635837555,, | |
| 5000,,,,7.84308221578598,-0.6004905700683594 | |
| 5500,-1.264957308769226,-1.264957284808159,8.507549148082733,, | |
| 6000,-1.1574242115020752,-1.1574244346618652,8.400016304969787,, | |
| 6500,-1.2240934371948242,-1.2240931686162948,8.466685064315795,, | |
| 7000,-1.2354333400726318,-1.2354329524040222,8.478024799108505,, | |
| 7500,-1.167077660560608,-1.167077220439911,8.409669058799743,, | |
| 8000,-1.2163779735565186,-1.2163783456087112,8.458970185756684,, | |
| 8500,-1.1815603971481323,-1.181560195684433,8.42415205192566,, | |
| 9000,-1.198270559310913,-1.1982703292369843,8.440862208366394,, | |
| 9500,-1.140507698059082,-1.140508132457733,8.38309997177124,, | |
| 10000,-1.148219108581543,-1.1482192741632462,8.390811108112334,, | |
| 10000,,,,7.794463722705841,-0.5518723726272583 | |
| 10500,-1.1983916759490967,-1.1983918534517288,8.440983713626862,, | |
| 11000,-1.1427819728851318,-1.1427819728851318,8.385373857021332,, | |
| 11500,-1.1513265371322632,-1.1513265097141265,8.393918320178985,, | |
| 12000,-1.0919883251190186,-1.0919884765148162,8.334580379486084,, | |
| 12500,-1.1108616590499878,-1.110861811518669,8.35345365333557,, | |
| 13000,-1.125556230545044,-1.1255562281608582,8.36814805650711,, | |
| 13500,-1.057547926902771,-1.0575483101606369,8.300140118598938,, | |
| 14000,-1.085174322128296,-1.0851739600896835,8.327765851020812,, | |
| 14500,-1.0959683656692505,-1.0959689155817032,8.338560762882233,, | |
| 15000,-1.110211968421936,-1.1102120571136476,8.352803963661193,, | |
| 15000,,,,7.793369452953339,-0.5507781505584717 | |
| 15500,-1.0474871397018433,-1.0474869000911713,8.29007874917984,, | |
| 16000,-1.1176717281341553,-1.11767167532444,8.360263526201248,, | |
| 16500,-1.149390459060669,-1.1493904137611388,8.391982279777526,, | |
| 17000,-1.151020884513855,-1.1510206125974656,8.393612429141998,, | |
| 17500,-1.109100580215454,-1.1091008763313293,8.351692714214325,, | |
| 18000,-1.090142846107483,-1.0901431852579118,8.332735067844391,, | |
| 18500,-1.0785597562789917,-1.0785598031282424,8.321151651382447,, | |
| 19000,-1.1184035539627075,-1.1184036073684693,8.360995462417602,, | |
| 19500,-1.0343374013900757,-1.034337504029274,8.276929379463196,, | |
| 20000,-1.1375782489776611,-1.1375781391859054,8.380169957637786,, | |
| 20000,,,,7.842595753669738,-0.6000044345855713 | |
| 20500,-1.0096787214279175,-1.0096789481639863,8.252270806789399,, | |
| 21000,-1.0829722881317139,-1.0829724655151367,8.325564318180085,, | |
| 21500,-0.9490821957588196,-0.9490818880796432,8.191673714160919,, | |
| 22000,-0.957439124584198,-0.9574393122196198,8.200031170368195,, | |
| 22500,-0.9436343312263489,-0.9436345801353455,8.186226438045502,, | |
| 23000,-1.0205410718917847,-1.020541033744812,8.263132899045944,, | |
| 23500,-0.9846765995025635,-0.9846763879060745,8.22726820087433,, | |
| 24000,-1.0036004781723022,-1.0036002452373505,8.246192080974579,, | |
| 24500,-0.9770014882087708,-0.9770018249750138,8.219593661308288,, | |
| 25000,-0.9761715531349182,-0.976171957731247,8.218763832569122,, | |
| 25000,,,,7.6464204704761505,-0.40382900834083557 | |
| 25500,-0.969287633895874,-0.9692881969213486,8.211880033969878,, | |
| 26000,-1.0216294527053833,-1.0216292253732682,8.26422106218338,, | |
| 26500,-0.9931726455688477,-0.9931730550527572,8.235764921665192,, | |
| 27000,-0.956329345703125,-0.9563294883966446,8.19892133808136,, | |
| 27500,-0.9638761878013611,-0.9638758201599121,8.206467646598815,, | |
| 28000,-0.9504192471504211,-0.9504193593263626,8.19301122379303,, | |
| 28500,-0.9230415225028992,-0.9230415585041046,8.165633428573608,, | |
| 29000,-0.8909860253334045,-0.8909856413602829,8.133577525615692,, | |
| 29500,-0.9317854046821594,-0.9317857044935226,8.17437754535675,, | |
| 30000,-0.894836962223053,-0.8948367191553116,8.137428583621979,, | |
| 30000,,,,7.513670065402985,-0.271078497171402 | |
| 30500,-0.8997390270233154,-0.8997387810945511,8.142330650806427,, | |
| 31000,-0.9313161969184875,-0.9313162294626236,8.173908076286317,, | |
| 31500,-0.921440601348877,-0.9214403841495514,8.16403223991394,, | |
| 32000,-0.9456008672714233,-0.9456008784770965,8.188192707538605,, | |
| 32500,-0.8664374947547913,-0.8664374326467514,8.109029299736022,, | |
| 33000,-0.8849108219146729,-0.8849110237360001,8.12750289607048,, | |
| 33500,-0.9271032810211182,-0.9271030998229981,8.169694922447205,, | |
| 34000,-0.87181156873703,-0.8718122116327286,8.114404044628143,, | |
| 34500,-0.8887145519256592,-0.8887146496772766,8.131306488990784,, | |
| 35000,-0.9575279951095581,-0.9575282193422318,8.200120057106018,, | |
| 35000,,,,7.565959758758545,-0.323368102312088 | |
| 35500,-0.8781765103340149,-0.8781765455007553,8.120768403530121,, | |
| 36000,-0.9771652221679688,-0.9771653382778168,8.21975724363327,, | |
| 36500,-0.9594079256057739,-0.9594083290100097,8.202000226259232,, | |
| 37000,-0.8830788135528564,-0.8830787391662598,8.125670560836792,, | |
| 37500,-0.9194141030311584,-0.9194137799739838,8.162005625247955,, | |
| 38000,-0.937061607837677,-0.9370615674257279,8.179653479099274,, | |
| 38500,-1.001966118812561,-1.0019664138555526,8.244558210372924,, | |
| 39000,-0.979603111743927,-0.9796026631593704,8.222194537401199,, | |
| 39500,-0.899408221244812,-0.8994082236289977,8.142000137329102,, | |
| 40000,-0.8799611926078796,-0.8799610028266907,8.122552872180938,, | |
| 40000,,,,7.559117884635925,-0.3165264427661896 | |
| 40500,-0.964604914188385,-0.9646050893068313,8.207196933746339,, | |
| 41000,-0.9258540868759155,-0.9258540937900543,8.168445950508117,, | |
| 41500,-0.9191593527793884,-0.9191593102216721,8.1617512485981,, | |
| 42000,-0.9356387257575989,-0.9356384792327881,8.178230355739593,, | |
| 42500,-0.9559558033943176,-0.9559562244415283,8.198548049926758,, | |
| 43000,-0.930672287940979,-0.9306724803447723,8.173264316558837,, | |
| 43500,-0.9399895071983337,-0.9399897606372833,8.182581650257111,, | |
| 44000,-0.904668927192688,-0.9046686377525329,8.147260546207429,, | |
| 44500,-0.9129497408866882,-0.9129497767686844,8.155541634082795,, | |
| 45000,-0.8489297032356262,-0.8489299325942993,8.09152178621292,, | |
| 45000,,,,7.488188047409057,-0.2455967217683792 | |
| 45500,-0.9351224899291992,-0.9351227858066559,8.17771467590332,, | |
| 46000,-0.9893708825111389,-0.9893711296319961,8.231962990760803,, | |
| 46500,-0.9404740929603577,-0.9404735240936279,8.18306539273262,, | |
| 47000,-0.94874507188797,-0.9487448770999909,8.191336768150329,, | |
| 47500,-0.9764763116836548,-0.976475677371025,8.219067519187927,, | |
| 48000,-0.9990741610527039,-0.9990744426250457,8.241666309833526,, | |
| 48500,-0.9884929060935974,-0.9884930790662766,8.231084918498993,, | |
| 49000,-1.0177738666534424,-1.0177743941545487,8.260366258144378,, | |
| 49500,-0.9281767010688782,-0.9281769477128983,8.17076882839203,, | |
| 50000,-0.9287114143371582,-0.9287113021612168,8.17130313682556,, | |
| 50000,,,,7.41178314447403,-0.16919176280498505 | |
| 50500,-0.9635107517242432,-0.9635106338262558,8.206102511882783,, | |
| 51000,-0.952689528465271,-0.9526894763708115,8.195281312942505,, | |