| step,training/mean_reward,training/mean_global_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward | |
| 500,-0.08366084098815918,-0.08366084432601929,2.5278043789863585,, | |
| 1000,-0.09297764301300049,-0.09297764301300049,2.53712117767334,, | |
| 1500,-0.08641175180673599,-0.08641175746917724,2.530555289745331,, | |
| 2000,-0.0874360054731369,-0.08743599462509155,2.5315795216560364,, | |
| 2500,-0.0405673086643219,-0.04056731128692627,2.484710841178894,, | |
| 3000,-0.021202605217695236,-0.0212026047706604,2.465346137046814,, | |
| 3500,-0.037111878395080566,-0.0371118803024292,2.481255407333374,, | |
| 4000,-0.046849992126226425,-0.046849987983703614,2.490993522167206,, | |
| 4500,-0.0019580242224037647,-0.001958024501800537,2.446101553440094,, | |
| 5000,0.00825823750346899,0.008258237361907958,2.4358853001594545,, | |
| 5000,,,,2.28835297703743,0.1557905673980713 | |
| 5500,-0.00027999942540191114,-0.0002799992561340332,2.4444235401153565,, | |
| 6000,0.004405356477946043,0.004405355930328369,2.439738178730011,, | |
| 6500,0.030355848371982574,0.03035584783554077,2.4137876868247985,, | |
| 7000,0.021564261987805367,0.02156426239013672,2.4225792751312256,, | |
| 7500,0.028914358466863632,0.028914360523223877,2.4152291746139527,, | |
| 8000,0.02819138951599598,0.02819138765335083,2.4159521479606627,, | |
| 8500,0.023626087233424187,0.02362608861923218,2.4205174407958983,, | |
| 9000,0.06576478481292725,0.06576479053497314,2.378378733634949,, | |
| 9500,0.054117247462272644,0.05411725330352783,2.3900262799263,, | |
| 10000,0.05904707312583923,0.059047069549560544,2.3850964593887327,, | |
| 10000,,,,2.239135735034943,0.20500779151916504 | |
| 10500,0.06512696295976639,0.06512696266174317,2.3790165672302246,, | |
| 11000,0.0724114254117012,0.07241142320632935,2.3717321128845215,, | |
| 11500,0.0745772272348404,0.07457722806930542,2.369566306114197,, | |
| 12000,0.06642086803913116,0.06642086744308472,2.3777226538658143,, | |
| 12500,0.06590814143419266,0.06590813875198365,2.37823540019989,, | |
| 13000,0.09832964837551117,0.09832965278625488,2.3458138847351075,, | |
| 13500,0.10290686041116714,0.10290686988830566,2.3412366628646852,, | |
| 14000,0.08539082854986191,0.08539082431793213,2.3587527213096617,, | |
| 14500,0.07266561686992645,0.07266561651229858,2.3714779143333433,, | |
| 15000,0.08612429350614548,0.08612428760528565,2.358019244670868,, | |
| 15000,,,,2.2292354357242585,0.21490809321403503 | |
| 15500,0.10826536267995834,0.10826536083221436,2.335878182411194,, | |
| 16000,0.0939083844423294,0.09390838861465454,2.3502351422309875,, | |
| 16500,0.09960270673036575,0.09960269689559936,2.344540831565857,, | |
| 17000,0.1263253539800644,0.12632535457611083,2.3178181862831115,, | |
| 17500,0.11701292544603348,0.11701291990280151,2.327130614280701,, | |
| 18000,0.11246103048324585,0.11246103191375732,2.331682500362396,, | |
| 18500,0.1060979962348938,0.10609800148010254,2.338045522689819,, | |
| 19000,0.10817639529705048,0.1081763949394226,2.3359671382904055,, | |
| 19500,0.12890228629112244,0.1289022750854492,2.3152412567138674,, | |
| 20000,0.12308061867952347,0.12308062076568603,2.3210629186630247,, | |
| 20000,,,,2.170112668275833,0.274030864238739 | |
| 20500,0.10645964741706848,0.1064596529006958,2.3376838750839233,, | |
| 21000,0.11845333874225616,0.1184533338546753,2.3256902017593384,, | |
| 21500,0.15487515926361084,0.15487514352798462,2.289268393993378,, | |
| 22000,0.13464190065860748,0.13464189291000367,2.3095016331672666,, | |
| 22500,0.14186520874500275,0.1418651933670044,2.3022783303260805,, | |
| 23000,0.12954141199588776,0.12954140520095825,2.3146021370887757,, | |
| 23500,0.12115524709224701,0.12115525341033935,2.3229882917404177,, | |
| 24000,0.15144363045692444,0.1514436273574829,2.292699903011322,, | |
| 24500,0.13261589407920837,0.13261588764190674,2.311527645111084,, | |
| 25000,0.1468086689710617,0.14680867624282837,2.2973348531723023,, | |
| 25000,,,,2.1549171948432924,0.28922632336616516 | |
| 25500,0.15241017937660217,0.15241017961502076,2.2917333550453187,, | |
| 26000,0.13457338511943817,0.13457337522506713,2.3095701665878297,, | |
| 26500,0.1453704982995987,0.14537049198150634,2.298773047924042,, | |
| 27000,0.1668587625026703,0.16685876941680908,2.2772847628593444,, | |
| 27500,0.1698814481496811,0.16988144636154176,2.2742620787620544,, | |
| 28000,0.1558079570531845,0.15580794954299926,2.2883355894088746,, | |
| 28500,0.13617078959941864,0.13617079639434815,2.307972741603851,, | |
| 29000,0.16322462260723114,0.16322461748123168,2.280918914794922,, | |
| 29500,0.17669051885604858,0.17669053888320924,2.26745299243927,, | |
| 30000,0.17846758663654327,0.17846759366989134,2.265675946712494,, | |
| 30000,,,,2.1715856873989106,0.2725578546524048 | |
| 30500,0.16667309403419495,0.1666730899810791,2.277470438480377,, | |
| 31000,0.15678571164608002,0.15678571462631224,2.28735782623291,, | |
| 31500,0.2010551393032074,0.20105513334274291,2.243088393688202,, | |
| 32000,0.17751403152942657,0.17751403713226319,2.266629493713379,, | |
| 32500,0.17216086387634277,0.1721608567237854,2.271982675552368,, | |
| 33000,0.19131796061992645,0.19131796360015868,2.252825571537018,, | |
| 33500,0.18275043368339539,0.18275044250488282,2.2613930921554566,, | |
| 34000,0.20784145593643188,0.20784145212173463,2.2363020701408387,, | |
| 34500,0.18046826124191284,0.18046828508377075,2.26367524766922,, | |
| 35000,0.18855692446231842,0.18855693387985228,2.25558660364151,, | |
| 35000,,,,2.1727890491485597,0.2713544964790344 | |
| 35500,0.1925363689661026,0.19253636932373047,2.2516071653366088,, | |
| 36000,0.16561688482761383,0.1656168942451477,2.278526629924774,, | |
| 36500,0.16554294526576996,0.1655429458618164,2.2786005945205687,, | |
| 37000,0.19604265689849854,0.19604266548156737,2.2481008710861206,, | |
| 37500,0.17421479523181915,0.17421479463577272,2.2699287328720095,, | |
| 38000,0.1756732314825058,0.17567323160171508,2.26847030878067,, | |
| 38500,0.1954001933336258,0.19540018033981324,2.248743362903595,, | |
| 39000,0.17579451203346252,0.17579451847076416,2.2683490142822267,, | |
| 39500,0.1855808049440384,0.18558082294464112,2.258562706947327,, | |
| 40000,0.2053901106119156,0.20539010763168336,2.2387534322738647,, | |
| 40000,,,,2.161219387054443,0.2829241454601288 | |
| 40500,0.20918519794940948,0.20918521451950073,2.2349583129882813,, | |
| 41000,0.19407238066196442,0.19407238340377808,2.2500711522102357,, | |
| 41500,0.2151118963956833,0.21511189603805542,2.229031632900238,, | |
| 42000,0.2062837779521942,0.20628378677368164,2.2378597469329833,, | |
| 42500,0.20741024613380432,0.2074102578163147,2.236733280658722,, | |
| 43000,0.18989317119121552,0.18989318466186522,2.2542503509521485,, | |
| 43500,0.19421561062335968,0.19421561193466186,2.2499279150962828,, | |
| 44000,0.1906915307044983,0.1906915249824524,2.253452006816864,, | |
| 44500,0.20838510990142822,0.2083851203918457,2.235758409500122,, | |
| 45000,0.2230866700410843,0.2230866904258728,2.2210568466186524,, | |
| 45000,,,,2.105118463039398,0.33902508020401 | |
| 45500,0.2155987173318863,0.21559873962402343,2.228544791698456,, | |
| 46000,0.18086951971054077,0.18086951875686647,2.263274023532867,, | |
| 46500,0.20663580298423767,0.2066358060836792,2.2375077238082888,, | |
| 47000,0.2150769680738449,0.2150769772529602,2.22906655216217,, | |
| 47500,0.20921730995178223,0.2092173080444336,2.2349262390136717,, | |
| 48000,0.18769679963588715,0.18769677066802978,2.2564467492103577,, | |
| 48500,0.20955044031143188,0.209550452709198,2.23459308052063,, | |
| 49000,0.19852685928344727,0.19852686166763306,2.2456166667938233,, | |
| 49500,0.20671308040618896,0.20671307468414307,2.2374304571151735,, | |
| 50000,0.18875905871391296,0.1887590742111206,2.2553844656944273,, | |
| 50000,,,,2.1008523547649385,0.34329116344451904 | |
| 50500,0.21066132187843323,0.2106613154411316,2.233482211589813,, | |
| 51000,0.2130340337753296,0.21303403091430664,2.231109505176544,, | |