| step,training/mean_reward,training/mean_nusselt,evaluation/mean_nusselt,evaluation/mean_reward | |
| 500,-1.2648862600326538,8.507478891849518,, | |
| 1000,-1.2338120937347412,8.476403473854065,, | |
| 1500,-1.2463620901107788,8.488954213857651,, | |
| 2000,-1.3571953773498535,8.599787383556366,, | |
| 2500,-1.221134066581726,8.46372664308548,, | |
| 3000,-1.2802939414978027,8.522885219573975,, | |
| 3500,-1.2389633655548096,8.481555224895477,, | |
| 4000,-1.2738490104675293,8.516440599918365,, | |
| 4500,-1.2227914333343506,8.465383412837982,, | |
| 5000,-1.2477883100509644,8.490380630970002,, | |
| 5000,,,7.921645476818084,-0.6790536189079285 | |
| 5500,-1.2848893404006958,8.52748070192337,, | |
| 6000,-1.2552295923233032,8.49782129907608,, | |
| 6500,-1.2832741737365723,8.525866426944733,, | |
| 7000,-1.2559418678283691,8.498534123897553,, | |
| 7500,-1.2371909618377686,8.47978246307373,, | |
| 8000,-1.2011972665786743,8.443789718151093,, | |
| 8500,-1.2420326471328735,8.4846239361763,, | |
| 9000,-1.277016043663025,8.519607528686523,, | |
| 9500,-1.2190701961517334,8.461662427902223,, | |
| 10000,-1.268432855606079,8.51102446269989,, | |
| 10000,,,8.049738378524781,-0.807146520614624 | |
| 10500,-1.2957605123519897,8.538353537559509,, | |
| 11000,-1.1723802089691162,8.414972005844117,, | |
| 11500,-1.2220853567123413,8.464677752017975,, | |
| 12000,-1.2694823741912842,8.512074007034302,, | |
| 12500,-1.2224053144454956,8.464997858524322,, | |
| 13000,-1.2045142650604248,8.447105546951294,, | |
| 13500,-1.2618227005004883,8.504414828777314,, | |
| 14000,-1.2397021055221558,8.482293691158295,, | |
| 14500,-1.134156346321106,8.376747966766358,, | |
| 15000,-1.2440736293792725,8.486665506839753,, | |
| 15000,,,8.149463270902634,-0.9068714141845703 | |
| 15500,-1.2508105039596558,8.493402480125427,, | |
| 16000,-1.2312227487564087,8.473814713001252,, | |
| 16500,-1.1367300748825073,8.379321574687959,, | |
| 17000,-1.1449939012527466,8.38758572626114,, | |
| 17500,-1.1947705745697021,8.43736191558838,, | |
| 18000,-1.1431314945220947,8.385722992897033,, | |
| 18500,-1.198479413986206,8.441071241378785,, | |
| 19000,-1.1451743841171265,8.387767234325409,, | |
| 19500,-1.122506856918335,8.365098190307616,, | |
| 20000,-1.236710548400879,8.479302643299103,, | |
| 20000,,,8.218507186174392,-0.9759153294563293 | |
| 20500,-1.1116316318511963,8.35422279548645,, | |
| 21000,-1.1377480030059814,8.38033922767639,, | |
| 21500,-1.2083076238632202,8.450899731636047,, | |
| 22000,-1.1671226024627686,8.409713720798493,, | |
| 22500,-1.253317952156067,8.495910203933716,, | |
| 23000,-1.1683346033096313,8.410926961898804,, | |
| 23500,-1.0560994148254395,8.29869065618515,, | |
| 24000,-1.1070435047149658,8.349635181903839,, | |
| 24500,-1.1370806694030762,8.37967237520218,, | |
| 25000,-1.1505688428878784,8.393160609722138,, | |
| 25000,,,8.242576564550399,-0.9999847066402435 | |
| 25500,-1.1876877546310425,8.430279606819154,, | |
| 26000,-1.100395679473877,8.342987818717956,, | |
| 26500,-1.0407487154006958,8.283339968681336,, | |
| 27000,-1.1191774606704712,8.361769129276276,, | |
| 27500,-1.1443326473236084,8.386924511909484,, | |
| 28000,-1.2578092813491821,8.500401512145997,, | |
| 28500,-1.1135951280593872,8.35618675327301,, | |
| 29000,-1.1329078674316406,8.37549984741211,, | |
| 29500,-1.0465131998062134,8.28910499572754,, | |
| 30000,-1.2860294580459595,8.52862127685547,, | |
| 30000,,,8.280946964025498,-1.0383551049232482 | |
| 30500,-1.1040349006652832,8.34662652206421,, | |
| 31000,-1.0808707475662231,8.323462380409241,, | |
| 31500,-1.0409836769104004,8.28357599544525,, | |
| 32000,-1.1372066736221313,8.379798205375671,, | |
| 32500,-1.092490315437317,8.335082127571106,, | |
| 33000,-1.199385643005371,8.441977437496185,, | |
| 33500,-0.98192298412323,8.224514891386033,, | |
| 34000,-1.0702688694000244,8.31286094236374,, | |
| 34500,-1.205410361289978,8.448001908302308,, | |
| 35000,-1.1245042085647583,8.367095613479615,, | |
| 35000,,,8.125164510011674,-0.8825726509094238 | |
| 35500,-1.0918993949890137,8.334491700649261,, | |
| 36000,-0.9455532431602478,8.188144985675812,, | |
| 36500,-1.0261520147323608,8.268744242191314,, | |
| 37000,-0.9891917109489441,8.231783352136611,, | |
| 37500,-0.9718740582466125,8.214465849637985,, | |
| 38000,-1.0833275318145752,8.325919157981872,, | |
| 38500,-0.9262539744377136,8.168845703125,, | |
| 39000,-0.9757115840911865,8.218303520202637,, | |
| 39500,-1.0679569244384766,8.310548597335815,, | |
| 40000,-1.0552783012390137,8.297870304107667,, | |
| 40000,,,8.032755798101425,-0.7901639401912689 | |
| 40500,-1.0701168775558472,8.312708149909973,, | |
| 41000,-1.0251420736312866,8.267734111785888,, | |
| 41500,-0.9983317852020264,8.240923062324525,, | |
| 42000,-1.0062366724014282,8.248828182220459,, | |
| 42500,-0.9604449272155762,8.203036922454833,, | |
| 43000,-1.0203297138214111,8.262921420574187,, | |
| 43500,-0.8827806711196899,8.125372834205628,, | |
| 44000,-0.9479599595069885,8.190551757335664,, | |
| 44500,-0.954931378364563,8.1975232796669,, | |
| 45000,-0.959622859954834,8.202214864730834,, | |
| 45000,,,7.657717061042786,-0.4151252019405365 | |
| 45500,-0.8350804448127747,8.077672555446625,, | |
| 46000,-0.9315222501754761,8.17411429309845,, | |
| 46500,-0.8603422045707703,8.102933712482452,, | |
| 47000,-0.9848171472549438,8.227408859729767,, | |
| 47500,-0.8061552047729492,8.048746953964233,, | |
| 48000,-0.858570396900177,8.101162043571472,, | |
| 48500,-0.9205390810966492,8.163131041526794,, | |
| 49000,-0.984183132648468,8.22677476835251,, | |
| 49500,-0.8795024156570435,8.122094462394715,, | |
| 50000,-0.8338159322738647,8.076407314300537,, | |
| 50000,,,7.515316879749298,-0.2727250218391418 | |
| 50500,-0.8908106684684753,8.133402589797974,, | |
| 51000,-0.9163455963134766,8.158937111377716,, | |