O2O / O2O-w-diff-ckpts /cube-double-play-singletask-task2-v0 /cgql /20260319_025622 /online_agent.csv
| actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step | |
| 0.19293259,9.907138,-74.0735,-178.20798,-203.8773,0.27082652,-0.26219606,27.070246,405000 | |
| 0.19252014,9.638598,-57.242535,-175.60722,-203.24329,0.41252255,-0.49855983,34.890682,410000 | |
| 0.20554096,11.74811,-62.49969,-174.58122,-203.46066,0.49164373,-0.28710222,43.582127,415000 | |
| 0.17371646,14.421924,-20.110317,-172.06017,-203.47697,0.89386326,-0.9173048,45.49243,420000 | |
| 0.1958869,12.954251,-59.921646,-171.55022,-204.24956,0.59302336,-0.5973606,39.640522,425000 | |
| 0.19575818,18.936941,-58.794445,-169.29556,-203.68477,0.68581223,-0.88400507,62.530678,430000 | |
| 0.17206165,15.868039,-50.378666,-169.04457,-203.97404,0.456027,-0.44273034,48.150448,435000 | |
| 0.20763367,15.439578,-72.88623,-169.17943,-203.99547,0.8940073,-0.97359496,50.40006,440000 | |
| 0.18131524,25.538229,-63.412403,-166.17267,-204.5714,0.84280807,-0.84719586,74.05749,445000 | |
| 0.17276832,12.441505,-36.185875,-166.53954,-204.28021,0.48796815,-0.55815744,43.229794,450000 | |
| 0.1993267,16.480461,-40.467537,-162.4067,-205.18204,0.656417,-0.7875398,54.60441,455000 | |
| 0.21130565,22.393791,-36.518944,-162.18896,-204.71373,2.382406,-1.4235771,100.16359,460000 | |
| 0.16679285,16.004402,-5.0363894,-163.29659,-204.79256,0.69221336,-0.6724038,51.240562,465000 | |
| 0.1960522,20.769262,-29.53372,-159.29356,-205.06558,1.7088376,-2.041242,65.58013,470000 | |
| 0.18666272,20.510843,-35.41735,-162.73067,-204.70349,0.7100032,-0.73709196,46.69983,475000 | |
| 0.19064161,18.947702,-31.9594,-161.57315,-204.83699,0.4182699,-0.4525539,42.012787,480000 | |
| 0.15446293,23.859823,-10.923028,-160.27985,-205.35754,0.51965487,-0.6998644,55.18577,485000 | |
| 0.17482302,12.360118,-39.36152,-157.81946,-204.6407,0.5389005,-0.49406314,51.441055,490000 | |
| 0.16928247,20.89065,-18.037003,-158.06375,-204.87259,2.1647575,-1.9986082,69.81792,495000 | |
| 0.17078784,14.836273,-9.993163,-152.81229,-203.91219,0.49231347,-0.45242867,46.63926,500000 | |
| 0.19711101,16.342169,-10.956029,-158.39258,-205.2117,3.7709248,-3.2315712,106.97551,505000 | |
| 0.21946144,19.19161,-25.853498,-154.93768,-204.44365,0.4664794,-0.39329302,51.22842,510000 | |
| 0.16704053,14.547241,2.6226995,-152.92876,-205.13116,0.67802083,-0.7490184,62.786533,515000 | |
| 0.17351793,15.682803,-33.78694,-155.42123,-204.28905,1.1151779,-0.67184895,66.66462,520000 | |
| 0.18784773,10.997588,-18.614166,-158.8505,-204.97269,1.436185,-1.2703203,54.63379,525000 | |
| 0.18222764,25.998835,-41.30745,-154.05774,-204.7526,0.90882707,-0.64261436,74.19459,530000 | |
| 0.21863249,14.600888,4.2591925,-155.28772,-205.2016,0.97793674,-0.8745813,46.514977,535000 | |
| 0.15595499,17.312307,-38.975864,-150.47148,-204.37373,0.8721997,-0.68742836,58.19931,540000 | |
| 0.18812896,16.373362,-19.037266,-151.9305,-204.6167,0.56239706,-0.5277464,52.208534,545000 | |
| 0.15866953,20.452711,-6.5908356,-152.19441,-204.17604,1.2207245,-1.0799012,69.69728,550000 | |
| 0.18622011,13.164943,-12.811255,-151.35664,-204.66016,0.6174537,-0.5673161,45.914654,555000 | |
| 0.17418909,15.5453205,-5.1047964,-152.00331,-204.51996,0.49791086,-0.48994464,46.888313,560000 | |
| 0.19339675,16.6531,-3.0377188,-150.64595,-204.46849,0.56662333,-0.35273987,54.086983,565000 | |
| 0.16918263,17.64688,-5.2001452,-147.93697,-204.78783,1.4198532,-1.6399136,69.26174,570000 | |
| 0.19822663,18.992231,-8.790484,-148.88528,-204.67017,2.0179608,-2.1714215,86.28459,575000 | |
| 0.16991523,14.8966675,4.429649,-146.86601,-205.36182,0.81496495,-0.9094021,55.66288,580000 | |
| 0.17325288,22.838043,-11.6778755,-147.01736,-205.01004,1.224624,-1.308386,68.4201,585000 | |
| 0.17559305,9.511724,-7.289504,-147.94647,-205.29025,0.78312635,-0.8768856,44.076157,590000 | |
| 0.17136541,20.212605,-6.5611954,-144.79434,-204.6001,1.9659323,-2.0295773,114.19423,595000 | |
| 0.17628911,14.35776,-18.907938,-147.30101,-205.75365,2.135537,-2.1391914,60.046616,600000 | |
| 0.1663078,16.679417,-6.660442,-146.32591,-204.12038,0.46412918,-0.5812357,49.62188,605000 | |
| 0.16945626,23.171133,-1.2821019,-144.82242,-204.90227,0.8727199,-0.71145064,65.23656,610000 | |
| 0.17034204,15.489438,-21.823488,-144.60747,-203.89963,0.87197083,-0.49242958,58.281982,615000 | |
| 0.1719214,19.50131,-3.1586926,-143.53253,-204.04523,1.9467174,-1.8246776,83.95213,620000 | |
| 0.17436436,19.157572,-1.5850618,-143.75789,-204.39586,0.83962774,-0.86807376,57.182068,625000 | |
| 0.16918018,14.808692,-10.105747,-145.37224,-205.80898,3.2728443,-3.340615,122.6727,630000 | |
| 0.16740867,11.3792925,-6.4171443,-141.35165,-204.52623,1.3755051,-0.79011804,49.86248,635000 | |
| 0.17588545,20.321253,1.430678,-144.01997,-205.4923,1.3672165,-1.2537154,97.21958,640000 | |
| 0.16854571,20.81011,-19.072357,-145.9329,-205.71481,0.79575074,-0.5831123,55.956375,645000 | |
| 0.18725613,17.697933,-2.1800537,-133.26189,-203.31914,1.3757839,-2.0324385,68.679855,650000 | |
| 0.21334401,13.9415,-13.267659,-143.55193,-204.52557,0.60138696,-0.6552927,50.402977,655000 | |
| 0.20314884,9.548378,3.0539074,-139.06445,-204.52995,1.4295458,-1.6076766,51.841385,660000 | |
| 0.18064025,15.037326,-4.71352,-140.88477,-205.89049,0.52962244,-0.6050901,47.470074,665000 | |
| 0.17142916,16.047596,-7.914524,-139.21954,-202.97957,0.4989584,-0.48337996,50.62982,670000 | |
| 0.19343856,22.101835,-4.5833383,-136.25,-203.73117,1.2235782,-1.0579181,68.34454,675000 | |
| 0.1706172,19.804005,-3.5941882,-143.1663,-205.18237,0.616959,-0.7980766,60.035973,680000 | |
| 0.1633843,21.686438,-13.734951,-139.12407,-204.6777,1.7934768,-1.6987383,68.356514,685000 | |
| 0.16015238,15.357272,-4.314893,-132.63086,-203.37535,0.8425819,-0.92384535,44.092476,690000 | |
| 0.19938184,16.732353,8.58818,-138.43694,-205.13054,1.3713561,-1.9309661,74.62749,695000 | |
| 0.18279672,25.81871,-1.4155142,-139.90923,-204.82791,0.89736706,-0.8994338,56.350883,700000 | |
| 0.17433919,13.348009,-9.22397,-141.7094,-203.16736,0.3977709,-0.44729197,39.008247,705000 | |
| 0.16026244,26.300962,-0.6335507,-139.96556,-204.52307,1.811204,-1.5967016,84.954834,710000 | |
| 0.16449033,11.701115,-4.5715756,-136.98831,-202.77066,0.5653049,-0.53272223,49.997265,715000 | |
| 0.17663036,17.929468,-13.482591,-141.75749,-203.18549,1.3467919,-1.1591913,65.905075,720000 | |
| 0.15266798,23.183687,3.1867335,-139.35347,-205.27402,2.1130538,-1.9819491,97.987686,725000 | |
| 0.1750554,18.326187,6.1166763,-131.57074,-203.9454,1.8824185,-1.7720845,79.04568,730000 | |
| 0.17252986,12.730021,-6.1082807,-135.12572,-202.03848,2.889623,-2.970697,96.28128,735000 | |
| 0.14697355,19.242853,-1.5264671,-140.40482,-203.95584,0.4605461,-0.5311394,54.13983,740000 | |
| 0.15494375,16.185846,-10.441478,-145.79843,-203.6855,1.1018966,-0.5938754,56.032677,745000 | |
| 0.14186402,32.378067,-0.089910924,-131.56226,-204.52187,1.1317657,-1.177924,75.04559,750000 | |
| 0.15644208,24.427618,5.4601364,-137.68132,-204.2294,2.343495,-2.5582685,103.207825,755000 | |
| 0.18955284,15.217832,-5.1676865,-134.8067,-204.76367,0.55554676,-0.50452673,48.979267,760000 | |
| 0.1724625,13.812314,-2.1416762,-136.03856,-205.02829,2.900649,-1.1422842,48.947002,765000 | |
| 0.16658014,37.53969,-6.6092186,-134.59329,-203.86382,1.9945168,-2.1232975,127.30568,770000 | |
| 0.14958218,10.821944,1.610851,-134.09033,-202.40506,1.2072473,-1.4046524,61.481064,775000 | |
| 0.16974105,9.353984,-2.6296737,-131.6196,-203.30466,1.2483314,-1.4186112,42.88317,780000 | |
| 0.17055674,17.738012,-2.6905048,-135.70052,-203.40181,1.164408,-0.8372356,56.235497,785000 | |
| 0.16643706,18.06003,-9.344151,-135.96902,-202.6974,2.6085458,-2.8149629,70.84895,790000 | |
| 0.16638562,13.007161,-0.5990053,-136.1955,-201.64857,0.722011,-0.71479243,49.796776,795000 | |
| 0.1606169,19.017263,-6.6281633,-133.0914,-201.1314,0.916941,-0.93489134,56.036446,800000 | |
| 0.1752409,21.168604,-2.8410606,-130.19437,-202.96222,1.6227998,-0.943426,74.218124,805000 | |
| 0.17488131,11.916689,-0.7370927,-134.52916,-203.29138,0.5310685,-0.33956054,38.30432,810000 | |
| 0.17355138,20.260817,3.080631,-132.43623,-201.2804,0.82462984,-0.85641617,64.31917,815000 | |
| 0.16411966,14.513242,-1.0432426,-133.6368,-202.96149,0.7375835,-0.70085543,56.000042,820000 | |
| 0.1660452,12.655291,-6.6960645,-130.97777,-203.62253,1.4451756,-1.5458368,70.37068,825000 | |
| 0.16355984,17.632772,-1.0395985,-128.47105,-202.45274,0.6778488,-0.6229586,49.752945,830000 | |
| 0.16824391,14.740946,1.7965952,-132.25833,-203.85695,0.8817871,-0.5714984,57.287445,835000 | |
| 0.17169434,13.117505,-1.8408611,-127.76574,-205.39325,1.1666328,-1.2198491,65.95709,840000 | |
| 0.16892287,17.05759,-4.4677043,-135.24397,-201.42186,1.0107427,-1.094845,59.51326,845000 | |
| 0.1559192,18.347502,-2.7841,-128.25777,-203.57318,0.8817252,-0.9112874,59.69355,850000 | |
| 0.16591625,11.650714,-1.1615924,-132.2469,-203.72038,3.9414022,-3.8372233,70.93629,855000 | |
| 0.16168834,18.340637,4.628006,-127.70559,-204.16656,1.277314,-1.99956,68.8993,860000 | |
| 0.16285703,14.823981,-2.66449,-131.66576,-201.87245,1.4574983,-1.3563424,71.17433,865000 | |
| 0.14589459,15.98289,0.7675755,-128.47552,-203.9888,0.9557838,-0.77733654,51.66819,870000 | |
| 0.1336284,14.108667,-0.0017611384,-128.3092,-204.31096,1.4799277,-1.3435984,58.96028,875000 | |
| 0.16377008,16.541498,0.2952922,-131.45325,-201.5279,2.9330997,-1.6812704,75.31865,880000 | |
| 0.13891079,11.135706,-6.719701,-128.66544,-204.07614,0.88614154,-0.5416446,44.22813,885000 | |
| 0.16349909,13.32052,1.5242815,-126.63092,-204.3244,1.0639943,-0.97872585,52.924534,890000 | |
| 0.13250843,27.082556,2.6995773,-123.02853,-204.17343,1.1122307,-1.2438087,69.16248,895000 | |
| 0.16681495,31.247644,-2.9708772,-124.07717,-205.4447,1.4168751,-1.3390603,79.82948,900000 | |