O2O / O2O-w-diff-ckpts /cube-double-play-singletask-task2-v0 /fedit /20260319_183100 /online_agent.csv
| actor/actor_loss,actor/bc_flow_loss,actor/edit_alpha_loss,actor/edit_entropy,actor/edit_entropy_loss,actor/edit_q_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step | |
| 141.61969,0.19258413,-0.00993097,-13.268411,0.17148148,141.26556,7.3373637,-59.09031,-144.55821,-193.75255,0.24633366,-0.26610547,21.582312,905000 | |
| 139.74092,0.19259813,-0.024512736,-14.582874,0.17162156,139.40121,8.776267,-33.220547,-142.90625,-194.4352,0.45161015,-0.44464776,32.90198,910000 | |
| 142.31792,0.19875152,0.013047107,-11.455079,0.14303058,141.96309,15.347117,-38.521675,-144.83038,-199.36075,0.38685763,-0.6298474,46.406746,915000 | |
| 138.39503,0.17117743,-0.026096927,-14.513361,0.18812032,138.06183,7.9262695,-41.311634,-141.70518,-199.58778,0.9118448,-0.43266627,46.603073,920000 | |
| 135.26549,0.17551883,-0.0027955805,-12.707928,0.17085762,134.9219,16.889542,-5.7573957,-138.38228,-195.86711,1.3931184,-1.3822786,55.873688,925000 | |
| 131.56729,0.17451811,0.0031238573,-12.281324,0.175443,131.2142,22.006275,-21.583086,-135.17752,-196.63298,0.9894806,-1.1113421,53.981735,930000 | |
| 129.36046,0.1844141,-0.021190494,-13.979967,0.20016824,128.99707,11.694087,-43.788544,-132.52373,-195.47643,0.6094503,-0.69503295,31.089924,935000 | |
| 128.60298,0.21070889,1.0434739e-05,-12.499297,0.18556651,128.2067,14.813468,-2.7529454,-132.61807,-197.00346,0.37749672,-0.7426185,52.95964,940000 | |
| 128.18735,0.18781921,0.016830726,-11.382037,0.1713545,127.81134,11.975702,1.5436603,-131.34703,-195.68056,0.5134276,-0.567719,38.69742,945000 | |
| 126.55793,0.2030484,0.0025709819,-12.328445,0.18475875,126.16755,15.175044,-6.933405,-130.08116,-191.4157,0.6269031,-0.6853138,47.550518,950000 | |
| 124.093956,0.19292842,-0.022473063,-13.985893,0.21152654,123.711975,15.849551,-6.0232034,-128.16673,-185.9628,0.83487,-0.94093066,54.229233,955000 | |
| 122.73003,0.18727958,0.0029839252,-12.30492,0.18821508,122.35155,13.551735,-10.27336,-127.10735,-196.90878,0.57431316,-0.6196297,37.036167,960000 | |
| 122.18241,0.19352406,-0.03067371,-14.472147,0.22509198,121.794464,11.607284,-6.963096,-125.67185,-197.30205,0.40278405,-0.4381484,38.338806,965000 | |
| 120.02532,0.20775019,0.0059183347,-12.112782,0.1851345,119.62652,14.868964,-16.980665,-122.83196,-197.44908,0.42865467,-0.58634,46.125267,970000 | |
| 123.14541,0.17804216,-0.032909423,-14.558504,0.23274761,122.76753,12.277448,-8.445863,-127.295006,-198.32991,0.9439093,-1.0890543,54.21439,975000 | |
| 122.5479,0.18278703,-0.014301239,-13.406964,0.21140435,122.16801,10.883747,-1.1638339,-126.345604,-198.694,0.36329573,-0.45713136,38.241543,980000 | |
| 119.806564,0.19428521,0.0044265846,-12.231398,0.20157424,119.40628,14.739154,-0.19148123,-123.583,-196.90521,0.3737885,-0.44119173,35.51541,985000 | |
| 118.61935,0.19459458,-0.027219146,-14.139819,0.234705,118.21727,11.770915,1.1008751,-122.46415,-189.3974,0.6214256,-0.38097292,45.6493,990000 | |
| 117.39258,0.19162664,-0.009175503,-13.047367,0.21871272,116.99142,14.4426365,-2.1480873,-121.20896,-195.98479,3.1594841,-3.2045572,58.379753,995000 | |
| 113.54681,0.166677,-0.005367411,-12.820147,0.21493593,113.17056,12.558192,0.57468265,-117.5437,-186.78273,1.0920516,-1.0345579,38.016636,1000000 | |
| 117.865234,0.17122164,-0.012023838,-13.210989,0.22341667,117.48262,13.023688,-19.652267,-121.74807,-191.55972,1.0437425,-1.0430858,38.96685,1005000 | |
| 116.14941,0.17389295,0.0053852946,-12.179518,0.20466124,115.76547,15.753237,-4.87586,-119.41138,-184.68031,0.39441618,-0.45422253,36.067463,1010000 | |
| 111.76295,0.19116953,-0.025896901,-14.031785,0.23722632,111.36044,11.998752,1.541508,-115.57173,-186.52281,0.6138116,-1.1073151,49.29777,1015000 | |
| 115.66495,0.20003325,-0.0031822554,-12.684902,0.21831325,115.24978,10.751006,-2.9290266,-119.36627,-184.95937,0.9099096,-0.54577273,42.40446,1020000 | |
| 116.21937,0.2106551,0.002738486,-12.338813,0.20963,115.79634,16.329649,-9.1808195,-120.14026,-189.68098,0.93026555,-0.88630265,53.183857,1025000 | |
| 116.07856,0.18520218,0.008232212,-12.019402,0.20588133,115.679245,16.106228,-7.899224,-120.13784,-191.96642,0.7232965,-0.43728104,52.19351,1030000 | |
| 114.15145,0.18994203,-0.0078253,-12.961494,0.21978073,113.74956,10.177643,1.9281185,-117.69033,-191.11119,0.30536097,-0.3467026,30.149042,1035000 | |
| 111.28879,0.13940096,-0.0014988449,-12.589332,0.21122928,110.93965,18.639402,-0.9517595,-115.439125,-184.91553,0.68954545,-0.6217724,49.70854,1040000 | |
| 112.121284,0.18786594,-0.01585188,-13.434328,0.22792783,111.721344,9.819571,-10.727723,-116.42273,-187.12202,0.5821226,-0.7629648,40.626083,1045000 | |
| 111.71091,0.19195715,0.0015859162,-12.407009,0.21159579,111.30577,15.793185,-9.4143715,-115.60003,-191.2853,0.7616935,-0.74494326,40.953175,1050000 | |
| 109.29442,0.1731207,0.027846301,-10.851504,0.18330304,108.91015,7.353349,-3.4890952,-112.21494,-182.20291,0.42489916,-0.42083243,35.505238,1055000 | |
| 112.265205,0.1881838,0.016633758,-11.508312,0.19303101,111.867355,13.164069,2.7953439,-115.700905,-195.72348,5.1711874,-5.318995,84.78675,1060000 | |
| 108.76309,0.19564117,-0.01315676,-13.271214,0.22640444,108.3542,12.560787,-1.1934476,-113.10972,-194.05486,0.6878179,-0.5885366,49.510338,1065000 | |
| 110.71098,0.20880845,-0.006413507,-12.876396,0.21940404,110.289185,14.525943,-9.0907755,-114.53711,-188.45772,1.2163686,-1.3611465,55.496555,1070000 | |
| 114.3119,0.21130796,0.022934027,-11.118032,0.18450597,113.89314,11.162848,-6.443612,-117.44881,-192.80327,0.43103313,-0.37628263,34.78471,1075000 | |
| 110.544525,0.20077601,0.043183003,-9.976212,0.17069685,110.12987,12.5718775,2.1462414,-113.92885,-186.04509,1.950983,-1.8500983,61.590416,1080000 | |
| 108.25968,0.1971484,0.00014703393,-12.491285,0.21075287,107.85163,11.343254,-0.085083395,-111.94767,-186.78279,0.5710362,-0.6058385,38.481956,1085000 | |
| 107.9309,0.17473257,-0.021492798,-13.790918,0.2296082,107.54805,8.5404005,-0.058659375,-110.97066,-198.65068,0.453669,-0.5356928,36.242977,1090000 | |
| 108.54319,0.17899996,-0.01957745,-13.650678,0.23225048,108.15151,15.477025,-3.7065516,-112.36407,-192.83311,0.6624953,-0.6060214,40.138268,1095000 | |
| 108.368744,0.19409165,0.0058646146,-12.153692,0.20581903,107.96297,16.95133,1.3638431,-112.51099,-192.7592,0.72735727,-0.60998034,52.87022,1100000 | |
| 109.06944,0.20036758,-0.007918434,-12.963327,0.22154796,108.65544,14.904807,-4.974561,-112.46023,-180.1854,0.743469,-0.8399211,61.40695,1105000 | |
| 107.41905,0.17169325,-0.032201663,-14.410147,0.24292934,107.03664,9.486651,-1.6761547,-110.969215,-179.46477,0.6773434,-0.72559893,43.832195,1110000 | |
| 110.08702,0.16424009,-0.014132417,-13.354805,0.22079383,109.71612,11.754081,-3.442561,-113.48728,-196.6056,0.8307816,-0.9734811,50.46785,1115000 | |
| 107.70681,0.20197392,-0.0024715208,-12.644049,0.21694076,107.29037,13.475135,-4.395649,-111.7726,-185.71977,2.680392,-3.1292493,77.995575,1120000 | |
| 103.133316,0.2297269,0.029827869,-10.752357,0.18351561,102.69024,14.317542,-1.3380742,-106.5191,-180.58708,0.68112904,-0.6786066,44.36316,1125000 | |
| 108.88444,0.19341174,0.022153275,-11.19627,0.19024956,108.47862,9.171946,0.8115921,-112.31902,-192.35768,0.37144467,-0.80601174,47.707905,1130000 | |
| 102.12268,0.2139337,0.025671396,-11.003735,0.18879086,101.69428,10.5670805,0.20830482,-104.8447,-181.93143,0.3584389,-0.40331352,37.58462,1135000 | |
| 104.189964,0.22611229,0.018460572,-11.4004345,0.19140154,103.75399,12.346096,4.16169,-108.43561,-195.36137,0.7499246,-0.568407,46.246,1140000 | |
| 106.58514,0.20643264,-0.010048332,-13.094099,0.22146787,106.16728,12.139858,0.30164468,-110.733826,-193.09105,0.8308834,-0.8025858,36.81438,1145000 | |
| 96.87398,0.19809948,0.006632452,-12.103203,0.20230466,96.46695,10.958918,-4.0387726,-100.96025,-185.47061,0.44220248,-0.49000674,39.426823,1150000 | |
| 106.56815,0.21314597,-0.0013512837,-12.579473,0.21389069,106.14247,10.4871435,-2.8046658,-109.90966,-191.84378,6.817766,-5.9447627,79.51681,1155000 | |
| 103.41048,0.20634167,-0.020514153,-13.703768,0.23353441,102.99111,31.524958,1.3643092,-107.160194,-190.07587,2.3890324,-1.234423,96.773964,1160000 | |
| 106.59897,0.23073867,0.011366867,-11.824866,0.19908898,106.157776,14.766126,-8.57108,-110.22626,-199.34927,0.5225861,-1.2400628,51.56891,1165000 | |
| 105.284645,0.17566851,-0.008047047,-12.969277,0.22239383,104.89463,18.313293,-4.9122853,-108.57452,-177.10213,0.57688695,-0.46960482,45.31301,1170000 | |
| 103.05096,0.18667886,-0.0016368761,-12.597902,0.21063048,102.65529,15.223587,-3.3430252,-106.42046,-199.329,0.6403487,-0.6979358,52.300156,1175000 | |
| 104.499405,0.21549477,-0.004249556,-12.748918,0.21765131,104.07051,10.915657,-3.331353,-109.33435,-194.05565,0.3824056,-0.36749092,39.207146,1180000 | |
| 101.397156,0.19259706,-0.008180697,-12.978144,0.22204678,100.99069,10.975504,1.2339664,-104.83889,-180.64186,0.44055054,-0.3980621,37.90198,1185000 | |
| 95.36925,0.19703905,-0.0037280067,-12.721262,0.21433847,94.9616,51.005333,-0.4445668,-98.934135,-186.13557,3.3335786,-4.2500377,170.9803,1190000 | |
| 98.56935,0.18711142,0.007733664,-12.041979,0.20332819,98.17117,16.904692,1.2402647,-101.588646,-193.07924,0.61787516,-0.59082544,53.49773,1195000 | |
| 103.67874,0.19028763,0.023344005,-11.125613,0.18896891,103.27614,22.200554,3.4076116,-107.347046,-182.03569,0.5660233,-1.0376976,53.903793,1200000 | |
| 103.933136,0.17044678,-0.00051333394,-12.530425,0.21141422,103.55179,12.711533,-2.6491706,-107.64773,-190.29169,0.6784953,-0.6411771,47.83795,1205000 | |
| 100.639694,0.18690425,-0.026815603,-14.092665,0.23727736,100.24233,13.585082,-3.203769,-105.07918,-194.70345,0.66606873,-0.65783185,46.015533,1210000 | |
| 100.84502,0.20630981,-0.0070264684,-12.913357,0.21950841,100.42623,10.524269,0.5407165,-104.39109,-181.03821,1.458246,-1.1707357,55.57542,1215000 | |
| 102.10247,0.23687224,0.004169019,-12.254404,0.2080199,101.65341,10.375569,-1.5775055,-106.36519,-178.23694,1.9232184,-1.9645299,58.25455,1220000 | |
| 102.91433,0.21531782,-0.032308552,-14.39205,0.24575795,102.485565,13.179969,-1.5717931,-106.69787,-195.2461,0.79809225,-0.74699473,47.45358,1225000 | |
| 94.72009,0.22018605,-0.013116058,-13.2766695,0.22421065,94.28881,13.102672,3.5060275,-98.692276,-178.60501,1.1725878,-1.5328181,82.539925,1230000 | |
| 98.07797,0.22513483,0.0019502856,-12.384337,0.20882292,97.64206,13.959659,0.7124543,-100.85699,-197.10596,1.4622531,-1.023442,87.219315,1235000 | |
| 100.85012,0.21740633,0.013056953,-11.716026,0.19512849,100.42453,13.398956,2.5335472,-103.995804,-180.19795,0.72162855,-0.7952225,52.006264,1240000 | |
| 104.97859,0.2132583,-0.019814866,-13.683392,0.22911653,104.55603,14.923515,0.030684054,-109.13015,-184.36917,0.90350455,-0.9805209,61.29356,1245000 | |
| 95.82923,0.19867676,0.024877485,-11.004076,0.18299979,95.422676,15.17808,-1.6048858,-98.95475,-198.71338,0.8236536,-0.6913687,35.137222,1250000 | |
| 102.38322,0.21533543,0.0551091,-9.185251,0.15270868,101.96007,16.708109,-0.4454923,-105.59377,-185.21637,0.9970907,-1.0170213,59.32346,1255000 | |
| 93.75277,0.20047635,-0.013084522,-13.292053,0.21958143,93.345795,19.022001,-1.3435478,-97.56109,-195.60606,0.9488644,-0.5270957,56.41106,1260000 | |
| 99.91854,0.18982303,-0.020797616,-13.757973,0.22745568,99.522064,15.926501,-6.310375,-104.523026,-196.67311,0.887117,-0.7172049,62.770515,1265000 | |
| 98.86351,0.18549117,0.017032018,-11.465839,0.18883564,98.47215,10.160089,-3.4702644,-102.34133,-192.46498,0.79845667,-0.71333927,54.288822,1270000 | |
| 96.15823,0.24078327,-0.028829217,-14.237717,0.2362078,95.710075,12.281309,0.7427926,-100.27722,-195.40384,0.50282097,-0.636883,41.146667,1275000 | |
| 97.9532,0.21684876,0.0145710325,-11.629898,0.19475836,97.52702,11.016036,-0.1568723,-101.216606,-188.37247,0.73387444,-0.67707634,38.61143,1280000 | |
| 97.67133,0.22025959,-0.0060682595,-12.870442,0.21083218,97.24631,7.7015076,3.0685503,-101.75503,-192.0714,0.5485664,-0.8603313,46.716652,1285000 | |
| 99.935844,0.20472117,-0.02105002,-13.775688,0.22731142,99.524864,8.378829,-4.801093,-103.80447,-186.81642,0.61926043,-0.6009003,41.267002,1290000 | |
| 98.31165,0.23172484,-0.003282709,-12.699469,0.2089986,97.87421,17.319931,3.183525,-102.21684,-177.27281,1.1293231,-0.921166,85.086105,1295000 | |
| 94.070274,0.1990931,0.015891235,-11.529778,0.18884577,93.66644,8.963618,-2.5495615,-97.92334,-180.9534,0.47150105,-0.52350676,40.591316,1300000 | |
| 95.481735,0.18849865,0.012544224,-11.731924,0.1916059,95.08909,17.868834,0.83237433,-99.42714,-191.83151,0.85668206,-0.8734483,57.088806,1305000 | |
| 98.6954,0.21234672,0.01577435,-11.538061,0.18920687,98.27806,9.80886,-5.5288353,-101.63962,-177.43382,0.6036979,-0.6053888,35.737915,1310000 | |
| 95.502464,0.19733684,0.0011426404,-12.430435,0.20417674,95.09981,10.545001,-0.9531243,-98.797386,-177.72348,0.9138199,-0.9433619,49.367874,1315000 | |
| 97.65958,0.1784852,-0.0065125227,-12.896791,0.21167454,97.27593,8.462811,-3.0014822,-101.25889,-182.46417,0.4799808,-1.1967839,46.90453,1320000 | |
| 92.690834,0.20164748,-0.0073330835,-12.949287,0.21135291,92.28517,7.290326,-1.8194964,-96.85494,-195.92825,0.4316411,-0.42292792,36.61888,1325000 | |
| 93.40744,0.21658587,0.013307361,-11.681036,0.18980536,92.98775,14.018176,0.5628443,-96.72567,-188.46745,0.76222956,-0.85618955,47.98011,1330000 | |
| 98.16495,0.2193129,0.013226874,-11.703338,0.19430888,97.7381,11.665961,3.273197,-101.15386,-196.18518,0.49754766,-0.6956313,40.151497,1335000 | |
| 90.57033,0.22895098,-0.017480338,-13.567389,0.22218952,90.136665,10.982618,0.37838393,-94.73927,-193.53415,0.54435694,-0.5591948,52.39071,1340000 | |
| 96.935684,0.20754603,0.0042799707,-12.237002,0.19914253,96.52472,11.74549,-3.5034714,-101.18446,-188.9403,0.77837056,-0.69141185,43.289806,1345000 | |
| 91.316795,0.21502182,-0.009029993,-13.048044,0.2149895,90.89582,14.107233,2.2335846,-94.70068,-182.81433,1.5105165,-1.6885539,49.10044,1350000 | |
| 93.87267,0.23107724,0.02016519,-11.261436,0.18334872,93.43808,19.71081,0.12467815,-97.18679,-185.73618,0.6150604,-0.43995136,46.01805,1355000 | |
| 91.78067,0.21734743,0.028816978,-10.721664,0.17373885,91.36077,14.646544,4.7322397,-95.67447,-183.98152,0.72038496,-0.39805412,44.583366,1360000 | |
| 93.99297,0.1870278,-0.017417416,-13.578894,0.21921459,93.60415,18.69482,-0.49386385,-97.702866,-177.72754,1.4410852,-1.3137282,58.304688,1365000 | |
| 93.168175,0.22718468,0.007661748,-12.020463,0.19205558,92.74127,11.178107,-1.7067108,-96.48596,-173.18451,1.6772097,-1.7895246,48.409004,1370000 | |
| 91.38163,0.2023908,-0.015465705,-13.458682,0.21711889,90.977585,13.260116,-3.7521927,-95.36924,-190.57458,0.5291411,-0.9248805,46.961124,1375000 | |
| 94.255486,0.15672551,-0.01142629,-13.213985,0.21147045,93.89872,15.718274,4.705497,-97.4067,-181.23819,1.7301775,-1.7730728,68.597305,1380000 | |
| 90.76593,0.2032729,0.0030848836,-12.3053465,0.19501606,90.36456,10.905557,-1.7994486,-94.26046,-193.87616,0.8080861,-0.73433626,46.904022,1385000 | |
| 90.84083,0.17005563,-0.0031525467,-12.698545,0.2016302,90.47229,11.054842,0.51119196,-94.20448,-182.02281,0.5182627,-0.8513484,40.281,1390000 | |
| 84.47098,0.19480556,0.008907381,-11.944094,0.19138223,84.075874,13.852483,4.536584,-88.47855,-191.75435,0.7930914,-0.73312306,50.11859,1395000 | |
| 86.48782,0.19694921,-0.015609179,-13.480558,0.21459247,86.09189,9.146953,-1.4627726,-90.04824,-195.73132,0.80150187,-0.5282373,37.683357,1400000 | |