O2O / O2O-w-diff-ckpts /cube-double-play-singletask-task2-v0 /fedit /20260320_005157 /online_agent.csv
| actor/actor_loss,actor/bc_flow_loss,actor/edit_alpha_loss,actor/edit_entropy,actor/edit_entropy_loss,actor/edit_q_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step | |
| 144.4084,0.17309554,0.01013396,-11.687023,0.14568166,144.0795,5.1888213,-52.495953,-147.1396,-198.0635,0.23348516,-0.6637227,33.719666,1005000 | |
| 139.30151,0.17696272,-0.009648124,-13.289133,0.162476,138.97173,8.637425,-23.002125,-142.2101,-194.46184,0.5745598,-0.57198757,28.55483,1010000 | |
| 139.84102,0.18007454,0.010033009,-11.724112,0.15160441,139.4993,6.5845413,-39.448307,-142.92863,-195.60527,0.5203078,-0.47028893,23.496502,1015000 | |
| 136.45786,0.19024755,-0.018002905,-13.85706,0.18382922,136.10179,9.449695,-36.26998,-139.76297,-201.1817,0.27692485,-0.33133727,29.117558,1020000 | |
| 135.08223,0.207127,0.017962113,-11.172236,0.15113911,134.70601,14.703247,-8.479385,-138.4066,-194.57385,0.6501119,-0.6513935,34.509106,1025000 | |
| 131.53441,0.17204146,0.00950929,-11.819162,0.16507876,131.18777,15.026511,-16.640718,-134.95425,-194.80849,0.5799519,-0.60933626,44.477047,1030000 | |
| 130.62842,0.19076452,-0.0007052944,-12.548601,0.18210389,130.25626,11.410281,-7.4051185,-133.89185,-198.94281,0.47256917,-0.42395982,29.923996,1035000 | |
| 127.8723,0.1429317,0.0030792877,-12.2885895,0.17898872,127.5473,17.541197,-20.765274,-131.91872,-200.16103,0.64462596,-0.66667277,37.63832,1040000 | |
| 127.51706,0.1833891,0.014797973,-11.521598,0.17425995,127.14461,13.454521,-11.882954,-130.44933,-199.55238,1.0539817,-1.1136581,40.176193,1045000 | |
| 125.061775,0.20003533,-0.0051979963,-12.831512,0.20119351,124.66574,14.074391,-17.56693,-128.64497,-193.78233,0.9259103,-1.1266578,62.592964,1050000 | |
| 121.95757,0.1838625,-0.034920998,-14.641917,0.23871621,121.569916,19.704227,-11.49902,-126.57818,-189.52847,1.6422628,-1.9261513,74.95491,1055000 | |
| 120.62932,0.18296969,-0.004502388,-12.781664,0.2043145,120.24654,16.903503,-26.224688,-124.96448,-199.57733,0.48046458,-0.44925645,37.692135,1060000 | |
| 119.231026,0.17698726,-0.009856355,-13.120396,0.20844647,118.85545,16.763874,-2.8544264,-122.90635,-197.81677,0.4721732,-0.55254114,49.053032,1065000 | |
| 116.83299,0.20097816,-0.018048072,-13.652539,0.21379057,116.43627,18.011023,-30.775711,-120.37146,-193.60374,0.65939826,-0.67872167,49.2378,1070000 | |
| 120.26202,0.20310634,-0.02117106,-13.804028,0.22411023,119.855965,15.898168,-7.6461763,-124.19289,-198.3079,2.3208015,-2.1016119,49.90384,1075000 | |
| 119.08539,0.18978211,0.0135680465,-11.684372,0.1943706,118.68767,13.9244995,-5.4228864,-122.69033,-195.81505,0.7004239,-0.7867006,43.79332,1080000 | |
| 118.6226,0.19796658,0.01244488,-11.748307,0.19450271,118.21768,15.981272,-9.345109,-122.30186,-197.41763,0.78454083,-0.71013707,43.73771,1085000 | |
| 115.686775,0.17398795,-0.03048399,-14.355391,0.23585846,115.30742,14.001093,-11.740263,-119.3702,-193.05507,0.6473081,-0.326892,38.00142,1090000 | |
| 117.62651,0.17015399,-0.012088029,-13.248764,0.21388772,117.254555,15.681006,-0.98620987,-121.05935,-194.07239,2.8696895,-2.8297503,55.74931,1095000 | |
| 111.555885,0.19868356,0.0013050471,-12.4227295,0.20981158,111.14609,16.084282,-5.435948,-115.53562,-189.87395,0.6887911,-0.78116214,44.819862,1100000 | |
| 116.09745,0.19949594,-0.015645819,-13.429947,0.22595112,115.68765,18.82363,-3.734115,-120.08788,-193.04196,0.84436464,-1.4455993,58.76275,1105000 | |
| 114.07877,0.1762133,0.009535828,-11.923918,0.19737533,113.69565,12.477162,-8.213863,-117.49518,-182.89864,0.5786928,-0.65248466,40.505054,1110000 | |
| 113.08428,0.15378517,-0.017225446,-13.527666,0.22674689,112.72098,14.794947,2.21136,-116.64385,-191.50354,0.43888354,-0.4439856,42.104485,1115000 | |
| 113.53056,0.19852608,0.014702647,-11.615658,0.19311634,113.12422,11.803645,-12.637952,-116.99575,-189.10612,0.52292067,-0.6487677,41.521667,1120000 | |
| 116.06072,0.21568976,-0.0066967607,-12.8922825,0.22008765,115.631645,15.541046,-4.023478,-119.81746,-192.06918,0.49330556,-0.98071057,38.763065,1125000 | |
| 115.18526,0.18253393,0.013632576,-11.713127,0.20292997,114.78616,15.251346,-6.570859,-119.28975,-190.91695,0.61246455,-0.65727466,42.37417,1130000 | |
| 115.80029,0.20250255,0.008222125,-12.011845,0.20231856,115.38725,11.385228,2.6393247,-119.38738,-190.30974,0.7024144,-0.537431,45.520885,1135000 | |
| 109.72176,0.21579337,-0.008542402,-13.005258,0.21988018,109.29464,10.239298,-0.10273175,-113.90027,-190.25851,0.8459465,-0.49597996,40.3012,1140000 | |
| 111.171455,0.19626084,0.02057825,-11.283347,0.19084452,110.76378,14.297111,0.3425782,-114.77368,-189.36137,0.5792942,-0.6276986,46.356102,1145000 | |
| 112.032585,0.17133851,0.0062026144,-12.140506,0.20946893,111.64557,12.981761,-3.9038403,-115.83785,-196.83202,1.0351857,-0.95809627,41.107826,1150000 | |
| 110.15676,0.2111508,0.007152241,-12.084211,0.20786808,109.73059,7.8639297,-4.5063343,-113.20684,-188.22247,0.4656523,-0.6041104,32.830177,1155000 | |
| 112.954926,0.21914805,-0.004112801,-12.736025,0.2219289,112.51796,14.353754,2.864946,-115.72866,-195.98856,0.43073225,-0.4166362,40.61218,1160000 | |
| 110.42498,0.21315818,-0.020544987,-13.69383,0.23566142,109.996704,10.236064,-2.5688565,-114.41831,-194.82623,0.74292564,-0.6645662,44.2381,1165000 | |
| 108.85328,0.15851572,0.020974385,-11.280209,0.19396387,108.47983,10.89223,-4.664843,-112.266945,-187.13329,0.9749109,-0.9087961,42.098602,1170000 | |
| 112.13996,0.19866726,0.02716975,-10.927748,0.18884003,111.72528,10.776504,-8.0781555,-115.42187,-195.61418,0.69936717,-0.63126624,43.75266,1175000 | |
| 109.661606,0.20886102,0.02682049,-10.983514,0.19425383,109.231674,9.980611,0.29996538,-113.06243,-194.38899,0.68259525,-0.6183017,40.337357,1180000 | |
| 107.057724,0.19873145,-0.014163649,-13.316246,0.2310659,106.64209,8.664744,2.3873942,-110.38174,-184.6448,0.76307064,-0.6230946,37.67279,1185000 | |
| 105.67403,0.1739096,-0.017557284,-13.520647,0.23258367,105.28509,14.075866,-2.5449407,-109.247574,-193.83493,1.3813646,-0.91141915,62.511353,1190000 | |
| 106.67274,0.19779196,-0.011027919,-13.135319,0.22800402,106.257965,14.637759,-0.7462112,-110.03509,-187.62706,0.82195616,-0.34227204,52.13639,1195000 | |
| 107.20281,0.18850347,0.016710753,-11.54085,0.20106992,106.796524,12.413599,-5.1422367,-111.29185,-189.7326,0.90906215,-0.64824826,47.977108,1200000 | |
| 106.87177,0.16234514,-0.011245861,-13.144133,0.22948238,106.49119,10.3190155,-4.015192,-110.33533,-177.06537,0.5291586,-0.9998961,43.54429,1205000 | |
| 106.96306,0.19460271,-0.0016361203,-12.593751,0.21978328,106.55031,12.171466,-0.746665,-109.913,-181.99379,0.5648663,-1.1453551,56.524895,1210000 | |
| 108.98769,0.20914058,4.4816472e-05,-12.497469,0.22128844,108.55722,13.424373,2.6971955,-112.50118,-197.18326,0.6260827,-0.7038702,47.87917,1215000 | |
| 105.09281,0.23834929,0.0155517375,-11.602005,0.20092689,104.637985,10.798381,2.1008604,-108.76255,-180.31602,0.6665114,-0.76300293,35.611122,1220000 | |
| 102.65714,0.21092537,0.010044544,-11.929779,0.21014518,102.22603,11.247155,-6.543077,-106.326195,-178.60173,0.77953035,-0.62754923,46.91847,1225000 | |
| 105.93126,0.22808224,0.054832127,-9.323914,0.16096854,105.48738,10.828718,0.96957076,-109.00561,-190.87135,0.5593208,-0.53374904,41.257294,1230000 | |
| 102.02902,0.23135278,0.029288247,-10.845885,0.19204047,101.57634,7.031616,-4.4241996,-104.947586,-181.96442,0.53099847,-0.46812478,36.0318,1235000 | |
| 103.52145,0.20044789,0.030093696,-10.726958,0.1820678,103.10884,9.402107,2.7378054,-107.6168,-191.71962,0.39314097,-0.4195359,36.500637,1240000 | |
| 105.274,0.19531853,0.005092932,-12.205944,0.21140209,104.86218,8.663789,-3.6863377,-108.88723,-192.62604,0.65522504,-0.69915056,37.517033,1245000 | |
| 95.467094,0.20651172,0.02095718,-11.260839,0.19044782,95.04918,9.35362,1.5048025,-99.26393,-189.00523,0.5989109,-0.5709751,37.84695,1250000 | |
| 107.84936,0.21940915,0.0033061549,-12.306912,0.21072593,107.415924,11.688501,-1.2205225,-111.75122,-192.20303,0.7258249,-0.6705856,41.76359,1255000 | |
| 102.32596,0.19350305,-0.018655404,-13.597704,0.23109208,101.92001,18.129576,1.8546538,-105.91322,-180.97362,2.8931332,-2.8245146,90.83487,1260000 | |
| 103.88827,0.19429186,0.002428966,-12.358697,0.21244307,103.47911,14.330042,-0.66923666,-107.47402,-195.15973,0.96221447,-0.62759584,51.519577,1265000 | |
| 101.72277,0.17639741,-0.02621281,-14.021259,0.24160023,101.330986,12.290746,0.5767433,-105.90625,-182.43742,0.7233818,-1.015738,67.99472,1270000 | |
| 101.43822,0.2589123,0.028336963,-10.818126,0.18226857,100.968704,9.707646,-6.197583,-104.472084,-196.61276,0.4976939,-0.47918114,39.01912,1275000 | |
| 104.57216,0.22809008,-0.00829879,-12.983227,0.22297,104.1294,13.2933855,-3.9007223,-108.73335,-194.59885,0.47767952,-0.9988346,52.552254,1280000 | |
| 99.125145,0.20152509,0.016969359,-11.513155,0.19797522,98.70868,13.956697,4.7797756,-102.54107,-180.91628,0.8924891,-0.93492854,45.87147,1285000 | |
| 96.88838,0.20515703,-0.0313077,-14.348032,0.2430715,96.471466,18.902115,1.1181347,-101.20715,-186.86835,1.071536,-1.1704524,52.612873,1290000 | |
| 96.158035,0.23442268,0.030076949,-10.722738,0.181463,95.712074,14.23545,0.7131933,-99.96081,-192.46275,0.7413616,-0.7281073,52.919075,1295000 | |
| 103.79574,0.21282905,0.025431968,-11.012491,0.1882808,103.3692,14.921979,-4.2234864,-107.47434,-181.02919,0.9002108,-0.8622433,52.926247,1300000 | |
| 103.21292,0.18425688,0.004937605,-12.210489,0.20824987,102.815475,13.282519,0.48120505,-107.02981,-193.4308,0.7191449,-0.6336026,39.500755,1305000 | |
| 99.4298,0.2029992,-0.036827434,-14.707047,0.24540606,99.01822,11.960586,-0.23398831,-103.94147,-192.09857,0.7827479,-0.8454186,41.31266,1310000 | |
| 100.02914,0.19505593,0.0031418658,-12.311076,0.20473728,99.626205,19.325802,2.8029733,-103.93719,-174.32886,1.9949422,-2.0873544,80.811295,1315000 | |
| 101.00037,0.18518214,-0.0008633871,-12.550953,0.21267346,100.60337,16.011314,-1.8596536,-105.311195,-179.10262,0.5315233,-0.5331034,43.61187,1320000 | |
| 98.53554,0.19300088,-0.0106897205,-13.140289,0.21937898,98.13385,11.233377,-3.9312325,-102.30115,-196.30164,3.0610101,-2.8097048,73.906136,1325000 | |
| 96.92799,0.22555499,0.0087744435,-11.965403,0.19639032,96.49728,8.559509,-0.5949456,-99.810486,-181.45924,0.939312,-0.81442237,46.16909,1330000 | |
| 101.1596,0.24452713,0.019567383,-11.335874,0.19054063,100.704956,11.436725,-3.0219588,-104.47903,-191.47183,0.5826118,-0.6574091,50.794445,1335000 | |
| 100.81999,0.21261466,0.007146833,-12.068523,0.19989896,100.40033,15.0016575,0.054602563,-104.022606,-182.33171,0.7150445,-0.61392385,52.69715,1340000 | |
| 104.99609,0.20619553,-0.047807854,-15.3827,0.2551129,104.582596,15.61514,-2.5161107,-109.03402,-184.12311,0.73921925,-0.45780316,50.858025,1345000 | |
| 93.96289,0.21521285,0.05660181,-9.114948,0.15241203,93.538666,14.122024,-1.8263075,-97.410324,-197.53696,1.0069737,-0.5011975,60.389217,1350000 | |
| 100.91636,0.23390386,0.039589804,-10.098106,0.16644454,100.476425,17.478304,0.38572097,-104.01147,-182.82059,1.117592,-0.99429524,65.20374,1355000 | |
| 94.42095,0.19327563,-0.013057126,-13.291747,0.21920133,94.02153,17.452082,3.5103111,-98.34838,-190.24336,1.2397919,-0.82919854,62.048965,1360000 | |
| 100.292656,0.19071409,-0.026793513,-14.099317,0.23620728,99.89253,16.030691,5.4755344,-103.974,-197.40318,0.66877973,-0.5501449,47.804535,1365000 | |
| 98.2816,0.21627139,-0.022980547,-13.870466,0.23258573,97.85573,13.429313,1.676564,-101.99857,-186.84729,0.9334692,-0.45445925,47.15665,1370000 | |
| 96.74265,0.197249,-0.004520745,-12.772412,0.21196114,96.33797,9.4805765,1.4193426,-100.50518,-193.27809,0.714216,-1.0641919,52.970108,1375000 | |
| 96.45968,0.16603844,0.02709258,-10.861577,0.1796045,96.086945,12.272731,-0.60102594,-99.366,-193.32045,1.2303681,-1.000957,46.247833,1380000 | |
| 98.18589,0.17925516,-0.016245387,-13.482033,0.22302803,97.79985,13.579948,3.0346441,-102.28371,-194.01915,0.42739427,-0.53876793,40.70731,1385000 | |
| 98.17783,0.17452812,-0.010165387,-13.114357,0.21699516,97.79647,13.137441,-5.175605,-102.40053,-180.3458,0.48776782,-0.68518937,45.562157,1390000 | |
| 99.4506,0.20514281,0.0034454365,-12.290781,0.20240563,99.039604,10.170339,-4.9180493,-103.53904,-178.83862,0.7893916,-0.45951167,54.12285,1395000 | |
| 93.666695,0.17933673,0.015241821,-11.582521,0.19241726,93.27969,11.320576,10.720198,-97.06602,-175.78653,2.832233,-2.864868,69.79698,1400000 | |
| 93.53375,0.17943063,0.0022880917,-12.362028,0.20500882,93.147026,14.464835,4.4165416,-97.59692,-186.75548,1.0091656,-0.92939985,56.612083,1405000 | |
| 98.30739,0.21549094,-6.450081e-05,-12.503983,0.20251302,97.88944,13.043059,-3.7746258,-101.72964,-181.54878,0.44974348,-0.39402252,37.19667,1410000 | |
| 94.508156,0.21198982,0.0009299666,-12.442497,0.20122702,94.09401,19.275888,3.74663,-98.72877,-174.74109,0.7352816,-1.0321537,66.12491,1415000 | |
| 97.31555,0.1973686,-0.008560073,-13.024936,0.2123963,96.91435,10.189555,1.7078452,-101.19876,-181.4718,0.80018896,-1.0294946,45.811485,1420000 | |
| 91.64408,0.21553618,-0.027007962,-14.141559,0.23266587,91.222885,8.334312,-3.9511795,-95.81732,-192.44719,0.5563668,-0.55297416,39.466526,1425000 | |
| 92.10221,0.17744556,0.017590117,-11.431155,0.18812399,91.71905,12.586532,0.30195004,-95.662926,-189.52826,1.1784267,-1.2068053,48.732372,1430000 | |
| 97.819,0.19950023,0.0033519673,-12.296234,0.20227419,97.41388,12.384676,6.361733,-100.6973,-195.23416,0.63614905,-0.64525634,40.157906,1435000 | |
| 87.508835,0.21779028,-0.005350979,-12.826469,0.21023156,87.08617,16.477825,7.47219,-91.242516,-193.97185,0.51973706,-0.36439723,41.991234,1440000 | |
| 95.36434,0.20376654,0.018058559,-11.379389,0.1833779,94.95914,7.9670167,-3.0075722,-99.92777,-191.20782,0.89031553,-0.8187602,41.98015,1445000 | |
| 91.687004,0.21111271,-0.011858591,-13.246592,0.21040408,91.27734,11.21865,-1.9255507,-95.218864,-183.37303,0.79599184,-0.5841421,42.271656,1450000 | |
| 95.33792,0.20719285,0.0026909984,-12.33403,0.19998124,94.928055,11.492063,-4.366525,-98.972565,-186.87672,1.0044495,-0.5977879,42.681534,1455000 | |
| 91.08106,0.20014614,0.0072255004,-12.0482,0.19268306,90.68101,12.769612,-2.6788497,-95.01554,-183.81412,0.9885431,-0.96797484,47.681602,1460000 | |
| 93.36493,0.18194455,-0.01057833,-13.152818,0.2131297,92.98044,11.843424,-5.1826563,-97.48171,-175.43277,1.089936,-1.0512753,46.915855,1465000 | |
| 92.16897,0.18954806,0.010816161,-11.82626,0.1898576,91.77875,15.044296,-3.0964909,-95.523926,-168.88097,0.84337056,-0.7282294,41.488434,1470000 | |
| 93.857765,0.19377479,-0.009639554,-13.098482,0.2109729,93.462654,7.127103,5.737853,-96.73793,-190.11949,0.31053412,-0.30493706,32.33541,1475000 | |
| 92.58727,0.18863712,-0.01844987,-13.649101,0.21914878,92.19794,16.709229,1.6111307,-96.3656,-180.56853,0.42664236,-0.5064059,44.908485,1480000 | |
| 91.02209,0.19266635,0.0066294307,-12.083945,0.19254601,90.63025,11.760968,1.4176176,-94.09954,-195.16634,0.71566725,-0.8087704,66.71344,1485000 | |
| 91.35259,0.2018925,-0.010936768,-13.178903,0.21230526,90.94934,14.535733,7.2325125,-94.898094,-184.8937,0.7999317,-0.48331988,53.63892,1490000 | |
| 86.29956,0.18344884,-0.001520502,-12.595417,0.20071217,85.916916,14.259452,-0.6909279,-89.76678,-190.27112,0.58360213,-0.56678975,44.14792,1495000 | |
| 86.10573,0.22268292,-0.0072952774,-12.961872,0.204733,85.68561,10.75118,5.905188,-89.344666,-195.84227,0.74976707,-0.80259174,35.474865,1500000 | |