O2O / O2O-w-diff-ckpts /cube-double-play-singletask-task2-v0 /fedit /20260319_054536 /online_agent.csv
| actor/actor_loss,actor/bc_flow_loss,actor/edit_alpha_loss,actor/edit_entropy,actor/edit_entropy_loss,actor/edit_q_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step | |
| 142.22467,0.19724998,-0.003392768,-12.75399,0.17036617,141.86044,9.805751,-56.938065,-145.46315,-195.44598,0.44529516,-0.36793858,39.34777,405000 | |
| 139.81764,0.19557726,0.0049355817,-12.114027,0.15490662,139.46223,5.938343,-56.97401,-142.9116,-188.71814,0.38585398,-0.6409478,24.44507,410000 | |
| 142.47205,0.20879248,0.016501924,-11.199326,0.14208815,142.10468,6.341258,-49.264572,-144.88725,-195.88751,0.29550356,-0.34070557,26.331944,415000 | |
| 139.50183,0.17860708,-0.014844757,-13.578739,0.18685988,139.15121,9.0695915,-43.28179,-142.45775,-198.60043,0.26270103,-0.36135292,29.020561,420000 | |
| 134.13617,0.20409997,-0.0021690542,-12.643364,0.19129038,133.74295,15.052722,-48.167065,-137.59178,-194.25197,0.57770836,-0.66591465,42.43364,425000 | |
| 130.61128,0.19928366,0.003881416,-12.248251,0.18884107,130.21928,13.850858,-43.63822,-134.08699,-195.524,1.7957826,-1.7771385,57.855118,430000 | |
| 128.54376,0.17183661,-0.0073256684,-12.959245,0.20672013,128.17253,13.883544,-45.58586,-131.69533,-192.26152,0.704441,-0.51224196,40.669968,435000 | |
| 126.81196,0.2146208,-0.019095356,-13.664509,0.22406755,126.392365,14.327176,-5.7274394,-130.9311,-198.40053,0.3906818,-0.36371803,35.883106,440000 | |
| 125.806725,0.18302576,0.02981052,-10.698715,0.17705932,125.416824,15.800162,-19.843931,-129.13773,-194.43314,0.71952087,-0.76135075,41.07122,445000 | |
| 124.6656,0.17793618,-0.006242988,-12.883287,0.20984308,124.284065,15.375974,-7.5104413,-127.86031,-186.95538,1.4397291,-2.0634599,62.64809,450000 | |
| 123.28135,0.20897588,-0.005879716,-12.859491,0.2103254,122.86793,19.126133,-15.371694,-126.92218,-185.19652,1.6891512,-1.4827029,58.673157,455000 | |
| 121.47641,0.21695346,0.01229297,-11.781603,0.20160282,121.04556,12.078338,-0.02522032,-125.462234,-195.22052,1.222493,-1.1790318,45.213318,460000 | |
| 119.26785,0.17669764,0.009813637,-11.924593,0.20337537,118.87797,18.412064,-5.5330486,-122.68246,-193.20769,0.94419134,-0.9259949,59.706207,465000 | |
| 115.68386,0.20364721,0.010264613,-11.927105,0.21369901,115.256256,19.220808,-30.340061,-119.3469,-195.47362,0.55976826,-0.6381404,44.82702,470000 | |
| 119.75209,0.191796,0.00026517035,-12.484171,0.20913601,119.35089,16.21495,-1.3454994,-123.20503,-193.34491,0.88478035,-0.81840223,50.312397,475000 | |
| 118.3376,0.20955625,5.928335e-05,-12.496587,0.2170513,117.910934,20.496222,-1.3666053,-122.89668,-194.15404,1.1156993,-0.9846423,64.080536,480000 | |
| 117.52846,0.15975638,0.011763554,-11.838703,0.21059409,117.14634,19.238058,-13.044911,-121.03383,-182.97734,0.9260542,-0.998397,80.73567,485000 | |
| 114.98107,0.1821447,-0.02802917,-14.095164,0.24767086,114.579285,14.588266,-9.361954,-118.687355,-182.61952,0.8343776,-0.7852055,53.01512,490000 | |
| 114.66237,0.17383197,0.019565428,-11.411486,0.20511499,114.263855,21.856138,-1.839778,-118.170265,-187.53555,3.2695355,-3.235152,66.48562,495000 | |
| 111.034035,0.1820087,-0.012972684,-13.233714,0.23398322,110.63101,12.159671,-6.9047384,-114.41473,-179.86205,0.47060096,-0.43112326,43.679707,500000 | |
| 115.80381,0.20543118,0.007238078,-12.090468,0.21368742,115.37746,17.710814,-15.998586,-120.5949,-183.68678,0.9546672,-0.9548487,60.75303,505000 | |
| 113.549194,0.22652584,0.016017538,-11.579997,0.20161135,113.10504,16.599468,-20.434448,-117.20298,-181.01495,0.5060833,-0.50573003,42.90764,510000 | |
| 109.0155,0.1768633,-0.01886177,-13.596224,0.2339384,108.62356,14.179057,1.3046273,-112.79769,-180.71132,1.0487956,-1.0388619,53.729164,515000 | |
| 112.79665,0.18539357,0.016376335,-11.556786,0.20065191,112.39423,18.675333,-8.592517,-116.1793,-179.98224,1.2271938,-1.3222458,61.67128,520000 | |
| 114.62584,0.20339978,-0.0026624908,-12.652889,0.22034381,114.20476,13.26593,-14.8670435,-118.71555,-177.63503,0.5730812,-0.51445645,54.127457,525000 | |
| 114.462364,0.1985496,-0.0034407456,-12.692657,0.22668317,114.04057,16.969477,-7.997439,-118.51965,-184.66826,1.139284,-1.0990369,54.21824,530000 | |
| 114.29223,0.22971365,-0.0045444905,-12.753717,0.22843976,113.83862,12.968991,0.81336486,-117.82373,-181.63252,1.4438976,-1.2844524,63.993317,535000 | |
| 106.98438,0.17561813,-0.004069124,-12.731416,0.22386423,106.58897,14.007227,-3.9447756,-111.39441,-182.31357,0.61606693,-0.87352574,61.315056,540000 | |
| 108.23639,0.20547235,-0.015444699,-13.375903,0.23585576,107.8105,12.642759,-6.148325,-111.95725,-185.81625,0.4380914,-0.47955316,43.12178,545000 | |
| 111.16016,0.1627776,-0.0068611377,-12.886917,0.22852159,110.77571,11.653918,-0.50751185,-114.53645,-188.91502,1.0990227,-1.1433343,55.566727,550000 | |
| 109.92446,0.20906411,0.027088761,-10.966885,0.19377494,109.49454,7.93758,-5.9863563,-112.5084,-179.61174,1.1615518,-1.044347,48.595856,555000 | |
| 111.39829,0.1917037,0.011001644,-11.882542,0.21171872,110.98387,14.179515,-4.5432153,-114.89455,-187.63704,0.88315713,-0.80526143,49.088593,560000 | |
| 106.8727,0.20691302,-0.007513227,-12.915862,0.2333461,106.43996,11.945306,-1.9904928,-110.504395,-187.30493,0.3968167,-0.44055578,42.210594,565000 | |
| 107.02122,0.18739688,0.020604083,-11.32585,0.19874689,106.61447,11.667717,-7.4577923,-110.88082,-183.68802,0.87920254,-0.48426875,56.052666,570000 | |
| 111.654076,0.22465333,0.0383834,-10.261921,0.1759935,111.21504,16.008942,-7.6973495,-114.366234,-191.40315,1.0988207,-1.0105971,53.105633,575000 | |
| 109.081856,0.1932351,0.043528084,-10.038322,0.17750049,108.667595,14.522926,1.9009913,-112.02111,-177.01114,1.0965586,-1.1656919,61.233955,580000 | |
| 106.08879,0.19602299,-0.027652329,-14.040659,0.25200707,105.66841,17.21857,-4.158478,-109.85683,-180.51553,1.392746,-0.47971448,58.91733,585000 | |
| 103.58725,0.20343122,0.0029727442,-12.330069,0.21569961,103.165146,18.894281,-4.7199984,-107.32094,-187.74762,1.6120654,-1.6194942,72.59152,590000 | |
| 106.98519,0.18676691,0.0057946495,-12.177164,0.21857046,106.57406,11.0311365,-6.2588515,-110.32892,-182.58046,0.49919584,-0.5541354,39.469223,595000 | |
| 105.54729,0.18921968,0.01763878,-11.519598,0.20725341,105.13318,12.465834,1.6088665,-109.15065,-180.6389,0.6296998,-0.5911415,55.44529,600000 | |
| 105.42162,0.18626194,0.00268849,-12.352631,0.22535159,105.007324,10.600258,1.1076522,-109.03627,-177.2841,1.0322182,-1.0862784,51.59421,605000 | |
| 105.50738,0.2027498,-0.027987434,-14.074841,0.2501324,105.08248,12.658179,-3.7463593,-109.058815,-174.61728,0.5070495,-0.6069681,55.815037,610000 | |
| 106.43428,0.17930453,-0.009326104,-13.019765,0.23361272,106.030685,13.086246,2.1425176,-109.83788,-193.86005,1.1692036,-0.64800423,63.587616,615000 | |
| 104.33087,0.19253321,-0.007871761,-12.943193,0.22988996,103.91632,19.217735,1.4441602,-108.00958,-181.67577,0.62563884,-0.51666075,46.767532,620000 | |
| 100.93342,0.19470185,0.022521444,-11.197918,0.19368464,100.52251,10.159808,-1.7784482,-104.61147,-176.1988,0.73183465,-0.78390026,43.418377,625000 | |
| 104.994484,0.18470603,0.03691848,-10.454363,0.18867433,104.58418,11.584065,-5.7868376,-108.888016,-187.64406,0.70080024,-0.78722465,64.16923,630000 | |
| 101.30239,0.1953979,0.026314672,-11.037681,0.19862483,100.88206,10.292042,0.9212266,-104.260635,-175.13235,0.33379483,-0.59312475,46.37333,635000 | |
| 101.50235,0.19823349,-0.0061323014,-12.851336,0.22431056,101.08594,10.357642,0.49496436,-106.23502,-193.41193,0.6649617,-0.591452,45.24546,640000 | |
| 104.40377,0.19096564,-0.018157301,-13.506737,0.24360476,103.98736,10.906247,1.7986319,-108.48596,-187.88707,1.8207929,-1.4194535,52.869015,645000 | |
| 94.029045,0.20790523,0.023620684,-11.163839,0.19735464,93.60016,11.6212,-4.15136,-98.032715,-187.55223,0.68759316,-0.7079805,42.13076,650000 | |
| 105.180145,0.24150692,0.0058041243,-12.171896,0.2153195,104.717514,10.485339,-5.2126217,-109.22595,-189.89667,0.4451899,-0.38450944,36.895714,655000 | |
| 100.12052,0.22727837,0.0014495864,-12.417002,0.21686614,99.67493,14.92912,2.4681795,-104.42549,-177.26454,0.74425006,-0.57501066,48.638695,660000 | |
| 102.33838,0.20558006,0.010077734,-11.926068,0.20941123,101.91331,14.744016,1.5924649,-106.02773,-189.98253,0.5506395,-0.5838308,48.830627,665000 | |
| 100.3568,0.20062822,-0.0073483586,-12.917844,0.22717807,99.93633,12.260611,-4.110455,-104.513626,-180.39558,0.5570179,-0.6603365,53.06993,670000 | |
| 99.99706,0.22289923,0.008967151,-11.98362,0.20810036,99.5571,12.319209,-1.8155595,-103.436356,-190.1067,0.86313486,-0.5108046,52.98831,675000 | |
| 102.313385,0.19417408,-0.011565083,-13.149618,0.23410127,101.896675,14.345215,6.527643,-106.62862,-177.52533,1.0757029,-0.5579598,60.77507,680000 | |
| 98.99212,0.1893543,0.0007038871,-12.459703,0.21764202,98.58442,23.574797,-2.5339584,-102.69148,-183.25351,1.9973627,-2.0867567,86.24567,685000 | |
| 96.130516,0.19397487,-0.022631805,-13.790447,0.24185626,95.71731,18.822353,0.28472924,-100.031944,-181.43718,0.8578789,-0.8402781,76.57361,690000 | |
| 97.72576,0.22853991,0.019465836,-11.382367,0.19824693,97.27951,13.190902,2.7169483,-100.9912,-186.27829,0.88386786,-0.8938185,44.09863,695000 | |
| 102.52866,0.21629149,0.019145863,-11.403129,0.19904134,102.094185,12.096599,-9.119725,-106.07815,-182.22836,0.48855025,-0.48337433,46.539,700000 | |
| 101.51931,0.20107162,0.010869889,-11.8681965,0.20418686,101.10318,12.8593445,-4.883183,-104.99103,-181.45404,0.93955064,-0.5850918,59.279396,705000 | |
| 98.886185,0.1830818,-0.039381944,-14.763855,0.2568315,98.48566,13.961517,-4.928098,-103.05845,-191.85965,1.7582738,-1.7676892,51.672466,710000 | |
| 98.69067,0.193122,0.017439522,-11.484745,0.19727895,98.28282,14.824216,-3.1401956,-102.46619,-171.33221,0.8527688,-0.7354639,47.528008,715000 | |
| 97.16074,0.20946798,0.015919445,-11.59899,0.20493622,96.73042,14.538841,1.9871198,-101.290794,-172.08179,0.44246832,-0.5103479,48.898342,720000 | |
| 98.50649,0.17979497,-0.007589332,-12.941291,0.22256464,98.111725,12.244751,-10.581043,-101.90107,-191.91794,0.42243,-0.5946408,40.636265,725000 | |
| 93.354546,0.21264416,-0.00015120793,-12.508729,0.21668269,92.92537,11.955328,-2.6755898,-96.429955,-171.02626,0.5872266,-0.6679362,53.51135,730000 | |
| 98.50614,0.21205312,0.011974183,-11.816626,0.2070526,98.075066,13.965573,-3.3398297,-101.56211,-179.265,1.3110914,-1.1805464,62.51306,735000 | |
| 97.98349,0.16851035,0.004953969,-12.213509,0.21119428,97.59883,10.929885,6.7827396,-101.207054,-174.5349,0.62281805,-0.7154352,53.4946,740000 | |
| 103.56326,0.16951722,-0.006322426,-12.872276,0.21861184,103.18146,12.476272,-1.9426899,-107.09063,-179.75507,0.66306156,-0.6584883,54.696,745000 | |
| 91.43585,0.17501467,0.039277546,-10.207924,0.17492536,91.04663,14.793854,-1.8184315,-94.853004,-194.53389,0.47727185,-0.50112796,41.22413,750000 | |
| 97.67782,0.19544353,0.042430524,-10.0362425,0.17284292,97.267105,14.836095,3.2336733,-100.90886,-177.92732,0.6724175,-0.6845518,45.210747,755000 | |
| 91.7408,0.2242035,-0.0033059488,-12.693747,0.21659675,91.3033,12.139722,6.185742,-95.54708,-177.97159,1.3230456,-1.192579,53.56531,760000 | |
| 97.34703,0.20600411,-0.032316055,-14.369734,0.24836321,96.92499,17.248533,-6.157846,-100.455956,-193.77246,0.66694874,-0.6018577,42.837852,765000 | |
| 95.76429,0.19711839,0.0109218275,-11.859816,0.20233369,95.35391,19.586796,-3.28389,-99.27317,-186.6871,0.51644987,-0.47388953,53.05974,770000 | |
| 95.75828,0.18849564,-0.0058916584,-12.846695,0.2183139,95.35736,14.186653,2.254191,-99.40853,-180.29501,1.6556274,-1.5490323,57.30641,775000 | |
| 92.38485,0.21452543,0.011731434,-11.799142,0.19750196,91.96109,14.500409,3.0059357,-95.765976,-179.23204,1.5781146,-1.6244335,64.64287,780000 | |
| 96.487175,0.21060373,-0.0017931715,-12.606966,0.21134238,96.067024,12.124263,-2.51704,-100.38101,-187.08223,0.7850716,-0.75432557,54.621616,785000 | |
| 96.89853,0.20197164,-0.008143415,-12.971868,0.2238664,96.48083,16.647654,2.8885932,-100.96055,-184.56966,0.63071895,-0.7392853,51.058548,790000 | |
| 95.57525,0.20329508,-5.3492746e-05,-12.50313,0.21368547,95.158325,14.6787,5.813659,-99.99287,-173.2625,0.43661344,-0.46026474,42.80774,795000 | |
| 91.80034,0.19116792,0.020269455,-11.290085,0.18914042,91.39976,9.51644,-1.355526,-95.85372,-177.39125,0.72358036,-0.8402512,55.97972,800000 | |
| 93.77563,0.20956951,-0.0016382892,-12.596235,0.21443567,93.35326,24.343,1.3357842,-97.41246,-184.06499,2.2914524,-2.0517406,75.118126,805000 | |
| 98.11002,0.21711528,0.012882368,-11.733853,0.19729878,97.682724,13.457941,0.6117728,-101.03038,-178.7308,0.4716434,-0.49188453,47.543114,810000 | |
| 94.60032,0.21953103,0.0029066121,-12.327898,0.20820457,94.16968,11.893686,-1.2987251,-97.981186,-174.35974,0.919945,-0.8435753,47.220837,815000 | |
| 95.175026,0.18027076,-0.009262448,-13.053003,0.21862936,94.78539,13.106071,1.7474558,-98.707855,-181.46506,0.4509476,-0.49307296,40.1418,820000 | |
| 91.06041,0.20583534,-0.0128686195,-13.272969,0.2209723,90.64648,8.33669,-5.1908607,-95.5021,-187.82428,0.5254419,-0.36422923,41.941,825000 | |
| 90.45305,0.21207413,-0.00407471,-12.738085,0.21800637,90.02704,10.809904,8.592395,-93.78776,-174.8729,0.8781694,-0.83012044,42.690674,830000 | |
| 96.69761,0.20288077,-0.008225537,-12.989187,0.2184093,96.284546,10.185951,0.03464684,-100.15487,-184.31267,0.4039918,-0.77936983,43.78657,835000 | |
| 87.55371,0.20413756,0.0010917006,-12.435368,0.21004474,87.138435,8.250606,2.191376,-91.233116,-185.03397,0.322233,-0.61796796,37.67129,840000 | |
| 93.43861,0.19246097,0.037776668,-10.239003,0.17107294,93.0373,10.612015,-2.6316803,-97.3837,-183.00148,1.7473373,-0.5594089,55.38513,845000 | |
| 87.573746,0.19998986,-0.00498279,-12.796703,0.21490587,87.16383,10.651252,-3.0807412,-91.5543,-182.87138,0.80568904,-0.8190322,51.41633,850000 | |
| 91.60055,0.20965266,0.022144469,-11.172183,0.18632239,91.18242,13.888168,-1.5874568,-94.47501,-179.64635,0.64695096,-0.5956812,49.621346,855000 | |
| 89.22641,0.20564404,0.012098176,-11.768193,0.1945509,88.81412,16.65694,4.060488,-93.29956,-174.18019,0.9447881,-0.50205225,52.336014,860000 | |
| 93.912155,0.19216594,-0.017110169,-13.529602,0.2248381,93.51226,11.485209,4.8414893,-96.92926,-184.2908,0.48704162,-0.5802207,35.269814,865000 | |
| 91.93932,0.19218534,-0.0032075685,-12.695056,0.20876196,91.54158,14.467067,-0.22931968,-95.24652,-170.80632,1.5706182,-0.8673708,48.381744,870000 | |
| 91.16346,0.17615911,0.00017596195,-12.489485,0.20899948,90.77812,9.735013,-5.537423,-95.11013,-189.76671,0.77968556,-0.8614044,60.71826,875000 | |
| 91.51225,0.197838,-0.029265232,-14.262323,0.23684089,91.10684,14.927167,0.18784434,-95.3237,-176.21082,0.47260365,-0.48853406,44.99313,880000 | |
| 88.51375,0.17240968,-5.2326533e-05,-12.503159,0.20713392,88.13426,11.795323,0.5494245,-92.40301,-183.36504,0.8624656,-0.7748262,59.19551,885000 | |
| 89.68305,0.20532899,-0.00028636534,-12.517385,0.20619166,89.27182,14.873596,4.1464705,-93.373375,-181.27982,1.6405364,-1.4344778,62.82807,890000 | |
| 85.40258,0.17088136,0.018355524,-11.38454,0.18733898,85.026,19.461613,1.3264853,-89.16634,-184.35254,0.91269875,-1.2005254,75.41293,895000 | |
| 85.07639,0.21939209,-0.0064551653,-12.896566,0.20992568,84.653534,13.13906,1.5214543,-88.177444,-188.80399,0.62370646,-0.7047949,50.695316,900000 | |