Tiredsheep commited on
Commit
f1d76c0
·
verified ·
1 Parent(s): 9290a10

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_250000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_300000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_350000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_400000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_450000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_500000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_550000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_600000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_650000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_700000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.032100898337100635,0.018013430354117597,-0.03220314910217288,-0.0018174535851372558,32.82097786641414,10.79999999999963,0.92,5975.76,-0.08,-299.2,214.0,0.6660559844970703,250000
3
+ 0.0,0.0,-0.008580130096298936,0.00981087398520963,-0.00784745580403333,0.004665798850437601,35.06966440004249,7.639999999999625,0.98,14884.72,-0.02,-216.06,150.8,0.47900086879730225,300000
4
+ 0.0,0.0,-0.011663867950245491,0.05076861665231991,-0.009363246581778074,0.046192377875139454,35.67358313270122,6.127999999999672,1.0,22263.1,0.0,-178.68,120.56,0.38775736808776856,350000
5
+ 0.0,0.0,-0.020764777769042144,0.0541114022905938,-0.016882484219918753,0.061675788472179534,35.16507761102275,4.49599999999977,1.0,27405.64,0.0,-127.92,87.92,0.2877710580825806,400000
6
+ 0.0,0.0,-0.030564958771079318,0.06370754781217387,-0.026824387801915626,0.0546009401570277,35.90741069401493,3.816999999999881,1.0,31599.2,0.0,-105.26,74.34,0.24462635993957518,450000
7
+ 0.0,0.0,-0.026583860444845106,0.06785783483161273,-0.0224980904801925,0.06032834204823372,35.67836030084676,3.627999999999852,1.0,35254.72,0.0,-104.44,70.56,0.23619484424591064,500000
8
+ 0.0,0.0,-0.02925354365151506,0.048986477891192315,-0.026154735849911813,0.04390185085645233,35.9144188093312,3.149999999999875,1.0,38820.5,0.0,-89.08,61.0,0.20783519744873047,550000
9
+ 0.0,0.0,-0.013547412162643904,0.054522985472731274,-0.010740163173055057,0.05137970496425071,35.925014993299186,3.1399999999998753,1.0,41939.18,0.0,-87.52,60.8,0.19969687938690187,600000
10
+ 0.0,0.0,-0.03368607053338356,0.06411059242079416,-0.03021719531312195,0.05277305218349021,35.8183528536541,3.052999999999887,1.0,45093.72,0.0,-84.5,59.06,0.19931025981903075,650000
11
+ 0.0,0.0,-0.028076519378313937,0.04897046259684214,-0.025441609123222172,0.04274102632749926,35.794637673860535,2.8639999999999066,1.0,48002.1,0.0,-80.4,55.28,0.18481061458587647,700000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.032100898337100635,0.018013430354117597,-0.03220314910217288,-0.0018174535851372558,32.82097786641414,10.79999999999963,0.92,5975.76,-0.08,-299.2,214.0,0.6660559844970703,250000
3
+ 0.0,0.0,-0.008580130096298936,0.00981087398520963,-0.00784745580403333,0.004665798850437601,35.06966440004249,7.639999999999625,0.98,14884.72,-0.02,-216.06,150.8,0.47900086879730225,300000
4
+ 0.0,0.0,-0.011663867950245491,0.05076861665231991,-0.009363246581778074,0.046192377875139454,35.67358313270122,6.127999999999672,1.0,22263.1,0.0,-178.68,120.56,0.38775736808776856,350000
5
+ 0.0,0.0,-0.020764777769042144,0.0541114022905938,-0.016882484219918753,0.061675788472179534,35.16507761102275,4.49599999999977,1.0,27405.64,0.0,-127.92,87.92,0.2877710580825806,400000
6
+ 0.0,0.0,-0.030564958771079318,0.06370754781217387,-0.026824387801915626,0.0546009401570277,35.90741069401493,3.816999999999881,1.0,31599.2,0.0,-105.26,74.34,0.24462635993957518,450000
7
+ 0.0,0.0,-0.026583860444845106,0.06785783483161273,-0.0224980904801925,0.06032834204823372,35.67836030084676,3.627999999999852,1.0,35254.72,0.0,-104.44,70.56,0.23619484424591064,500000
8
+ 0.0,0.0,-0.02925354365151506,0.048986477891192315,-0.026154735849911813,0.04390185085645233,35.9144188093312,3.149999999999875,1.0,38820.5,0.0,-89.08,61.0,0.20783519744873047,550000
9
+ 0.0,0.0,-0.013547412162643904,0.054522985472731274,-0.010740163173055057,0.05137970496425071,35.925014993299186,3.1399999999998753,1.0,41939.18,0.0,-87.52,60.8,0.19969687938690187,600000
10
+ 0.0,0.0,-0.03368607053338356,0.06411059242079416,-0.03021719531312195,0.05277305218349021,35.8183528536541,3.052999999999887,1.0,45093.72,0.0,-84.5,59.06,0.19931025981903075,650000
11
+ 0.0,0.0,-0.028076519378313937,0.04897046259684214,-0.025441609123222172,0.04274102632749926,35.794637673860535,2.8639999999999066,1.0,48002.1,0.0,-80.4,55.28,0.18481061458587647,700000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/edit_alpha_loss,actor/edit_entropy,actor/edit_entropy_loss,actor/edit_q_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 144.48218,0.20084155,0.007955507,-11.939722,0.16953468,144.10385,5.6320925,-61.609184,-147.72014,-192.55522,0.3365969,-0.3545817,34.435097,205000
3
+ 141.52284,0.20601317,0.0051709497,-12.13455,0.17169836,141.13997,8.522275,-49.670933,-144.36105,-189.64992,5.1706257,-7.740093,86.80667,210000
4
+ 141.91428,0.17490241,0.01826083,-11.226896,0.16103359,141.56009,8.085265,-51.68727,-144.41907,-189.92767,0.3219849,-0.34089342,31.617275,215000
5
+ 139.75023,0.18226436,-0.02458897,-14.171362,0.20848817,139.38406,7.448753,-39.921883,-142.92554,-199.56168,0.4707362,-0.34605148,39.64032,220000
6
+ 135.58205,0.21704067,-0.0012576939,-12.583085,0.1904755,135.17578,12.413958,-25.195766,-138.71,-191.81935,0.7280265,-0.64803606,59.958717,225000
7
+ 130.08755,0.18765236,0.015086443,-11.597219,0.19380215,129.69101,15.468149,-49.83012,-134.03163,-192.93794,1.0398954,-0.97762054,54.171432,230000
8
+ 130.44162,0.1888678,0.006047253,-12.134399,0.20071024,130.04599,11.8002,-42.18964,-133.5037,-189.61465,3.6813872,-3.652266,78.41486,235000
9
+ 130.88297,0.22584003,-0.014606258,-13.386118,0.22064905,130.45108,17.989021,-44.303562,-134.64374,-197.72902,0.9195378,-0.9870174,64.79435,240000
10
+ 131.55867,0.18186271,0.025066465,-10.969579,0.17966855,131.17206,11.021298,-23.255741,-134.35143,-201.91087,0.9887526,-0.48836735,41.54718,245000
11
+ 128.80318,0.20678943,-0.015101453,-13.382331,0.22904405,128.38245,12.094199,-33.19275,-132.44287,-190.24712,0.7013745,-0.5877644,41.800476,250000
12
+ 125.54997,0.18703696,-0.020380223,-13.695589,0.23345745,125.14986,15.098124,-7.386241,-129.13432,-189.60175,1.3864138,-1.3081933,56.94703,255000
13
+ 124.31259,0.21824645,0.0005268152,-12.46993,0.21846628,123.87535,14.957232,-5.7514653,-128.47237,-195.73836,1.030421,-0.9760635,80.46483,260000
14
+ 125.89017,0.19474377,-0.008222612,-12.975603,0.22433272,125.47932,12.199797,-30.707668,-128.94447,-195.33046,0.6997693,-0.70229477,49.997604,265000
15
+ 120.81332,0.19289371,-0.0194915,-13.588592,0.24330705,120.39661,21.915207,-30.642334,-124.371666,-201.77202,0.8438717,-0.813125,71.765045,270000
16
+ 122.494354,0.20799544,-0.030378412,-14.261794,0.24591446,122.07082,20.9703,-20.236235,-126.33733,-197.22522,2.4760046,-2.0115874,105.5294,275000
17
+ 123.49063,0.20606653,-0.018395767,-13.5148,0.24498925,123.05797,17.570011,-7.2122307,-127.25187,-196.16934,1.0048642,-0.96069825,80.91629,280000
18
+ 121.554375,0.19578737,0.0108189965,-11.902279,0.21543612,121.13233,13.894259,-36.35514,-125.29781,-197.84816,0.87089163,-1.0272144,64.01187,285000
19
+ 119.0697,0.19609824,-0.019701831,-13.591909,0.24524516,118.648056,16.67483,-9.279862,-122.77602,-191.60829,0.66713595,-0.71127427,57.63592,290000
20
+ 120.27925,0.18039733,-0.00013375818,-12.507637,0.21906422,119.87993,16.382938,-2.3988245,-123.41537,-189.57196,3.4317386,-3.420048,68.78206,295000
21
+ 115.216484,0.21515399,-0.012243445,-13.200209,0.23081124,114.78276,9.70177,-10.437784,-118.66335,-193.57097,0.64383346,-0.6483637,43.586178,300000
22
+ 119.501076,0.17617288,-0.008795963,-13.009455,0.22461402,119.109085,17.875471,-15.194057,-123.814514,-188.69203,1.0821308,-1.0835013,75.81144,305000
23
+ 118.00852,0.19232787,0.008458496,-12.027052,0.21509925,117.592636,16.713726,3.5033665,-121.50606,-186.2886,2.353953,-1.5965722,81.40209,310000
24
+ 113.55228,0.17097896,0.018878518,-11.43467,0.20263179,113.15979,12.901244,1.3406298,-116.846756,-186.32684,0.79442936,-0.86039066,47.06075,315000
25
+ 116.36646,0.19617718,0.008543284,-12.002956,0.20630918,115.95544,19.114908,-9.321144,-119.55932,-196.51677,1.0275877,-1.4465806,55.844055,320000
26
+ 117.38713,0.21147352,-0.008250286,-12.973329,0.22612973,116.95778,14.150728,-5.901023,-121.19329,-182.08931,0.83120906,-0.8294971,44.850304,325000
27
+ 116.75811,0.19610855,-0.0043269587,-12.74073,0.22900574,116.337326,16.160324,-5.6663594,-120.59756,-198.87804,2.15585,-2.2830417,53.35273,330000
28
+ 116.94549,0.19901495,0.009186578,-11.981067,0.21209855,116.52519,11.759593,1.6414704,-120.41815,-186.79749,0.53586686,-0.5250851,50.5316,335000
29
+ 108.93243,0.18757223,-0.051170416,-15.334039,0.27686608,108.519165,16.279835,-4.7676296,-113.5625,-183.38005,0.59261274,-0.790006,54.269386,340000
30
+ 113.84219,0.20547168,0.0011042095,-12.437635,0.22021721,113.4154,13.960497,-11.343479,-117.24744,-197.81271,0.9424458,-0.8763122,74.27308,345000
31
+ 113.14261,0.19256692,0.01456056,-11.682483,0.20807327,112.72741,13.435145,-4.731493,-116.97102,-193.97385,0.6362939,-0.5244417,47.549667,350000
32
+ 112.658356,0.19187821,0.050226495,-9.744099,0.17758687,112.23866,15.970774,-8.040866,-115.52478,-187.88014,1.6573689,-1.9955028,85.72754,355000
33
+ 113.9489,0.22773285,0.02687861,-11.013138,0.19908895,113.4952,14.736795,-6.699558,-117.49114,-186.91785,3.7270505,-3.7050714,107.29452,360000
34
+ 112.526695,0.18453003,-0.008910083,-12.991556,0.23548856,112.115585,13.551719,1.7961043,-116.11182,-190.64087,0.48566732,-0.54164183,50.633957,365000
35
+ 110.87313,0.20040402,0.03266639,-10.686939,0.19254938,110.44751,13.552001,-8.706027,-114.829704,-188.37375,0.9943002,-0.8764734,51.54306,370000
36
+ 113.31839,0.22617154,0.040899754,-10.241089,0.18542476,112.86589,20.346548,-2.9180305,-116.29736,-193.89908,1.061439,-0.9535161,74.86721,375000
37
+ 112.10307,0.18414056,0.030142447,-10.838998,0.19669688,111.69209,15.630881,2.9794111,-115.29461,-196.13448,1.0509855,-1.1081816,59.27148,380000
38
+ 107.93893,0.20868012,-0.03285881,-14.293082,0.26192534,107.50118,16.14296,-5.8019753,-111.6614,-179.94127,0.7113738,-0.70418465,46.92609,385000
39
+ 107.14751,0.18791865,-0.017461417,-13.463472,0.24400422,106.73305,15.503365,-10.185286,-110.75378,-200.5079,1.0120332,-0.7968678,60.829765,390000
40
+ 108.76094,0.18286063,-0.0035371901,-12.691629,0.23426835,108.34735,11.668123,-4.2940083,-112.68676,-201.29973,0.5523828,-0.5761741,51.239532,395000
41
+ 108.6889,0.17124566,-0.0048458534,-12.768627,0.23033744,108.29216,9.676522,-2.3043008,-112.710815,-198.99835,0.5341521,-0.55172676,47.346535,400000
42
+ 107.85487,0.2022472,-0.019386478,-13.569939,0.245877,107.42613,19.12713,-3.333591,-111.87544,-194.56795,1.1276473,-1.1018034,79.25743,405000
43
+ 109.1956,0.19780378,-0.021385392,-13.668522,0.2501508,108.76903,13.238149,-7.897752,-112.656166,-184.45027,0.4505389,-0.57169324,49.759193,410000
44
+ 108.95648,0.21866512,0.011095352,-11.880872,0.21291624,108.51381,12.348601,2.1229436,-112.45379,-198.30408,1.5401742,-0.936708,61.596863,415000
45
+ 107.78601,0.19296041,0.038201857,-10.429166,0.19239277,107.36246,14.963687,-5.8542953,-112.3101,-193.4103,0.7105955,-0.45953342,53.192596,420000
46
+ 100.86755,0.21008077,0.02927794,-10.926798,0.20335221,100.424835,18.414717,-1.1180243,-104.40838,-180.58965,0.7808968,-0.8466123,55.266632,425000
47
+ 106.99209,0.23280206,0.04400285,-10.078108,0.18310702,106.53217,12.4727545,0.22057597,-109.62371,-189.80302,0.7959405,-0.7455131,56.99437,430000
48
+ 102.15905,0.19823489,0.03952041,-10.32045,0.1871342,101.73416,14.295875,-7.1629725,-105.39282,-183.49532,0.5814135,-0.6473388,52.314888,435000
49
+ 105.74219,0.23047909,-0.00510736,-12.786837,0.22768006,105.28914,13.682334,1.91177,-109.62107,-194.26242,1.0837262,-1.1873109,61.283512,440000
50
+ 105.57046,0.21301453,-0.014497222,-13.302532,0.24030161,105.13164,15.52254,-2.4786177,-109.77361,-192.06009,0.6005032,-0.58952963,56.71501,445000
51
+ 96.02997,0.20390232,0.0068056514,-12.115505,0.21444741,95.60481,15.363355,-0.7407328,-100.571915,-188.8019,3.265701,-3.1980455,124.76698,450000
52
+ 107.834236,0.19974846,0.016163357,-11.605266,0.20964888,107.408676,12.720616,1.7086813,-111.479065,-191.27725,0.92290133,-0.8774392,56.13313,455000
53
+ 102.61572,0.21998237,-0.023953574,-13.807033,0.25303715,102.16666,14.961654,4.182927,-107.32101,-175.1483,1.3203807,-0.94046956,68.59372,460000
54
+ 105.71762,0.19785048,0.0053135836,-12.204096,0.2191503,105.29531,11.124604,0.13958555,-109.354935,-196.7954,0.33575726,-0.30397153,43.54039,465000
55
+ 104.55611,0.20837197,-0.0059245178,-12.830792,0.22980048,104.12386,15.764697,-0.1866479,-108.480385,-178.34082,0.55118746,-0.7164967,61.12774,470000
56
+ 101.89255,0.19421902,0.03815691,-10.404072,0.18940881,101.470764,18.49876,-3.1212564,-105.305984,-198.9275,0.6578603,-0.61028916,54.848602,475000
57
+ 104.3254,0.22101441,-0.0039160107,-12.719625,0.22679606,103.8815,15.808222,2.3985164,-108.30929,-185.74664,0.6763765,-0.63784397,55.039986,480000
58
+ 100.457726,0.17040385,0.015365672,-11.646547,0.20968594,100.06227,14.231496,-2.5880926,-104.08529,-186.18611,0.73227197,-0.68519914,66.28463,485000
59
+ 95.98286,0.19375272,-0.018650683,-13.547211,0.24127401,95.56648,12.929675,-1.7087694,-99.71756,-189.89651,1.4537938,-1.0739446,62.959198,490000
60
+ 96.95832,0.18100323,0.02298829,-11.199713,0.19800413,96.55633,15.424746,2.1550176,-100.73403,-187.70694,0.65347666,-0.66966665,51.564484,495000
61
+ 103.30666,0.18409148,0.011005498,-11.886796,0.21333864,102.898224,11.001643,4.4614487,-106.8218,-186.98354,1.0446597,-1.1974869,57.441597,500000
62
+ 104.11237,0.2119989,0.0064724083,-12.141982,0.2195082,103.6744,12.966901,-4.852639,-107.65192,-186.69624,0.6619718,-0.7371205,51.73815,505000
63
+ 101.219154,0.22665215,-0.029118562,-14.130408,0.25236452,100.76926,16.068237,2.7447135,-105.83877,-187.89012,1.6782681,-1.1656168,81.72133,510000
64
+ 99.659676,0.1991556,-0.003305091,-12.686611,0.22469395,99.23913,18.469042,0.37632442,-103.0979,-173.2029,1.4742724,-1.6946459,71.09447,515000
65
+ 101.53622,0.19294938,-0.013327824,-13.24182,0.23790753,101.11869,21.168392,0.3276844,-105.72636,-176.60555,0.7084468,-0.78685445,52.149307,520000
66
+ 100.001854,0.19316767,-0.015034795,-13.338364,0.23920357,99.58452,15.459645,-6.502727,-103.466896,-193.10562,0.8794011,-0.56086475,50.482197,525000
67
+ 94.66868,0.21223928,0.009364967,-11.976281,0.21415591,94.23292,12.669234,1.1424009,-98.52688,-179.6625,0.8318671,-0.8459036,47.53846,530000
68
+ 98.11875,0.24313857,0.031759333,-10.728203,0.19230224,97.65155,11.386756,-1.8942977,-101.29712,-195.2967,1.2640833,-1.1816268,49.766186,535000
69
+ 100.56572,0.1918727,-0.018083632,-13.522186,0.2392228,100.15271,10.468319,2.2365003,-103.838585,-178.03792,0.5896302,-1.004943,60.095757,540000
70
+ 104.29299,0.20302548,-0.020324063,-13.643448,0.24250366,103.86779,13.617067,0.26236588,-108.511635,-182.53113,1.6690643,-1.5379288,70.94473,545000
71
+ 93.35487,0.18078624,0.020062627,-11.357159,0.19937538,92.95464,12.353987,1.9561225,-96.49399,-195.6002,0.57203656,-0.49931806,49.33632,550000
72
+ 100.783035,0.2266238,0.05234677,-9.556952,0.16998556,100.33408,15.639102,-4.6070056,-103.794106,-179.04424,0.9387619,-0.981881,56.830452,555000
73
+ 93.595375,0.1952857,0.015811564,-11.615412,0.20761956,93.17667,13.199035,-0.6915468,-97.88607,-194.18123,1.2509279,-1.4785067,69.604866,560000
74
+ 100.571014,0.21253684,-0.013409591,-13.257418,0.23471403,100.13718,18.589264,-2.3848374,-104.782585,-195.90927,0.9690139,-1.058016,65.89617,565000
75
+ 99.47717,0.19854213,0.020355087,-11.329058,0.19693878,99.06134,14.217746,-4.7761006,-103.292625,-183.89185,0.563324,-1.1710415,52.609978,570000
76
+ 93.96791,0.21082443,-0.019607067,-13.620179,0.23840094,93.53829,13.341354,0.44965428,-98.26929,-194.24696,0.88882697,-0.8811726,52.785988,575000
77
+ 97.08873,0.20038673,0.025810106,-11.021286,0.19237024,96.670166,12.322398,-6.5810256,-100.01922,-186.84222,3.2572615,-3.1786613,93.59266,580000
78
+ 99.119995,0.18664584,-0.0020291524,-12.616219,0.2202766,98.7151,15.008262,0.5094697,-103.41986,-186.90839,0.4659963,-1.2349048,59.09327,585000
79
+ 98.885666,0.20326236,-0.0037335213,-12.710922,0.22499524,98.461136,10.66067,0.2584749,-103.33437,-184.34279,0.5142447,-0.7345837,45.781082,590000
80
+ 97.10636,0.20016071,0.0078133,-12.045544,0.2070946,96.6913,12.601805,-3.7903326,-101.05985,-175.7221,0.93101054,-0.9833789,58.653236,595000
81
+ 92.69583,0.19493331,0.011370296,-11.835869,0.20263667,92.286896,12.2004385,-1.50473,-96.74457,-179.48283,0.80195814,-0.76226634,41.898224,600000
82
+ 96.7689,0.19045278,-0.00032607355,-12.518959,0.21531154,96.363464,15.082018,-1.1828538,-100.419395,-185.94722,1.7004442,-1.5880386,70.48593,605000
83
+ 100.978004,0.21194842,0.0048114173,-12.223032,0.21233538,100.548904,14.865462,-1.2003509,-103.99081,-178.61853,0.50217426,-0.47013068,43.852295,610000
84
+ 96.39523,0.19218355,-0.01201133,-13.204086,0.22525454,95.9898,15.579315,-5.719487,-100.30284,-176.87817,0.64583755,-0.77532834,58.563423,615000
85
+ 97.46895,0.20190716,-0.007109236,-12.917715,0.21985102,97.054306,14.730883,-6.9476438,-101.0094,-181.2802,0.62570894,-0.4324931,44.96777,620000
86
+ 91.41616,0.18742393,0.0016213772,-12.405298,0.21238959,91.014725,13.397905,2.4210954,-95.6568,-195.26028,1.1223907,-2.3732648,91.49403,625000
87
+ 92.86538,0.17850384,-0.00976491,-13.069395,0.22413518,92.4725,12.915317,2.2094488,-96.06704,-179.6738,0.9774584,-0.82771474,56.155495,630000
88
+ 97.16791,0.1749259,-0.005356047,-12.80888,0.2221089,96.77623,16.576202,-1.8786843,-100.398735,-197.19804,0.68039346,-0.6022853,48.594063,635000
89
+ 91.032745,0.21544379,-0.010187798,-13.1044035,0.22088724,90.6066,17.67761,-2.7024894,-94.89996,-185.80748,0.93691355,-0.94662374,67.9303,640000
90
+ 96.91459,0.18290232,-0.004434367,-12.75839,0.21895313,96.517166,10.526415,-0.8988881,-100.79792,-189.10696,0.80707514,-0.73392785,42.116062,645000
91
+ 89.92172,0.2283191,-0.0024608846,-12.64592,0.21326886,89.4826,15.54274,0.8789863,-93.36523,-182.84052,1.4404923,-0.65669423,65.38707,650000
92
+ 93.882454,0.23276907,-0.019054191,-13.63269,0.22933,93.4394,11.913089,7.9470644,-97.28379,-186.13687,1.3415191,-1.6438317,60.858982,655000
93
+ 91.04675,0.22117695,0.0152726555,-11.596546,0.19603664,90.614265,14.648636,-5.7407303,-95.66656,-178.12619,0.7223559,-0.8267481,62.805084,660000
94
+ 93.498436,0.20861232,0.003915936,-12.265543,0.20486093,93.08105,16.460321,-3.2960992,-97.09664,-182.29492,0.86724937,-0.52584934,61.12159,665000
95
+ 91.79163,0.19751763,-0.009785227,-13.082009,0.21994567,91.38396,13.827472,1.0966086,-95.717415,-170.01292,0.75192523,-0.6598349,53.060894,670000
96
+ 91.90259,0.2296434,-0.0051046894,-12.804781,0.21446365,91.463585,10.865422,-2.2053943,-95.12341,-186.66797,0.5548681,-0.5010523,50.15647,675000
97
+ 91.29799,0.190397,-0.018349785,-13.604924,0.22594076,90.899994,12.10377,-0.08709981,-94.96803,-178.6473,0.6541593,-0.97311294,55.577835,680000
98
+ 90.08467,0.21382946,-0.003422664,-12.702711,0.2144782,89.65979,12.002584,-1.9941986,-94.63219,-196.22978,1.1439602,-0.80145377,60.468624,685000
99
+ 89.51065,0.20019987,-0.008286612,-12.998247,0.21618073,89.102554,15.148002,5.7550926,-93.57145,-182.58557,0.6980976,-0.69148105,54.453827,690000
100
+ 85.13675,0.22236139,0.025544738,-10.975828,0.18395212,84.704895,14.361011,2.518338,-89.16363,-186.72763,0.4995863,-0.4983075,46.942955,695000
101
+ 87.48237,0.23108757,0.00030294416,-12.481717,0.20681977,87.04416,9.668177,0.8420371,-91.21854,-192.87311,0.56080806,-0.4799571,40.62745,700000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/edit_alpha_loss,actor/edit_entropy,actor/edit_entropy_loss,actor/edit_q_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 144.48218,0.20084155,0.007955507,-11.939722,0.16953468,144.10385,5.6320925,-61.609184,-147.72014,-192.55522,0.3365969,-0.3545817,34.435097,205000
3
+ 141.52284,0.20601317,0.0051709497,-12.13455,0.17169836,141.13997,8.522275,-49.670933,-144.36105,-189.64992,5.1706257,-7.740093,86.80667,210000
4
+ 141.91428,0.17490241,0.01826083,-11.226896,0.16103359,141.56009,8.085265,-51.68727,-144.41907,-189.92767,0.3219849,-0.34089342,31.617275,215000
5
+ 139.75023,0.18226436,-0.02458897,-14.171362,0.20848817,139.38406,7.448753,-39.921883,-142.92554,-199.56168,0.4707362,-0.34605148,39.64032,220000
6
+ 135.58205,0.21704067,-0.0012576939,-12.583085,0.1904755,135.17578,12.413958,-25.195766,-138.71,-191.81935,0.7280265,-0.64803606,59.958717,225000
7
+ 130.08755,0.18765236,0.015086443,-11.597219,0.19380215,129.69101,15.468149,-49.83012,-134.03163,-192.93794,1.0398954,-0.97762054,54.171432,230000
8
+ 130.44162,0.1888678,0.006047253,-12.134399,0.20071024,130.04599,11.8002,-42.18964,-133.5037,-189.61465,3.6813872,-3.652266,78.41486,235000
9
+ 130.88297,0.22584003,-0.014606258,-13.386118,0.22064905,130.45108,17.989021,-44.303562,-134.64374,-197.72902,0.9195378,-0.9870174,64.79435,240000
10
+ 131.55867,0.18186271,0.025066465,-10.969579,0.17966855,131.17206,11.021298,-23.255741,-134.35143,-201.91087,0.9887526,-0.48836735,41.54718,245000
11
+ 128.80318,0.20678943,-0.015101453,-13.382331,0.22904405,128.38245,12.094199,-33.19275,-132.44287,-190.24712,0.7013745,-0.5877644,41.800476,250000
12
+ 125.54997,0.18703696,-0.020380223,-13.695589,0.23345745,125.14986,15.098124,-7.386241,-129.13432,-189.60175,1.3864138,-1.3081933,56.94703,255000
13
+ 124.31259,0.21824645,0.0005268152,-12.46993,0.21846628,123.87535,14.957232,-5.7514653,-128.47237,-195.73836,1.030421,-0.9760635,80.46483,260000
14
+ 125.89017,0.19474377,-0.008222612,-12.975603,0.22433272,125.47932,12.199797,-30.707668,-128.94447,-195.33046,0.6997693,-0.70229477,49.997604,265000
15
+ 120.81332,0.19289371,-0.0194915,-13.588592,0.24330705,120.39661,21.915207,-30.642334,-124.371666,-201.77202,0.8438717,-0.813125,71.765045,270000
16
+ 122.494354,0.20799544,-0.030378412,-14.261794,0.24591446,122.07082,20.9703,-20.236235,-126.33733,-197.22522,2.4760046,-2.0115874,105.5294,275000
17
+ 123.49063,0.20606653,-0.018395767,-13.5148,0.24498925,123.05797,17.570011,-7.2122307,-127.25187,-196.16934,1.0048642,-0.96069825,80.91629,280000
18
+ 121.554375,0.19578737,0.0108189965,-11.902279,0.21543612,121.13233,13.894259,-36.35514,-125.29781,-197.84816,0.87089163,-1.0272144,64.01187,285000
19
+ 119.0697,0.19609824,-0.019701831,-13.591909,0.24524516,118.648056,16.67483,-9.279862,-122.77602,-191.60829,0.66713595,-0.71127427,57.63592,290000
20
+ 120.27925,0.18039733,-0.00013375818,-12.507637,0.21906422,119.87993,16.382938,-2.3988245,-123.41537,-189.57196,3.4317386,-3.420048,68.78206,295000
21
+ 115.216484,0.21515399,-0.012243445,-13.200209,0.23081124,114.78276,9.70177,-10.437784,-118.66335,-193.57097,0.64383346,-0.6483637,43.586178,300000
22
+ 119.501076,0.17617288,-0.008795963,-13.009455,0.22461402,119.109085,17.875471,-15.194057,-123.814514,-188.69203,1.0821308,-1.0835013,75.81144,305000
23
+ 118.00852,0.19232787,0.008458496,-12.027052,0.21509925,117.592636,16.713726,3.5033665,-121.50606,-186.2886,2.353953,-1.5965722,81.40209,310000
24
+ 113.55228,0.17097896,0.018878518,-11.43467,0.20263179,113.15979,12.901244,1.3406298,-116.846756,-186.32684,0.79442936,-0.86039066,47.06075,315000
25
+ 116.36646,0.19617718,0.008543284,-12.002956,0.20630918,115.95544,19.114908,-9.321144,-119.55932,-196.51677,1.0275877,-1.4465806,55.844055,320000
26
+ 117.38713,0.21147352,-0.008250286,-12.973329,0.22612973,116.95778,14.150728,-5.901023,-121.19329,-182.08931,0.83120906,-0.8294971,44.850304,325000
27
+ 116.75811,0.19610855,-0.0043269587,-12.74073,0.22900574,116.337326,16.160324,-5.6663594,-120.59756,-198.87804,2.15585,-2.2830417,53.35273,330000
28
+ 116.94549,0.19901495,0.009186578,-11.981067,0.21209855,116.52519,11.759593,1.6414704,-120.41815,-186.79749,0.53586686,-0.5250851,50.5316,335000
29
+ 108.93243,0.18757223,-0.051170416,-15.334039,0.27686608,108.519165,16.279835,-4.7676296,-113.5625,-183.38005,0.59261274,-0.790006,54.269386,340000
30
+ 113.84219,0.20547168,0.0011042095,-12.437635,0.22021721,113.4154,13.960497,-11.343479,-117.24744,-197.81271,0.9424458,-0.8763122,74.27308,345000
31
+ 113.14261,0.19256692,0.01456056,-11.682483,0.20807327,112.72741,13.435145,-4.731493,-116.97102,-193.97385,0.6362939,-0.5244417,47.549667,350000
32
+ 112.658356,0.19187821,0.050226495,-9.744099,0.17758687,112.23866,15.970774,-8.040866,-115.52478,-187.88014,1.6573689,-1.9955028,85.72754,355000
33
+ 113.9489,0.22773285,0.02687861,-11.013138,0.19908895,113.4952,14.736795,-6.699558,-117.49114,-186.91785,3.7270505,-3.7050714,107.29452,360000
34
+ 112.526695,0.18453003,-0.008910083,-12.991556,0.23548856,112.115585,13.551719,1.7961043,-116.11182,-190.64087,0.48566732,-0.54164183,50.633957,365000
35
+ 110.87313,0.20040402,0.03266639,-10.686939,0.19254938,110.44751,13.552001,-8.706027,-114.829704,-188.37375,0.9943002,-0.8764734,51.54306,370000
36
+ 113.31839,0.22617154,0.040899754,-10.241089,0.18542476,112.86589,20.346548,-2.9180305,-116.29736,-193.89908,1.061439,-0.9535161,74.86721,375000
37
+ 112.10307,0.18414056,0.030142447,-10.838998,0.19669688,111.69209,15.630881,2.9794111,-115.29461,-196.13448,1.0509855,-1.1081816,59.27148,380000
38
+ 107.93893,0.20868012,-0.03285881,-14.293082,0.26192534,107.50118,16.14296,-5.8019753,-111.6614,-179.94127,0.7113738,-0.70418465,46.92609,385000
39
+ 107.14751,0.18791865,-0.017461417,-13.463472,0.24400422,106.73305,15.503365,-10.185286,-110.75378,-200.5079,1.0120332,-0.7968678,60.829765,390000
40
+ 108.76094,0.18286063,-0.0035371901,-12.691629,0.23426835,108.34735,11.668123,-4.2940083,-112.68676,-201.29973,0.5523828,-0.5761741,51.239532,395000
41
+ 108.6889,0.17124566,-0.0048458534,-12.768627,0.23033744,108.29216,9.676522,-2.3043008,-112.710815,-198.99835,0.5341521,-0.55172676,47.346535,400000
42
+ 107.85487,0.2022472,-0.019386478,-13.569939,0.245877,107.42613,19.12713,-3.333591,-111.87544,-194.56795,1.1276473,-1.1018034,79.25743,405000
43
+ 109.1956,0.19780378,-0.021385392,-13.668522,0.2501508,108.76903,13.238149,-7.897752,-112.656166,-184.45027,0.4505389,-0.57169324,49.759193,410000
44
+ 108.95648,0.21866512,0.011095352,-11.880872,0.21291624,108.51381,12.348601,2.1229436,-112.45379,-198.30408,1.5401742,-0.936708,61.596863,415000
45
+ 107.78601,0.19296041,0.038201857,-10.429166,0.19239277,107.36246,14.963687,-5.8542953,-112.3101,-193.4103,0.7105955,-0.45953342,53.192596,420000
46
+ 100.86755,0.21008077,0.02927794,-10.926798,0.20335221,100.424835,18.414717,-1.1180243,-104.40838,-180.58965,0.7808968,-0.8466123,55.266632,425000
47
+ 106.99209,0.23280206,0.04400285,-10.078108,0.18310702,106.53217,12.4727545,0.22057597,-109.62371,-189.80302,0.7959405,-0.7455131,56.99437,430000
48
+ 102.15905,0.19823489,0.03952041,-10.32045,0.1871342,101.73416,14.295875,-7.1629725,-105.39282,-183.49532,0.5814135,-0.6473388,52.314888,435000
49
+ 105.74219,0.23047909,-0.00510736,-12.786837,0.22768006,105.28914,13.682334,1.91177,-109.62107,-194.26242,1.0837262,-1.1873109,61.283512,440000
50
+ 105.57046,0.21301453,-0.014497222,-13.302532,0.24030161,105.13164,15.52254,-2.4786177,-109.77361,-192.06009,0.6005032,-0.58952963,56.71501,445000
51
+ 96.02997,0.20390232,0.0068056514,-12.115505,0.21444741,95.60481,15.363355,-0.7407328,-100.571915,-188.8019,3.265701,-3.1980455,124.76698,450000
52
+ 107.834236,0.19974846,0.016163357,-11.605266,0.20964888,107.408676,12.720616,1.7086813,-111.479065,-191.27725,0.92290133,-0.8774392,56.13313,455000
53
+ 102.61572,0.21998237,-0.023953574,-13.807033,0.25303715,102.16666,14.961654,4.182927,-107.32101,-175.1483,1.3203807,-0.94046956,68.59372,460000
54
+ 105.71762,0.19785048,0.0053135836,-12.204096,0.2191503,105.29531,11.124604,0.13958555,-109.354935,-196.7954,0.33575726,-0.30397153,43.54039,465000
55
+ 104.55611,0.20837197,-0.0059245178,-12.830792,0.22980048,104.12386,15.764697,-0.1866479,-108.480385,-178.34082,0.55118746,-0.7164967,61.12774,470000
56
+ 101.89255,0.19421902,0.03815691,-10.404072,0.18940881,101.470764,18.49876,-3.1212564,-105.305984,-198.9275,0.6578603,-0.61028916,54.848602,475000
57
+ 104.3254,0.22101441,-0.0039160107,-12.719625,0.22679606,103.8815,15.808222,2.3985164,-108.30929,-185.74664,0.6763765,-0.63784397,55.039986,480000
58
+ 100.457726,0.17040385,0.015365672,-11.646547,0.20968594,100.06227,14.231496,-2.5880926,-104.08529,-186.18611,0.73227197,-0.68519914,66.28463,485000
59
+ 95.98286,0.19375272,-0.018650683,-13.547211,0.24127401,95.56648,12.929675,-1.7087694,-99.71756,-189.89651,1.4537938,-1.0739446,62.959198,490000
60
+ 96.95832,0.18100323,0.02298829,-11.199713,0.19800413,96.55633,15.424746,2.1550176,-100.73403,-187.70694,0.65347666,-0.66966665,51.564484,495000
61
+ 103.30666,0.18409148,0.011005498,-11.886796,0.21333864,102.898224,11.001643,4.4614487,-106.8218,-186.98354,1.0446597,-1.1974869,57.441597,500000
62
+ 104.11237,0.2119989,0.0064724083,-12.141982,0.2195082,103.6744,12.966901,-4.852639,-107.65192,-186.69624,0.6619718,-0.7371205,51.73815,505000
63
+ 101.219154,0.22665215,-0.029118562,-14.130408,0.25236452,100.76926,16.068237,2.7447135,-105.83877,-187.89012,1.6782681,-1.1656168,81.72133,510000
64
+ 99.659676,0.1991556,-0.003305091,-12.686611,0.22469395,99.23913,18.469042,0.37632442,-103.0979,-173.2029,1.4742724,-1.6946459,71.09447,515000
65
+ 101.53622,0.19294938,-0.013327824,-13.24182,0.23790753,101.11869,21.168392,0.3276844,-105.72636,-176.60555,0.7084468,-0.78685445,52.149307,520000
66
+ 100.001854,0.19316767,-0.015034795,-13.338364,0.23920357,99.58452,15.459645,-6.502727,-103.466896,-193.10562,0.8794011,-0.56086475,50.482197,525000
67
+ 94.66868,0.21223928,0.009364967,-11.976281,0.21415591,94.23292,12.669234,1.1424009,-98.52688,-179.6625,0.8318671,-0.8459036,47.53846,530000
68
+ 98.11875,0.24313857,0.031759333,-10.728203,0.19230224,97.65155,11.386756,-1.8942977,-101.29712,-195.2967,1.2640833,-1.1816268,49.766186,535000
69
+ 100.56572,0.1918727,-0.018083632,-13.522186,0.2392228,100.15271,10.468319,2.2365003,-103.838585,-178.03792,0.5896302,-1.004943,60.095757,540000
70
+ 104.29299,0.20302548,-0.020324063,-13.643448,0.24250366,103.86779,13.617067,0.26236588,-108.511635,-182.53113,1.6690643,-1.5379288,70.94473,545000
71
+ 93.35487,0.18078624,0.020062627,-11.357159,0.19937538,92.95464,12.353987,1.9561225,-96.49399,-195.6002,0.57203656,-0.49931806,49.33632,550000
72
+ 100.783035,0.2266238,0.05234677,-9.556952,0.16998556,100.33408,15.639102,-4.6070056,-103.794106,-179.04424,0.9387619,-0.981881,56.830452,555000
73
+ 93.595375,0.1952857,0.015811564,-11.615412,0.20761956,93.17667,13.199035,-0.6915468,-97.88607,-194.18123,1.2509279,-1.4785067,69.604866,560000
74
+ 100.571014,0.21253684,-0.013409591,-13.257418,0.23471403,100.13718,18.589264,-2.3848374,-104.782585,-195.90927,0.9690139,-1.058016,65.89617,565000
75
+ 99.47717,0.19854213,0.020355087,-11.329058,0.19693878,99.06134,14.217746,-4.7761006,-103.292625,-183.89185,0.563324,-1.1710415,52.609978,570000
76
+ 93.96791,0.21082443,-0.019607067,-13.620179,0.23840094,93.53829,13.341354,0.44965428,-98.26929,-194.24696,0.88882697,-0.8811726,52.785988,575000
77
+ 97.08873,0.20038673,0.025810106,-11.021286,0.19237024,96.670166,12.322398,-6.5810256,-100.01922,-186.84222,3.2572615,-3.1786613,93.59266,580000
78
+ 99.119995,0.18664584,-0.0020291524,-12.616219,0.2202766,98.7151,15.008262,0.5094697,-103.41986,-186.90839,0.4659963,-1.2349048,59.09327,585000
79
+ 98.885666,0.20326236,-0.0037335213,-12.710922,0.22499524,98.461136,10.66067,0.2584749,-103.33437,-184.34279,0.5142447,-0.7345837,45.781082,590000
80
+ 97.10636,0.20016071,0.0078133,-12.045544,0.2070946,96.6913,12.601805,-3.7903326,-101.05985,-175.7221,0.93101054,-0.9833789,58.653236,595000
81
+ 92.69583,0.19493331,0.011370296,-11.835869,0.20263667,92.286896,12.2004385,-1.50473,-96.74457,-179.48283,0.80195814,-0.76226634,41.898224,600000
82
+ 96.7689,0.19045278,-0.00032607355,-12.518959,0.21531154,96.363464,15.082018,-1.1828538,-100.419395,-185.94722,1.7004442,-1.5880386,70.48593,605000
83
+ 100.978004,0.21194842,0.0048114173,-12.223032,0.21233538,100.548904,14.865462,-1.2003509,-103.99081,-178.61853,0.50217426,-0.47013068,43.852295,610000
84
+ 96.39523,0.19218355,-0.01201133,-13.204086,0.22525454,95.9898,15.579315,-5.719487,-100.30284,-176.87817,0.64583755,-0.77532834,58.563423,615000
85
+ 97.46895,0.20190716,-0.007109236,-12.917715,0.21985102,97.054306,14.730883,-6.9476438,-101.0094,-181.2802,0.62570894,-0.4324931,44.96777,620000
86
+ 91.41616,0.18742393,0.0016213772,-12.405298,0.21238959,91.014725,13.397905,2.4210954,-95.6568,-195.26028,1.1223907,-2.3732648,91.49403,625000
87
+ 92.86538,0.17850384,-0.00976491,-13.069395,0.22413518,92.4725,12.915317,2.2094488,-96.06704,-179.6738,0.9774584,-0.82771474,56.155495,630000
88
+ 97.16791,0.1749259,-0.005356047,-12.80888,0.2221089,96.77623,16.576202,-1.8786843,-100.398735,-197.19804,0.68039346,-0.6022853,48.594063,635000
89
+ 91.032745,0.21544379,-0.010187798,-13.1044035,0.22088724,90.6066,17.67761,-2.7024894,-94.89996,-185.80748,0.93691355,-0.94662374,67.9303,640000
90
+ 96.91459,0.18290232,-0.004434367,-12.75839,0.21895313,96.517166,10.526415,-0.8988881,-100.79792,-189.10696,0.80707514,-0.73392785,42.116062,645000
91
+ 89.92172,0.2283191,-0.0024608846,-12.64592,0.21326886,89.4826,15.54274,0.8789863,-93.36523,-182.84052,1.4404923,-0.65669423,65.38707,650000
92
+ 93.882454,0.23276907,-0.019054191,-13.63269,0.22933,93.4394,11.913089,7.9470644,-97.28379,-186.13687,1.3415191,-1.6438317,60.858982,655000
93
+ 91.04675,0.22117695,0.0152726555,-11.596546,0.19603664,90.614265,14.648636,-5.7407303,-95.66656,-178.12619,0.7223559,-0.8267481,62.805084,660000
94
+ 93.498436,0.20861232,0.003915936,-12.265543,0.20486093,93.08105,16.460321,-3.2960992,-97.09664,-182.29492,0.86724937,-0.52584934,61.12159,665000
95
+ 91.79163,0.19751763,-0.009785227,-13.082009,0.21994567,91.38396,13.827472,1.0966086,-95.717415,-170.01292,0.75192523,-0.6598349,53.060894,670000
96
+ 91.90259,0.2296434,-0.0051046894,-12.804781,0.21446365,91.463585,10.865422,-2.2053943,-95.12341,-186.66797,0.5548681,-0.5010523,50.15647,675000
97
+ 91.29799,0.190397,-0.018349785,-13.604924,0.22594076,90.899994,12.10377,-0.08709981,-94.96803,-178.6473,0.6541593,-0.97311294,55.577835,680000
98
+ 90.08467,0.21382946,-0.003422664,-12.702711,0.2144782,89.65979,12.002584,-1.9941986,-94.63219,-196.22978,1.1439602,-0.80145377,60.468624,685000
99
+ 89.51065,0.20019987,-0.008286612,-12.998247,0.21618073,89.102554,15.148002,5.7550926,-93.57145,-182.58557,0.6980976,-0.69148105,54.453827,690000
100
+ 85.13675,0.22236139,0.025544738,-10.975828,0.18395212,84.704895,14.361011,2.518338,-89.16363,-186.72763,0.4995863,-0.4983075,46.942955,695000
101
+ 87.48237,0.23108757,0.00030294416,-12.481717,0.20681977,87.04416,9.668177,0.8420371,-91.21854,-192.87311,0.56080806,-0.4799571,40.62745,700000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62bbcc8c81497d9882ec160845365b95ec7859f184a364269ebe0bc016dfd735
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e38dd0b35ce8e24d076cb97f7d87220d2af5fc58a1506cb049b82f7177202b44
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a04848e941e9b60c09292419936215168f6b0248cdd05165fba54a6edca024e2
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21bd6a6c6997a0892cd9d0b8ce9d5a86064a8058744d837cf6fef6078d8cb33c
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77efe5d3cbe9cc1b8e1b88e774f025eafffcfa76f57679f063e5cbc9b26533bb
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:836f7066e2780c278b419aaa3ecbb85be5da52abbf8b3af02ab6c6ef5802817e
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d23d7bfe2aacc8a2f618249df608c92eda94876046da4c1b7ed5c04f97e1c6a8
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:739a9f64a402139aa13e2eacaf65cdd6884d3ebd0e4b911c128b3b6adc331963
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e98831c540fdd7e8bafb50c183e6c9e4b5d672bbb827b145ac86e6833029596
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29433c079885556fe949cf8c4b20a90880492e462a261ad4a256b75b3404171c
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260318_164324/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/vb0ppa8i