Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1150000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1200000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,0.030245478438446015,0.00013611886789569234,0.03169655133617692,0.0018991419528869699,30.90605146855988,10.397999999999316,0.9,4737.02,-0.1,-288.26,205.96,0.6546712255477906,750000
|
| 3 |
+
0.0,0.0,-0.00468531642006471,0.015276324424231129,-0.002373038715385243,0.00523673585236507,32.876848819645346,8.634999999999557,0.94,14967.42,-0.12,-262.62,170.7,0.5572284841537476,800000
|
| 4 |
+
0.0,0.0,0.001247494777063081,-0.004708303403925829,0.0034805983980222078,0.018201916043237714,32.4535673462351,6.924999999999643,0.96,22953.56,-0.06,-199.5,136.5,0.4375193691253662,850000
|
| 5 |
+
0.0,0.0,-0.010012418060484076,0.024496193476571636,-0.007013926932615891,0.01656819980373933,32.591870110702125,6.9469999999995,0.92,30351.38,-0.1,-210.78,136.94,0.49802966594696046,900000
|
| 6 |
+
0.0,0.0,-0.0037090974295882063,0.02004772704803898,-0.0006909763714034401,0.015188509478589131,33.03661393933547,7.060999999999789,0.96,37543.2,-0.08,-219.8,139.22,0.5623514461517334,950000
|
| 7 |
+
0.0,0.0,-0.020077744340313074,0.024221298427847118,-0.016719707254095974,0.022895473449917544,33.43338571032952,5.104999999999699,0.98,43379.82,-0.02,-151.84,100.1,0.45555145263671876,1000000
|
| 8 |
+
0.0,0.0,-0.01915823488340761,0.039437638671922,-0.01535511321108981,0.031133158376878974,33.874854005787626,5.538999999999686,0.96,48827.0,-0.08,-170.5,108.78,0.46745193004608154,1050000
|
| 9 |
+
0.0,0.0,-0.01611123581102221,0.0426731750942223,-0.012031777741379833,0.035282312040589424,34.30424185291529,4.3449999999998115,1.0,54270.0,0.0,-123.82,84.9,0.36405004978179933,1100000
|
| 10 |
+
0.0,0.0,-0.02527964972682423,0.047093530901362604,-0.021075403372711878,0.039831817254290094,35.08127501635607,4.317999999999841,1.0,58803.22,0.0,-128.1,84.36,0.37462717056274414,1150000
|
| 11 |
+
0.0,0.0,-0.029930038263050386,0.041803747515132196,-0.025488815470290218,0.03952240427260918,33.53872226877643,4.637999999999736,0.98,62994.12,-0.02,-141.98,90.76,0.38585428714752196,1200000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,0.030245478438446015,0.00013611886789569234,0.03169655133617692,0.0018991419528869699,30.90605146855988,10.397999999999316,0.9,4737.02,-0.1,-288.26,205.96,0.6546712255477906,750000
|
| 3 |
+
0.0,0.0,-0.00468531642006471,0.015276324424231129,-0.002373038715385243,0.00523673585236507,32.876848819645346,8.634999999999557,0.94,14967.42,-0.12,-262.62,170.7,0.5572284841537476,800000
|
| 4 |
+
0.0,0.0,0.001247494777063081,-0.004708303403925829,0.0034805983980222078,0.018201916043237714,32.4535673462351,6.924999999999643,0.96,22953.56,-0.06,-199.5,136.5,0.4375193691253662,850000
|
| 5 |
+
0.0,0.0,-0.010012418060484076,0.024496193476571636,-0.007013926932615891,0.01656819980373933,32.591870110702125,6.9469999999995,0.92,30351.38,-0.1,-210.78,136.94,0.49802966594696046,900000
|
| 6 |
+
0.0,0.0,-0.0037090974295882063,0.02004772704803898,-0.0006909763714034401,0.015188509478589131,33.03661393933547,7.060999999999789,0.96,37543.2,-0.08,-219.8,139.22,0.5623514461517334,950000
|
| 7 |
+
0.0,0.0,-0.020077744340313074,0.024221298427847118,-0.016719707254095974,0.022895473449917544,33.43338571032952,5.104999999999699,0.98,43379.82,-0.02,-151.84,100.1,0.45555145263671876,1000000
|
| 8 |
+
0.0,0.0,-0.01915823488340761,0.039437638671922,-0.01535511321108981,0.031133158376878974,33.874854005787626,5.538999999999686,0.96,48827.0,-0.08,-170.5,108.78,0.46745193004608154,1050000
|
| 9 |
+
0.0,0.0,-0.01611123581102221,0.0426731750942223,-0.012031777741379833,0.035282312040589424,34.30424185291529,4.3449999999998115,1.0,54270.0,0.0,-123.82,84.9,0.36405004978179933,1100000
|
| 10 |
+
0.0,0.0,-0.02527964972682423,0.047093530901362604,-0.021075403372711878,0.039831817254290094,35.08127501635607,4.317999999999841,1.0,58803.22,0.0,-128.1,84.36,0.37462717056274414,1150000
|
| 11 |
+
0.0,0.0,-0.029930038263050386,0.041803747515132196,-0.025488815470290218,0.03952240427260918,33.53872226877643,4.637999999999736,0.98,62994.12,-0.02,-141.98,90.76,0.38585428714752196,1200000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.6399652,150.62996,0.007441978,-0.0041644233,-13.059586,0.19752042,-150.53278,150.82332,1.993356,6.024365,-61.41215,-153.44133,-195.06921,8.017721,4.5993915,-4.846877,120.161026,705000
|
| 3 |
+
0.64234936,146.34834,0.007909991,-0.0036814057,-12.965412,0.18676886,-146.24579,146.53143,1.7161225,4.347486,-37.540314,-149.31767,-192.47234,6.0636086,5.627362,-5.5085144,101.17407,710000
|
| 4 |
+
0.64034575,145.6495,0.008618187,-0.0063432576,-13.236032,0.18098184,-145.53545,145.82414,1.7289721,4.910453,-38.268055,-148.65825,-193.70245,6.639425,2.6687353,-1.9912817,55.681793,715000
|
| 5 |
+
0.63641334,140.51756,0.009357729,-0.029424002,-15.644353,0.17801313,-140.37117,140.66615,4.6748176,7.4331217,-19.89864,-144.5689,-200.05511,12.107939,2.0195465,-2.3692784,113.14732,720000
|
| 6 |
+
0.6467866,138.09946,0.00961896,-0.007749981,-13.305698,0.16760571,-137.97147,138.25931,2.9151924,8.399887,-41.617046,-140.94556,-200.64601,11.31508,4.0702267,-4.3277254,101.39447,725000
|
| 7 |
+
0.6470323,136.83026,0.009377777,-0.0021536648,-12.729656,0.18013021,-136.71088,137.00824,2.8862615,8.3325815,-47.28584,-139.52489,-197.5553,11.218843,2.7096663,-2.9917958,109.850945,730000
|
| 8 |
+
0.6527626,138.11095,0.009351747,0.0019143516,-12.295295,0.1707747,-137.99597,138.28363,2.6370888,8.358138,-27.280106,-140.1574,-197.65193,10.995227,3.9421399,-3.4710312,142.62816,735000
|
| 9 |
+
0.6485691,138.42606,0.009522684,-0.007253988,-13.261759,0.16139024,-138.29977,138.5802,3.7915325,10.046554,-51.023315,-142.49455,-198.43317,13.838086,3.3547964,-3.5594466,107.320854,740000
|
| 10 |
+
0.6519624,137.87527,0.008972867,0.004351615,-12.015025,0.1611773,-137.76746,138.0408,2.2646878,8.279596,-34.464584,-140.6022,-197.54265,10.544284,3.7882888,-2.4462206,88.95391,745000
|
| 11 |
+
0.642359,139.53152,0.009103583,-0.005063066,-13.056162,0.15571102,-139.41269,139.68217,4.8807936,9.633966,-23.194445,-142.20546,-197.65178,14.51476,0.71627396,-0.9924114,133.17801,750000
|
| 12 |
+
0.64861554,135.82404,0.009419792,-0.011841703,-13.757109,0.19240439,-135.69446,136.0046,3.1941857,12.724948,-20.730667,-139.55273,-204.49724,15.919134,8.774209,-12.061391,209.12784,755000
|
| 13 |
+
0.6399648,134.6969,0.0093428595,-0.016156958,-14.229338,0.21462372,-134.56395,134.89537,3.2304237,9.035,-35.368694,-138.13841,-201.68102,12.265424,2.564196,-2.4756,112.37913,760000
|
| 14 |
+
0.64506435,137.42596,0.009288826,-0.009364522,-13.508149,0.18185514,-137.3005,137.59845,2.5986588,7.959253,-38.03327,-140.38232,-200.35902,10.557912,1.2116488,-1.1058456,90.75588,765000
|
| 15 |
+
0.6380181,131.32883,0.009170981,-0.0061980146,-13.175829,0.18836421,-131.20798,131.511,3.239322,8.573264,-19.106522,-133.9395,-198.8365,11.812586,6.708796,-7.285101,125.62921,770000
|
| 16 |
+
0.64746535,135.80374,0.009256274,0.0025364326,-12.225977,0.18647113,-135.69057,135.99275,2.8637853,9.560854,-8.195235,-138.84862,-200.73724,12.424639,4.4075947,-6.060534,149.40546,775000
|
| 17 |
+
0.64227295,135.51904,0.009412707,-0.0071058315,-13.254919,0.1656982,-135.39427,135.67763,3.5726883,9.476244,-12.919098,-138.80936,-201.17992,13.048932,0.8348204,-1.2209947,101.36867,780000
|
| 18 |
+
0.6393832,134.44788,0.00921552,0.0038947756,-12.077368,0.187994,-134.33656,134.63976,3.918162,10.820031,-4.6872406,-136.92627,-201.04643,14.7381935,1.5770876,-1.6131506,132.73872,785000
|
| 19 |
+
0.6420999,134.76758,0.009319492,-0.0017209813,-12.684665,0.19092649,-134.64935,134.95679,2.7624972,9.851997,0.7640542,-137.42363,-196.49063,12.614494,2.602545,-2.8813004,111.50621,790000
|
| 20 |
+
0.6457582,133.87082,0.009240372,0.010305436,-11.384738,0.15869956,-133.76561,134.03983,4.8070636,12.32708,-1.6777391,-136.40404,-198.33562,17.134144,2.9357107,-3.8260362,154.47018,795000
|
| 21 |
+
0.6388067,129.70328,0.009392777,0.0039621033,-12.078176,0.18993291,-129.58984,129.89717,16.667929,14.958774,-5.507349,-132.84639,-201.21326,31.626701,6.4294586,-5.1229296,378.947,800000
|
| 22 |
+
0.64455986,132.99115,0.009311237,0.005446124,-11.915102,0.1951417,-132.88022,133.19174,2.874521,9.312723,-5.2028227,-136.67322,-198.77179,12.187244,1.606648,-1.3553473,107.5323,805000
|
| 23 |
+
0.6422736,128.14552,0.009570788,-0.016200466,-14.192699,0.17515306,-128.00969,128.30447,3.5672905,11.471595,-9.392605,-131.5656,-202.38123,15.038885,8.117423,-7.3511224,177.55396,810000
|
| 24 |
+
0.6433419,128.90343,0.009526336,0.00096140424,-12.399079,0.18531379,-128.78532,129.0897,4.4048576,11.482181,0.08337309,-132.62561,-199.64474,15.887038,4.9076147,-4.093933,134.28865,815000
|
| 25 |
+
0.6502551,129.20847,0.009761519,0.007323243,-11.749784,0.16061103,-129.09378,129.3764,3.569388,10.516318,-4.0927734,-132.18399,-201.28163,14.085707,1.6423173,-1.5917459,127.5732,820000
|
| 26 |
+
0.6446814,131.37558,0.009322825,0.00034893377,-12.462572,0.17688714,-131.2594,131.55281,3.532832,8.996374,-2.406207,-134.63963,-199.2928,12.529206,2.014291,-1.9441289,133.74037,825000
|
| 27 |
+
0.64721817,131.84131,0.009554668,0.003256024,-12.159222,0.17455387,-131.72514,132.01912,5.0877852,11.652353,-10.576316,-135.61595,-198.56747,16.740139,3.1849527,-3.0860326,157.77979,830000
|
| 28 |
+
0.6453397,130.04822,0.009230209,-0.00095627183,-12.603602,0.1745134,-129.93188,130.22177,2.7215345,10.291263,1.2241716,-133.94621,-202.47873,13.012797,6.1706457,-6.299524,159.02301,835000
|
| 29 |
+
0.64084935,126.92525,0.009537367,-0.009708782,-13.517973,0.17995939,-126.79632,127.0955,3.0307667,9.908121,-0.79516685,-130.7631,-198.96533,12.938888,4.2857428,-3.9881723,132.00272,840000
|
| 30 |
+
0.65546834,129.61499,0.009173706,0.0068260026,-11.755917,0.16684094,-129.50714,129.78865,3.7224572,11.436128,-7.3310857,-132.4549,-199.24417,15.158585,6.1476445,-6.797014,194.6429,845000
|
| 31 |
+
0.64098686,132.26001,0.009294688,-0.0053968304,-13.080636,0.15837884,-132.13843,132.413,2.3039367,8.484801,-15.385258,-134.50342,-203.08904,10.788738,5.273377,-5.730258,128.45253,850000
|
| 32 |
+
0.6478313,128.93338,0.009321144,0.011216528,-11.296658,0.16721258,-128.8281,129.1118,2.8610492,8.918383,-8.466823,-131.53197,-203.7269,11.779432,2.9454596,-3.42423,136.57321,855000
|
| 33 |
+
0.6492537,129.1051,0.00938072,0.01026731,-11.405488,0.18059194,-128.99814,129.29596,5.082905,12.129733,-1.2686055,-132.09976,-203.16133,17.212639,5.3589997,-5.027045,187.39444,860000
|
| 34 |
+
0.63550276,128.48383,0.00946386,-0.013470848,-13.923399,0.16618153,-128.35205,128.63654,5.077002,11.0001335,-0.70482534,-131.451,-204.1331,16.077135,4.495274,-5.191594,143.43814,865000
|
| 35 |
+
0.6566656,131.52539,0.009323224,0.01663397,-10.715857,0.15464926,-131.42548,131.69667,3.1835911,9.498199,-2.646424,-134.08955,-204.39563,12.68179,1.8258946,-0.86552644,127.299736,870000
|
| 36 |
+
0.64412016,130.16954,0.009440535,0.003197818,-12.161267,0.1747391,-130.05472,130.34749,4.178552,13.522263,-8.899888,-133.1803,-204.06921,17.700815,4.4777484,-3.3986866,184.43817,875000
|
| 37 |
+
0.6443989,128.49594,0.009224106,0.013407446,-11.046477,0.17572019,-128.39404,128.68507,3.1232688,10.143659,2.9052777,-131.22801,-203.06749,13.266928,1.9489622,-1.9022636,152.25809,880000
|
| 38 |
+
0.63074386,128.56387,0.009298491,-0.022752898,-14.946945,0.14063165,-128.4249,128.68175,4.785803,11.656066,-8.058164,-131.83813,-205.03917,16.441868,1.8061006,-1.8567207,160.01138,885000
|
| 39 |
+
0.6442317,128.58682,0.009281693,-0.0046295696,-12.998785,0.16761352,-128.46616,128.74982,3.37169,11.089679,-11.585248,-131.3713,-196.8855,14.461369,3.4328735,-3.710607,126.39656,890000
|
| 40 |
+
0.64519364,125.69474,0.009499202,0.0063342173,-11.833184,0.15335318,-125.58233,125.85442,3.1347682,7.1496134,-4.020186,-128.74043,-198.20334,10.284382,1.9250258,-1.9486667,91.84657,895000
|
| 41 |
+
0.6426446,127.173645,0.009361669,0.002256682,-12.2589445,0.18344668,-127.05888,127.35935,4.7412624,12.799736,-7.038547,-131.02725,-200.16077,17.540998,2.2036493,-2.4365,163.04327,900000
|
| 42 |
+
0.6399388,126.94661,0.009385569,-0.004755646,-13.006698,0.18014127,-126.824524,127.121994,4.909626,15.566318,-8.496581,-130.07121,-195.92186,20.475945,5.287236,-5.2551184,174.73427,905000
|
| 43 |
+
0.63779473,126.26739,0.0094863465,0.0039093853,-12.0878935,0.15909421,-126.15272,126.43039,4.478255,13.123781,-3.9963746,-128.86928,-196.17088,17.602036,2.1534605,-4.8315496,186.02797,910000
|
| 44 |
+
0.6454878,129.34003,0.00938723,-0.0035451255,-12.877654,0.18055668,-129.21913,129.51704,3.117306,9.080153,-17.218676,-132.30951,-203.10294,12.197459,2.046712,-2.2278326,116.708786,915000
|
| 45 |
+
0.6422302,124.50441,0.009323686,-0.008846288,-13.448797,0.17828733,-124.37902,124.67384,4.201111,12.25677,-1.1218333,-127.91941,-197.58585,16.457882,3.9136872,-3.1602683,143.18607,920000
|
| 46 |
+
0.64021087,121.91066,0.009281595,0.006062226,-11.846855,0.16437179,-121.8007,122.0811,6.0990715,15.049962,3.8944066,-125.017876,-196.34456,21.149033,3.500462,-3.239024,194.67255,925000
|
| 47 |
+
0.644786,125.595276,0.0093422895,0.012895514,-11.119662,0.17025232,-125.491394,125.77842,6.817276,9.73454,-0.9652359,-128.84566,-206.95712,16.551815,2.1507173,-2.301363,152.67415,930000
|
| 48 |
+
0.64288694,121.231094,0.00952803,0.008221898,-11.637083,0.19055857,-121.12021,121.42988,4.5842743,10.629351,4.930255,-124.39075,-198.1186,15.213625,2.0411618,-1.6755171,193.48138,935000
|
| 49 |
+
0.6480495,124.05998,0.009059357,0.012773485,-11.090023,0.2065309,-123.95952,124.27928,5.5263057,13.419522,1.4061246,-127.204346,-200.69258,18.945827,1.689919,-1.5245591,145.0128,940000
|
| 50 |
+
0.6511786,124.84674,0.00928076,0.002270466,-12.255358,0.18170053,-124.733,125.030716,7.450448,12.994989,-9.005265,-127.835594,-201.25961,20.445438,6.303255,-5.7909985,203.43564,945000
|
| 51 |
+
0.64310426,117.26034,0.009498318,0.007908785,-11.667349,0.17451096,-117.14952,117.44276,5.955789,15.219736,-7.712293,-120.77559,-197.97006,21.175526,7.1156316,-7.8744497,220.59444,950000
|
| 52 |
+
0.651703,126.01648,0.009148379,0.001226012,-12.365986,0.1695344,-125.903336,126.18724,3.545349,9.067754,-13.766013,-129.40744,-205.36336,12.613103,2.6350546,-2.189055,129.35742,955000
|
| 53 |
+
0.64313024,120.44387,0.009256919,-0.0010328507,-12.611576,0.15393221,-120.327126,120.59677,7.247979,11.832962,3.0549827,-124.497635,-196.2892,19.08094,3.1726627,-3.438404,243.38635,960000
|
| 54 |
+
0.6394558,123.64584,0.00932082,-0.009787529,-13.550072,0.18147802,-123.51956,123.817535,5.0353656,18.827795,-5.3005047,-126.357414,-199.46487,23.863161,12.038689,-9.126397,242.81609,965000
|
| 55 |
+
0.63721246,124.655594,0.0091409655,-0.00041702797,-12.545622,0.17079978,-124.540924,124.82597,4.4291286,12.463872,-8.521346,-126.765114,-194.97328,16.893002,1.5191909,-1.6291854,136.8415,970000
|
| 56 |
+
0.6397903,124.07879,0.009181071,-0.011203054,-13.720234,0.16497211,-123.95282,124.23256,4.3115516,15.058179,-6.524496,-125.94103,-203.86855,19.36973,1.9265403,-3.1771424,183.5629,975000
|
| 57 |
+
0.6449619,126.481735,0.009062546,-0.0009479333,-12.604599,0.16729416,-126.36751,126.64809,6.01037,10.769762,-10.551891,-130.03445,-203.86125,16.780132,2.4918592,-2.373971,201.46684,980000
|
| 58 |
+
0.6468095,120.753265,0.009219097,0.0008313203,-12.409826,0.1613102,-120.63886,120.915405,3.7938745,9.473041,-5.9246945,-122.78163,-199.67693,13.266915,4.9888144,-4.2119994,131.29764,985000
|
| 59 |
+
0.6351343,118.57184,0.009111627,-0.0149091305,-14.136275,0.16454609,-118.44302,118.72147,7.1792665,13.669446,-6.0241103,-121.483696,-206.78264,20.848713,3.856965,-3.550459,216.19415,990000
|
| 60 |
+
0.638468,119.479614,0.009169005,0.005263598,-11.925936,0.18421283,-119.37026,119.66909,9.711718,17.86645,6.0359545,-122.29988,-200.24715,27.578167,3.5069063,-4.323081,292.20493,995000
|
| 61 |
+
0.6436029,125.871506,0.009214469,0.007972184,-11.634819,0.13289818,-125.76429,126.012375,6.505573,12.155992,8.654337,-128.52867,-206.0692,18.661564,3.3392067,-2.7320518,165.03264,1000000
|
| 62 |
+
0.6431514,126.82629,0.009052112,-0.005345357,-13.090509,0.14898214,-126.707794,126.96992,6.4889984,9.911747,-7.0914135,-129.74706,-199.92456,16.400745,1.4613732,-1.6025965,158.20789,1005000
|
| 63 |
+
0.64592665,122.79101,0.008986984,0.0001038335,-12.488446,0.14421284,-122.67877,122.935326,9.7251005,17.512419,9.443184,-126.27266,-204.4824,27.237518,4.529858,-4.699518,298.22696,1010000
|
| 64 |
+
0.641336,125.733345,0.009046481,0.0028280606,-12.187386,0.1599535,-125.62309,125.896126,5.2026258,15.14704,-10.193426,-128.47691,-201.45389,20.349667,1.8537345,-2.0673993,173.47496,1015000
|
| 65 |
+
0.63401616,121.418846,0.009321384,-0.010190855,-13.593277,0.17739025,-121.292145,121.586044,5.4529533,12.63087,0.6501003,-124.60589,-202.69028,18.083824,2.633357,-3.061808,167.95174,1020000
|
| 66 |
+
0.6495139,122.6859,0.008988562,0.010677432,-11.312109,0.1784961,-122.58423,122.87508,4.181917,11.206926,-0.37009484,-124.95827,-204.42694,15.388844,2.3916612,-2.2953718,137.00446,1025000
|
| 67 |
+
0.6412297,119.19217,0.008899503,0.00697735,-11.715984,0.16242287,-119.087906,119.36157,6.2200317,14.5052185,-2.2101605,-122.02984,-202.04897,20.72525,7.0335693,-8.304405,256.13074,1030000
|
| 68 |
+
0.64816236,120.73066,0.00879877,-0.0012217278,-12.638852,0.17041947,-120.61945,120.89986,4.7010016,10.829595,-2.2926445,-123.41614,-202.69545,15.530596,2.1594076,-2.1999135,163.16992,1035000
|
| 69 |
+
0.6485313,122.32833,0.009060118,0.012100244,-11.16445,0.12534398,-122.22718,122.465775,6.868324,24.0452,-3.0470943,-125.239784,-204.89436,30.913525,10.881,-12.683091,365.4353,1040000
|
| 70 |
+
0.6406615,127.33424,0.009098207,-0.0029472236,-12.823935,0.15980822,-127.217575,127.491104,5.4638276,9.355411,-1.3280982,-130.38306,-209.36145,14.819239,1.0635548,-1.0180377,133.38478,1045000
|
| 71 |
+
0.6431515,117.55626,0.008985502,0.018764593,-10.411681,0.16723211,-117.46271,117.742256,5.80049,12.332784,-3.2698796,-119.99438,-203.082,18.133274,1.6859559,-1.6478467,166.4632,1050000
|
| 72 |
+
0.64663327,123.04736,0.009013889,0.010243506,-11.363586,0.14202729,-122.94494,123.19964,4.965732,16.60391,-2.3551557,-126.003044,-206.97897,21.569643,2.8007243,-4.0174966,211.7115,1055000
|
| 73 |
+
0.6442242,115.295975,0.008986479,0.009844662,-11.404503,0.14607507,-115.19349,115.45189,5.1965623,16.74655,1.5760707,-118.7264,-207.23218,21.943111,2.6920686,-2.8448684,201.50403,1060000
|
| 74 |
+
0.6393934,123.70038,0.009166309,-0.017361557,-14.394062,0.16265428,-123.568436,123.845665,3.6160474,12.577919,-2.1845462,-125.97727,-206.28252,16.193966,1.4741958,-1.6489983,155.27928,1065000
|
| 75 |
+
0.6430768,120.15047,0.009067798,-0.0022624268,-12.749501,0.15993023,-120.03486,120.30813,9.07125,12.631204,1.0687145,-122.953575,-204.1062,21.702454,2.6803741,-2.5919428,194.23174,1070000
|
| 76 |
+
0.6445008,117.8512,0.009075134,0.0021487512,-12.2632265,0.16248877,-117.7399,118.01584,7.0098796,16.008215,1.4281921,-121.51143,-208.62712,23.018095,8.751586,-9.384328,242.74269,1075000
|
| 77 |
+
0.65046096,117.873825,0.008852489,0.023450954,-9.85092,0.16823214,-117.78662,118.06551,5.038648,16.921064,-3.4559927,-120.87598,-202.85689,21.959713,3.0602307,-3.363168,190.82669,1080000
|
| 78 |
+
0.6434744,119.3509,0.008812294,0.005576261,-11.867218,0.1463894,-119.24632,119.50287,5.414103,10.34599,2.9200203,-122.69102,-203.7399,15.760094,1.2992455,-1.1440701,156.69586,1085000
|
| 79 |
+
0.6332881,120.927185,0.008808942,-0.013748791,-14.060777,0.14988703,-120.80333,121.063324,7.2897277,17.916203,0.09635651,-123.766655,-208.48708,25.20593,8.4854355,-9.568885,280.3907,1090000
|
| 80 |
+
0.64363587,118.60824,0.008920258,-0.0055122264,-13.117945,0.15795545,-118.49123,118.76069,4.160379,10.827945,2.2171264,-122.16669,-209.33734,14.988323,1.113372,-1.4352105,132.48076,1095000
|
| 81 |
+
0.6470053,116.691696,0.009113912,0.009858234,-11.418331,0.16286854,-116.58763,116.864426,4.869993,18.055414,-1.4983546,-120.06905,-205.03075,22.925407,2.0869095,-2.533445,215.40843,1100000
|
| 82 |
+
0.64381105,120.5636,0.009032282,0.019479666,-10.343328,0.16383955,-120.47017,120.74692,4.967673,12.057758,-2.2838175,-123.11775,-206.88606,17.02543,1.3983307,-1.4608436,158.62877,1105000
|
| 83 |
+
0.641147,120.881516,0.008770132,-0.0034926517,-12.898244,0.14192674,-120.7684,121.01995,3.5765138,10.937434,-0.48328203,-123.38615,-203.82454,14.513948,1.6429541,-1.8659368,146.92435,1110000
|
| 84 |
+
0.64499515,116.68048,0.008843486,-0.0020006674,-12.726231,0.13043508,-116.56793,116.808914,5.2697024,14.193865,-8.133343,-119.54797,-207.51054,19.463568,3.6188838,-2.7531095,215.50247,1115000
|
| 85 |
+
0.64481294,118.2834,0.008762069,0.005907805,-11.825752,0.15816197,-118.17979,118.44747,4.8221974,13.75693,-1.2642927,-121.2282,-205.58162,18.579128,2.6265306,-2.621476,167.80286,1120000
|
| 86 |
+
0.648843,113.79812,0.008924771,0.008279102,-11.572346,0.17471036,-113.69484,113.98111,4.7576294,14.001288,-0.08921463,-116.73142,-207.07802,18.758919,3.2205486,-3.0653536,199.31,1125000
|
| 87 |
+
0.6534241,116.54996,0.00901529,0.021301901,-10.137136,0.15206334,-116.45857,116.72332,4.903936,13.76192,-0.3391986,-119.563286,-204.58592,18.665855,3.5787623,-3.303914,182.7084,1130000
|
| 88 |
+
0.6493373,119.51209,0.008831362,0.009395013,-11.436176,0.17248982,-119.41109,119.69398,5.607742,10.252814,-1.0966692,-121.25504,-203.25642,15.860556,2.3463595,-2.6751924,180.93805,1135000
|
| 89 |
+
0.63651764,110.757416,0.008695075,-0.009413841,-13.582664,0.18135498,-110.63931,110.92936,6.995782,15.420943,-0.87776893,-113.56602,-204.6345,22.416725,1.624832,-1.2641237,181.63391,1140000
|
| 90 |
+
0.64027953,120.73732,0.008843301,-0.006073124,-13.1867485,0.17511576,-120.620705,120.906364,4.525005,21.246851,-4.2116976,-124.808975,-206.33698,25.771856,3.8166778,-4.275342,194.12477,1145000
|
| 91 |
+
0.6476944,113.077805,0.008841113,0.010133424,-11.353829,0.14569002,-112.977425,113.23363,6.4936433,12.585855,4.52926,-115.73321,-205.40375,19.079498,2.6709132,-2.488758,195.38435,1150000
|
| 92 |
+
0.64258665,119.073975,0.00895503,-0.016029427,-14.289991,0.16087195,-118.946014,119.21882,7.100122,13.501746,1.4063656,-122.33471,-197.71037,20.601868,3.8408394,-4.341013,250.28577,1155000
|
| 93 |
+
0.6433364,113.84334,0.009020601,0.0020350327,-12.274402,0.1711415,-113.73262,114.01652,5.3910418,14.262671,-0.62449306,-116.19907,-208.1848,19.653713,1.7614827,-3.0105288,198.67708,1160000
|
| 94 |
+
0.64250344,115.421555,0.009079112,-0.008146174,-13.3972435,0.17297359,-115.29993,115.58638,12.800483,23.930128,4.1185946,-118.257034,-199.52951,36.73061,4.05628,-3.8096597,313.09235,1165000
|
| 95 |
+
0.6436531,110.91116,0.008900433,0.001668203,-12.312571,0.11992441,-110.801575,111.03276,6.0097275,13.937075,7.1140265,-113.09948,-200.16002,19.946802,2.8341112,-2.1976385,233.8071,1170000
|
| 96 |
+
0.64033985,114.935905,0.008942113,-0.005576592,-13.123632,0.14018813,-114.81854,115.07052,6.224197,16.683495,2.5274677,-118.32869,-203.18135,22.907692,2.3693988,-2.8971376,233.62556,1175000
|
| 97 |
+
0.64147836,119.90997,0.008830091,-0.014686868,-14.163275,0.18468255,-119.78491,120.07997,6.886258,23.731117,1.4195355,-123.47017,-205.64088,30.617374,7.224556,-4.6502905,426.9449,1180000
|
| 98 |
+
0.63770413,113.691345,0.008855352,-0.009772188,-13.603535,0.1487444,-113.570885,113.830315,6.701122,14.211255,4.158659,-116.49475,-208.98463,20.912376,1.47606,-2.220014,190.69266,1185000
|
| 99 |
+
0.6511342,115.96462,0.008953001,0.014697286,-10.858396,0.15459505,-115.86742,116.13391,4.33658,14.328055,10.5042095,-117.94667,-204.92564,18.664635,2.652356,-2.7399647,182.02916,1190000
|
| 100 |
+
0.6386027,106.60608,0.009015845,-0.0021253582,-12.735736,0.13437891,-106.49126,106.73833,14.264702,17.393402,-4.6719804,-109.80898,-207.09148,31.658104,3.9873161,-4.0583134,337.3333,1195000
|
| 101 |
+
0.6360383,107.42423,0.008991176,-0.015470767,-14.220661,0.14421996,-107.29637,107.55298,5.311237,14.378943,6.951978,-110.82977,-206.01114,19.69018,2.347659,-2.2013845,186.00365,1200000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.6399652,150.62996,0.007441978,-0.0041644233,-13.059586,0.19752042,-150.53278,150.82332,1.993356,6.024365,-61.41215,-153.44133,-195.06921,8.017721,4.5993915,-4.846877,120.161026,705000
|
| 3 |
+
0.64234936,146.34834,0.007909991,-0.0036814057,-12.965412,0.18676886,-146.24579,146.53143,1.7161225,4.347486,-37.540314,-149.31767,-192.47234,6.0636086,5.627362,-5.5085144,101.17407,710000
|
| 4 |
+
0.64034575,145.6495,0.008618187,-0.0063432576,-13.236032,0.18098184,-145.53545,145.82414,1.7289721,4.910453,-38.268055,-148.65825,-193.70245,6.639425,2.6687353,-1.9912817,55.681793,715000
|
| 5 |
+
0.63641334,140.51756,0.009357729,-0.029424002,-15.644353,0.17801313,-140.37117,140.66615,4.6748176,7.4331217,-19.89864,-144.5689,-200.05511,12.107939,2.0195465,-2.3692784,113.14732,720000
|
| 6 |
+
0.6467866,138.09946,0.00961896,-0.007749981,-13.305698,0.16760571,-137.97147,138.25931,2.9151924,8.399887,-41.617046,-140.94556,-200.64601,11.31508,4.0702267,-4.3277254,101.39447,725000
|
| 7 |
+
0.6470323,136.83026,0.009377777,-0.0021536648,-12.729656,0.18013021,-136.71088,137.00824,2.8862615,8.3325815,-47.28584,-139.52489,-197.5553,11.218843,2.7096663,-2.9917958,109.850945,730000
|
| 8 |
+
0.6527626,138.11095,0.009351747,0.0019143516,-12.295295,0.1707747,-137.99597,138.28363,2.6370888,8.358138,-27.280106,-140.1574,-197.65193,10.995227,3.9421399,-3.4710312,142.62816,735000
|
| 9 |
+
0.6485691,138.42606,0.009522684,-0.007253988,-13.261759,0.16139024,-138.29977,138.5802,3.7915325,10.046554,-51.023315,-142.49455,-198.43317,13.838086,3.3547964,-3.5594466,107.320854,740000
|
| 10 |
+
0.6519624,137.87527,0.008972867,0.004351615,-12.015025,0.1611773,-137.76746,138.0408,2.2646878,8.279596,-34.464584,-140.6022,-197.54265,10.544284,3.7882888,-2.4462206,88.95391,745000
|
| 11 |
+
0.642359,139.53152,0.009103583,-0.005063066,-13.056162,0.15571102,-139.41269,139.68217,4.8807936,9.633966,-23.194445,-142.20546,-197.65178,14.51476,0.71627396,-0.9924114,133.17801,750000
|
| 12 |
+
0.64861554,135.82404,0.009419792,-0.011841703,-13.757109,0.19240439,-135.69446,136.0046,3.1941857,12.724948,-20.730667,-139.55273,-204.49724,15.919134,8.774209,-12.061391,209.12784,755000
|
| 13 |
+
0.6399648,134.6969,0.0093428595,-0.016156958,-14.229338,0.21462372,-134.56395,134.89537,3.2304237,9.035,-35.368694,-138.13841,-201.68102,12.265424,2.564196,-2.4756,112.37913,760000
|
| 14 |
+
0.64506435,137.42596,0.009288826,-0.009364522,-13.508149,0.18185514,-137.3005,137.59845,2.5986588,7.959253,-38.03327,-140.38232,-200.35902,10.557912,1.2116488,-1.1058456,90.75588,765000
|
| 15 |
+
0.6380181,131.32883,0.009170981,-0.0061980146,-13.175829,0.18836421,-131.20798,131.511,3.239322,8.573264,-19.106522,-133.9395,-198.8365,11.812586,6.708796,-7.285101,125.62921,770000
|
| 16 |
+
0.64746535,135.80374,0.009256274,0.0025364326,-12.225977,0.18647113,-135.69057,135.99275,2.8637853,9.560854,-8.195235,-138.84862,-200.73724,12.424639,4.4075947,-6.060534,149.40546,775000
|
| 17 |
+
0.64227295,135.51904,0.009412707,-0.0071058315,-13.254919,0.1656982,-135.39427,135.67763,3.5726883,9.476244,-12.919098,-138.80936,-201.17992,13.048932,0.8348204,-1.2209947,101.36867,780000
|
| 18 |
+
0.6393832,134.44788,0.00921552,0.0038947756,-12.077368,0.187994,-134.33656,134.63976,3.918162,10.820031,-4.6872406,-136.92627,-201.04643,14.7381935,1.5770876,-1.6131506,132.73872,785000
|
| 19 |
+
0.6420999,134.76758,0.009319492,-0.0017209813,-12.684665,0.19092649,-134.64935,134.95679,2.7624972,9.851997,0.7640542,-137.42363,-196.49063,12.614494,2.602545,-2.8813004,111.50621,790000
|
| 20 |
+
0.6457582,133.87082,0.009240372,0.010305436,-11.384738,0.15869956,-133.76561,134.03983,4.8070636,12.32708,-1.6777391,-136.40404,-198.33562,17.134144,2.9357107,-3.8260362,154.47018,795000
|
| 21 |
+
0.6388067,129.70328,0.009392777,0.0039621033,-12.078176,0.18993291,-129.58984,129.89717,16.667929,14.958774,-5.507349,-132.84639,-201.21326,31.626701,6.4294586,-5.1229296,378.947,800000
|
| 22 |
+
0.64455986,132.99115,0.009311237,0.005446124,-11.915102,0.1951417,-132.88022,133.19174,2.874521,9.312723,-5.2028227,-136.67322,-198.77179,12.187244,1.606648,-1.3553473,107.5323,805000
|
| 23 |
+
0.6422736,128.14552,0.009570788,-0.016200466,-14.192699,0.17515306,-128.00969,128.30447,3.5672905,11.471595,-9.392605,-131.5656,-202.38123,15.038885,8.117423,-7.3511224,177.55396,810000
|
| 24 |
+
0.6433419,128.90343,0.009526336,0.00096140424,-12.399079,0.18531379,-128.78532,129.0897,4.4048576,11.482181,0.08337309,-132.62561,-199.64474,15.887038,4.9076147,-4.093933,134.28865,815000
|
| 25 |
+
0.6502551,129.20847,0.009761519,0.007323243,-11.749784,0.16061103,-129.09378,129.3764,3.569388,10.516318,-4.0927734,-132.18399,-201.28163,14.085707,1.6423173,-1.5917459,127.5732,820000
|
| 26 |
+
0.6446814,131.37558,0.009322825,0.00034893377,-12.462572,0.17688714,-131.2594,131.55281,3.532832,8.996374,-2.406207,-134.63963,-199.2928,12.529206,2.014291,-1.9441289,133.74037,825000
|
| 27 |
+
0.64721817,131.84131,0.009554668,0.003256024,-12.159222,0.17455387,-131.72514,132.01912,5.0877852,11.652353,-10.576316,-135.61595,-198.56747,16.740139,3.1849527,-3.0860326,157.77979,830000
|
| 28 |
+
0.6453397,130.04822,0.009230209,-0.00095627183,-12.603602,0.1745134,-129.93188,130.22177,2.7215345,10.291263,1.2241716,-133.94621,-202.47873,13.012797,6.1706457,-6.299524,159.02301,835000
|
| 29 |
+
0.64084935,126.92525,0.009537367,-0.009708782,-13.517973,0.17995939,-126.79632,127.0955,3.0307667,9.908121,-0.79516685,-130.7631,-198.96533,12.938888,4.2857428,-3.9881723,132.00272,840000
|
| 30 |
+
0.65546834,129.61499,0.009173706,0.0068260026,-11.755917,0.16684094,-129.50714,129.78865,3.7224572,11.436128,-7.3310857,-132.4549,-199.24417,15.158585,6.1476445,-6.797014,194.6429,845000
|
| 31 |
+
0.64098686,132.26001,0.009294688,-0.0053968304,-13.080636,0.15837884,-132.13843,132.413,2.3039367,8.484801,-15.385258,-134.50342,-203.08904,10.788738,5.273377,-5.730258,128.45253,850000
|
| 32 |
+
0.6478313,128.93338,0.009321144,0.011216528,-11.296658,0.16721258,-128.8281,129.1118,2.8610492,8.918383,-8.466823,-131.53197,-203.7269,11.779432,2.9454596,-3.42423,136.57321,855000
|
| 33 |
+
0.6492537,129.1051,0.00938072,0.01026731,-11.405488,0.18059194,-128.99814,129.29596,5.082905,12.129733,-1.2686055,-132.09976,-203.16133,17.212639,5.3589997,-5.027045,187.39444,860000
|
| 34 |
+
0.63550276,128.48383,0.00946386,-0.013470848,-13.923399,0.16618153,-128.35205,128.63654,5.077002,11.0001335,-0.70482534,-131.451,-204.1331,16.077135,4.495274,-5.191594,143.43814,865000
|
| 35 |
+
0.6566656,131.52539,0.009323224,0.01663397,-10.715857,0.15464926,-131.42548,131.69667,3.1835911,9.498199,-2.646424,-134.08955,-204.39563,12.68179,1.8258946,-0.86552644,127.299736,870000
|
| 36 |
+
0.64412016,130.16954,0.009440535,0.003197818,-12.161267,0.1747391,-130.05472,130.34749,4.178552,13.522263,-8.899888,-133.1803,-204.06921,17.700815,4.4777484,-3.3986866,184.43817,875000
|
| 37 |
+
0.6443989,128.49594,0.009224106,0.013407446,-11.046477,0.17572019,-128.39404,128.68507,3.1232688,10.143659,2.9052777,-131.22801,-203.06749,13.266928,1.9489622,-1.9022636,152.25809,880000
|
| 38 |
+
0.63074386,128.56387,0.009298491,-0.022752898,-14.946945,0.14063165,-128.4249,128.68175,4.785803,11.656066,-8.058164,-131.83813,-205.03917,16.441868,1.8061006,-1.8567207,160.01138,885000
|
| 39 |
+
0.6442317,128.58682,0.009281693,-0.0046295696,-12.998785,0.16761352,-128.46616,128.74982,3.37169,11.089679,-11.585248,-131.3713,-196.8855,14.461369,3.4328735,-3.710607,126.39656,890000
|
| 40 |
+
0.64519364,125.69474,0.009499202,0.0063342173,-11.833184,0.15335318,-125.58233,125.85442,3.1347682,7.1496134,-4.020186,-128.74043,-198.20334,10.284382,1.9250258,-1.9486667,91.84657,895000
|
| 41 |
+
0.6426446,127.173645,0.009361669,0.002256682,-12.2589445,0.18344668,-127.05888,127.35935,4.7412624,12.799736,-7.038547,-131.02725,-200.16077,17.540998,2.2036493,-2.4365,163.04327,900000
|
| 42 |
+
0.6399388,126.94661,0.009385569,-0.004755646,-13.006698,0.18014127,-126.824524,127.121994,4.909626,15.566318,-8.496581,-130.07121,-195.92186,20.475945,5.287236,-5.2551184,174.73427,905000
|
| 43 |
+
0.63779473,126.26739,0.0094863465,0.0039093853,-12.0878935,0.15909421,-126.15272,126.43039,4.478255,13.123781,-3.9963746,-128.86928,-196.17088,17.602036,2.1534605,-4.8315496,186.02797,910000
|
| 44 |
+
0.6454878,129.34003,0.00938723,-0.0035451255,-12.877654,0.18055668,-129.21913,129.51704,3.117306,9.080153,-17.218676,-132.30951,-203.10294,12.197459,2.046712,-2.2278326,116.708786,915000
|
| 45 |
+
0.6422302,124.50441,0.009323686,-0.008846288,-13.448797,0.17828733,-124.37902,124.67384,4.201111,12.25677,-1.1218333,-127.91941,-197.58585,16.457882,3.9136872,-3.1602683,143.18607,920000
|
| 46 |
+
0.64021087,121.91066,0.009281595,0.006062226,-11.846855,0.16437179,-121.8007,122.0811,6.0990715,15.049962,3.8944066,-125.017876,-196.34456,21.149033,3.500462,-3.239024,194.67255,925000
|
| 47 |
+
0.644786,125.595276,0.0093422895,0.012895514,-11.119662,0.17025232,-125.491394,125.77842,6.817276,9.73454,-0.9652359,-128.84566,-206.95712,16.551815,2.1507173,-2.301363,152.67415,930000
|
| 48 |
+
0.64288694,121.231094,0.00952803,0.008221898,-11.637083,0.19055857,-121.12021,121.42988,4.5842743,10.629351,4.930255,-124.39075,-198.1186,15.213625,2.0411618,-1.6755171,193.48138,935000
|
| 49 |
+
0.6480495,124.05998,0.009059357,0.012773485,-11.090023,0.2065309,-123.95952,124.27928,5.5263057,13.419522,1.4061246,-127.204346,-200.69258,18.945827,1.689919,-1.5245591,145.0128,940000
|
| 50 |
+
0.6511786,124.84674,0.00928076,0.002270466,-12.255358,0.18170053,-124.733,125.030716,7.450448,12.994989,-9.005265,-127.835594,-201.25961,20.445438,6.303255,-5.7909985,203.43564,945000
|
| 51 |
+
0.64310426,117.26034,0.009498318,0.007908785,-11.667349,0.17451096,-117.14952,117.44276,5.955789,15.219736,-7.712293,-120.77559,-197.97006,21.175526,7.1156316,-7.8744497,220.59444,950000
|
| 52 |
+
0.651703,126.01648,0.009148379,0.001226012,-12.365986,0.1695344,-125.903336,126.18724,3.545349,9.067754,-13.766013,-129.40744,-205.36336,12.613103,2.6350546,-2.189055,129.35742,955000
|
| 53 |
+
0.64313024,120.44387,0.009256919,-0.0010328507,-12.611576,0.15393221,-120.327126,120.59677,7.247979,11.832962,3.0549827,-124.497635,-196.2892,19.08094,3.1726627,-3.438404,243.38635,960000
|
| 54 |
+
0.6394558,123.64584,0.00932082,-0.009787529,-13.550072,0.18147802,-123.51956,123.817535,5.0353656,18.827795,-5.3005047,-126.357414,-199.46487,23.863161,12.038689,-9.126397,242.81609,965000
|
| 55 |
+
0.63721246,124.655594,0.0091409655,-0.00041702797,-12.545622,0.17079978,-124.540924,124.82597,4.4291286,12.463872,-8.521346,-126.765114,-194.97328,16.893002,1.5191909,-1.6291854,136.8415,970000
|
| 56 |
+
0.6397903,124.07879,0.009181071,-0.011203054,-13.720234,0.16497211,-123.95282,124.23256,4.3115516,15.058179,-6.524496,-125.94103,-203.86855,19.36973,1.9265403,-3.1771424,183.5629,975000
|
| 57 |
+
0.6449619,126.481735,0.009062546,-0.0009479333,-12.604599,0.16729416,-126.36751,126.64809,6.01037,10.769762,-10.551891,-130.03445,-203.86125,16.780132,2.4918592,-2.373971,201.46684,980000
|
| 58 |
+
0.6468095,120.753265,0.009219097,0.0008313203,-12.409826,0.1613102,-120.63886,120.915405,3.7938745,9.473041,-5.9246945,-122.78163,-199.67693,13.266915,4.9888144,-4.2119994,131.29764,985000
|
| 59 |
+
0.6351343,118.57184,0.009111627,-0.0149091305,-14.136275,0.16454609,-118.44302,118.72147,7.1792665,13.669446,-6.0241103,-121.483696,-206.78264,20.848713,3.856965,-3.550459,216.19415,990000
|
| 60 |
+
0.638468,119.479614,0.009169005,0.005263598,-11.925936,0.18421283,-119.37026,119.66909,9.711718,17.86645,6.0359545,-122.29988,-200.24715,27.578167,3.5069063,-4.323081,292.20493,995000
|
| 61 |
+
0.6436029,125.871506,0.009214469,0.007972184,-11.634819,0.13289818,-125.76429,126.012375,6.505573,12.155992,8.654337,-128.52867,-206.0692,18.661564,3.3392067,-2.7320518,165.03264,1000000
|
| 62 |
+
0.6431514,126.82629,0.009052112,-0.005345357,-13.090509,0.14898214,-126.707794,126.96992,6.4889984,9.911747,-7.0914135,-129.74706,-199.92456,16.400745,1.4613732,-1.6025965,158.20789,1005000
|
| 63 |
+
0.64592665,122.79101,0.008986984,0.0001038335,-12.488446,0.14421284,-122.67877,122.935326,9.7251005,17.512419,9.443184,-126.27266,-204.4824,27.237518,4.529858,-4.699518,298.22696,1010000
|
| 64 |
+
0.641336,125.733345,0.009046481,0.0028280606,-12.187386,0.1599535,-125.62309,125.896126,5.2026258,15.14704,-10.193426,-128.47691,-201.45389,20.349667,1.8537345,-2.0673993,173.47496,1015000
|
| 65 |
+
0.63401616,121.418846,0.009321384,-0.010190855,-13.593277,0.17739025,-121.292145,121.586044,5.4529533,12.63087,0.6501003,-124.60589,-202.69028,18.083824,2.633357,-3.061808,167.95174,1020000
|
| 66 |
+
0.6495139,122.6859,0.008988562,0.010677432,-11.312109,0.1784961,-122.58423,122.87508,4.181917,11.206926,-0.37009484,-124.95827,-204.42694,15.388844,2.3916612,-2.2953718,137.00446,1025000
|
| 67 |
+
0.6412297,119.19217,0.008899503,0.00697735,-11.715984,0.16242287,-119.087906,119.36157,6.2200317,14.5052185,-2.2101605,-122.02984,-202.04897,20.72525,7.0335693,-8.304405,256.13074,1030000
|
| 68 |
+
0.64816236,120.73066,0.00879877,-0.0012217278,-12.638852,0.17041947,-120.61945,120.89986,4.7010016,10.829595,-2.2926445,-123.41614,-202.69545,15.530596,2.1594076,-2.1999135,163.16992,1035000
|
| 69 |
+
0.6485313,122.32833,0.009060118,0.012100244,-11.16445,0.12534398,-122.22718,122.465775,6.868324,24.0452,-3.0470943,-125.239784,-204.89436,30.913525,10.881,-12.683091,365.4353,1040000
|
| 70 |
+
0.6406615,127.33424,0.009098207,-0.0029472236,-12.823935,0.15980822,-127.217575,127.491104,5.4638276,9.355411,-1.3280982,-130.38306,-209.36145,14.819239,1.0635548,-1.0180377,133.38478,1045000
|
| 71 |
+
0.6431515,117.55626,0.008985502,0.018764593,-10.411681,0.16723211,-117.46271,117.742256,5.80049,12.332784,-3.2698796,-119.99438,-203.082,18.133274,1.6859559,-1.6478467,166.4632,1050000
|
| 72 |
+
0.64663327,123.04736,0.009013889,0.010243506,-11.363586,0.14202729,-122.94494,123.19964,4.965732,16.60391,-2.3551557,-126.003044,-206.97897,21.569643,2.8007243,-4.0174966,211.7115,1055000
|
| 73 |
+
0.6442242,115.295975,0.008986479,0.009844662,-11.404503,0.14607507,-115.19349,115.45189,5.1965623,16.74655,1.5760707,-118.7264,-207.23218,21.943111,2.6920686,-2.8448684,201.50403,1060000
|
| 74 |
+
0.6393934,123.70038,0.009166309,-0.017361557,-14.394062,0.16265428,-123.568436,123.845665,3.6160474,12.577919,-2.1845462,-125.97727,-206.28252,16.193966,1.4741958,-1.6489983,155.27928,1065000
|
| 75 |
+
0.6430768,120.15047,0.009067798,-0.0022624268,-12.749501,0.15993023,-120.03486,120.30813,9.07125,12.631204,1.0687145,-122.953575,-204.1062,21.702454,2.6803741,-2.5919428,194.23174,1070000
|
| 76 |
+
0.6445008,117.8512,0.009075134,0.0021487512,-12.2632265,0.16248877,-117.7399,118.01584,7.0098796,16.008215,1.4281921,-121.51143,-208.62712,23.018095,8.751586,-9.384328,242.74269,1075000
|
| 77 |
+
0.65046096,117.873825,0.008852489,0.023450954,-9.85092,0.16823214,-117.78662,118.06551,5.038648,16.921064,-3.4559927,-120.87598,-202.85689,21.959713,3.0602307,-3.363168,190.82669,1080000
|
| 78 |
+
0.6434744,119.3509,0.008812294,0.005576261,-11.867218,0.1463894,-119.24632,119.50287,5.414103,10.34599,2.9200203,-122.69102,-203.7399,15.760094,1.2992455,-1.1440701,156.69586,1085000
|
| 79 |
+
0.6332881,120.927185,0.008808942,-0.013748791,-14.060777,0.14988703,-120.80333,121.063324,7.2897277,17.916203,0.09635651,-123.766655,-208.48708,25.20593,8.4854355,-9.568885,280.3907,1090000
|
| 80 |
+
0.64363587,118.60824,0.008920258,-0.0055122264,-13.117945,0.15795545,-118.49123,118.76069,4.160379,10.827945,2.2171264,-122.16669,-209.33734,14.988323,1.113372,-1.4352105,132.48076,1095000
|
| 81 |
+
0.6470053,116.691696,0.009113912,0.009858234,-11.418331,0.16286854,-116.58763,116.864426,4.869993,18.055414,-1.4983546,-120.06905,-205.03075,22.925407,2.0869095,-2.533445,215.40843,1100000
|
| 82 |
+
0.64381105,120.5636,0.009032282,0.019479666,-10.343328,0.16383955,-120.47017,120.74692,4.967673,12.057758,-2.2838175,-123.11775,-206.88606,17.02543,1.3983307,-1.4608436,158.62877,1105000
|
| 83 |
+
0.641147,120.881516,0.008770132,-0.0034926517,-12.898244,0.14192674,-120.7684,121.01995,3.5765138,10.937434,-0.48328203,-123.38615,-203.82454,14.513948,1.6429541,-1.8659368,146.92435,1110000
|
| 84 |
+
0.64499515,116.68048,0.008843486,-0.0020006674,-12.726231,0.13043508,-116.56793,116.808914,5.2697024,14.193865,-8.133343,-119.54797,-207.51054,19.463568,3.6188838,-2.7531095,215.50247,1115000
|
| 85 |
+
0.64481294,118.2834,0.008762069,0.005907805,-11.825752,0.15816197,-118.17979,118.44747,4.8221974,13.75693,-1.2642927,-121.2282,-205.58162,18.579128,2.6265306,-2.621476,167.80286,1120000
|
| 86 |
+
0.648843,113.79812,0.008924771,0.008279102,-11.572346,0.17471036,-113.69484,113.98111,4.7576294,14.001288,-0.08921463,-116.73142,-207.07802,18.758919,3.2205486,-3.0653536,199.31,1125000
|
| 87 |
+
0.6534241,116.54996,0.00901529,0.021301901,-10.137136,0.15206334,-116.45857,116.72332,4.903936,13.76192,-0.3391986,-119.563286,-204.58592,18.665855,3.5787623,-3.303914,182.7084,1130000
|
| 88 |
+
0.6493373,119.51209,0.008831362,0.009395013,-11.436176,0.17248982,-119.41109,119.69398,5.607742,10.252814,-1.0966692,-121.25504,-203.25642,15.860556,2.3463595,-2.6751924,180.93805,1135000
|
| 89 |
+
0.63651764,110.757416,0.008695075,-0.009413841,-13.582664,0.18135498,-110.63931,110.92936,6.995782,15.420943,-0.87776893,-113.56602,-204.6345,22.416725,1.624832,-1.2641237,181.63391,1140000
|
| 90 |
+
0.64027953,120.73732,0.008843301,-0.006073124,-13.1867485,0.17511576,-120.620705,120.906364,4.525005,21.246851,-4.2116976,-124.808975,-206.33698,25.771856,3.8166778,-4.275342,194.12477,1145000
|
| 91 |
+
0.6476944,113.077805,0.008841113,0.010133424,-11.353829,0.14569002,-112.977425,113.23363,6.4936433,12.585855,4.52926,-115.73321,-205.40375,19.079498,2.6709132,-2.488758,195.38435,1150000
|
| 92 |
+
0.64258665,119.073975,0.00895503,-0.016029427,-14.289991,0.16087195,-118.946014,119.21882,7.100122,13.501746,1.4063656,-122.33471,-197.71037,20.601868,3.8408394,-4.341013,250.28577,1155000
|
| 93 |
+
0.6433364,113.84334,0.009020601,0.0020350327,-12.274402,0.1711415,-113.73262,114.01652,5.3910418,14.262671,-0.62449306,-116.19907,-208.1848,19.653713,1.7614827,-3.0105288,198.67708,1160000
|
| 94 |
+
0.64250344,115.421555,0.009079112,-0.008146174,-13.3972435,0.17297359,-115.29993,115.58638,12.800483,23.930128,4.1185946,-118.257034,-199.52951,36.73061,4.05628,-3.8096597,313.09235,1165000
|
| 95 |
+
0.6436531,110.91116,0.008900433,0.001668203,-12.312571,0.11992441,-110.801575,111.03276,6.0097275,13.937075,7.1140265,-113.09948,-200.16002,19.946802,2.8341112,-2.1976385,233.8071,1170000
|
| 96 |
+
0.64033985,114.935905,0.008942113,-0.005576592,-13.123632,0.14018813,-114.81854,115.07052,6.224197,16.683495,2.5274677,-118.32869,-203.18135,22.907692,2.3693988,-2.8971376,233.62556,1175000
|
| 97 |
+
0.64147836,119.90997,0.008830091,-0.014686868,-14.163275,0.18468255,-119.78491,120.07997,6.886258,23.731117,1.4195355,-123.47017,-205.64088,30.617374,7.224556,-4.6502905,426.9449,1180000
|
| 98 |
+
0.63770413,113.691345,0.008855352,-0.009772188,-13.603535,0.1487444,-113.570885,113.830315,6.701122,14.211255,4.158659,-116.49475,-208.98463,20.912376,1.47606,-2.220014,190.69266,1185000
|
| 99 |
+
0.6511342,115.96462,0.008953001,0.014697286,-10.858396,0.15459505,-115.86742,116.13391,4.33658,14.328055,10.5042095,-117.94667,-204.92564,18.664635,2.652356,-2.7399647,182.02916,1190000
|
| 100 |
+
0.6386027,106.60608,0.009015845,-0.0021253582,-12.735736,0.13437891,-106.49126,106.73833,14.264702,17.393402,-4.6719804,-109.80898,-207.09148,31.658104,3.9873161,-4.0583134,337.3333,1195000
|
| 101 |
+
0.6360383,107.42423,0.008991176,-0.015470767,-14.220661,0.14421996,-107.29637,107.55298,5.311237,14.378943,6.951978,-110.82977,-206.01114,19.69018,2.347659,-2.2013845,186.00365,1200000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f701afd083e7d07c36a09a50962eb47bf2a95d79e068a9b1ece792ed53c35648
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8e47980aec32073fe86ad2237b9f35db2426fdd12f963757af96d27ba6e4acb
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:acec66aa1af76396a08e43d04c20837151d383a3825173415beef507010498f9
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14e84e661b71df414ff4847e101738cdfbf3c9c1ed400b491582d287b1be4ec4
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_1200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5823011a09bff02ee1b1a0c77c7d8213f81423780298a52377c3bd943f6162ce
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3b14b8eb992d1c7aa713cb8bf65c3a7bfeaff9bbc196b413970fa5736ab33bf
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:85d049de67849f520bc1b4cbdb4fe4d03f4e0890b79cb25aca0717e8f2c12705
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1837b2db0010bab57eb0b6e6988c866500a5bcb86ec640f195a98895c9314ac8
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88f4da953b6dcb9a2f117fc899b9e695cc0cdf24516dc529d3adc3b8cacc9a7a
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:997a48c94314cb60133a660020f8ec2fd19d632d3f07f68110344ba70f7d4588
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_005645/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/tj5bmnmt
|