Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1150000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1200000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1250000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1300000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.019578055199786174,-0.011269075087626161,-0.019109701726833364,-0.009126848244162307,31.954991433303423,10.41399999999924,0.82,5163.94,-0.28,-345.76,206.28,0.9430085897445679,850000
|
| 3 |
+
0.0,0.0,-0.04136239362513198,0.010216450224325777,-0.03996281404788762,-0.01077549136879532,31.754723543191332,7.91299999999936,0.88,14314.84,-0.14,-231.34,156.26,0.6541470098495483,900000
|
| 4 |
+
0.0,0.0,-0.04178376027891513,-5.632733224624781e-05,-0.040328969987277107,-0.002996880662274512,33.48145704313381,6.66799999999973,0.96,22099.42,-0.04,-182.1,131.36,0.6086168050765991,950000
|
| 5 |
+
0.0,0.0,-0.025576161963293764,0.017448279491254843,-0.023430029461382132,0.023806483399769336,34.29714923253659,6.984999999999629,0.94,28869.66,-0.1,-208.26,137.7,0.6028055477142334,1000000
|
| 6 |
+
0.0,0.0,-0.04466660208619256,0.025298144239289642,-0.04217346257510956,0.017251235261987945,34.07550746105516,6.1429999999997325,0.98,35299.18,-0.02,-168.08,120.86,0.514926061630249,1050000
|
| 7 |
+
0.0,0.0,-0.0532971265168325,0.029369042822244434,-0.05066930063219372,0.024033016855302746,34.76573983273956,4.6389999999997995,1.0,40939.1,0.0,-131.32,90.78,0.4130169057846069,1100000
|
| 8 |
+
0.0,0.0,-0.043565875036844386,0.053435883829381095,-0.0406731390953118,0.023080594093398726,33.88244454796426,4.743999999999735,1.0,45627.0,0.0,-136.48,92.88,0.4289014530181885,1150000
|
| 9 |
+
0.0,0.0,-0.03746212854542908,0.036921185307463064,-0.03515683812674663,0.02460303294370872,32.22281709079693,5.8399999999996455,0.94,51458.1,-0.06,-183.06,114.8,0.4805546188354492,1200000
|
| 10 |
+
0.0,0.0,-0.06066823217186648,0.03370884396128769,-0.05688451357290281,0.03243632756720202,34.89465642056672,3.600999999999893,1.0,56326.96,0.0,-105.08,70.02,0.3073910903930664,1250000
|
| 11 |
+
0.0,0.0,-0.065843398699879,0.031311326535999974,-0.06250014072131607,0.02895211345430387,34.409031450556874,4.287999999999823,0.98,60520.24,-0.02,-115.38,83.76,0.39982683658599855,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.019578055199786174,-0.011269075087626161,-0.019109701726833364,-0.009126848244162307,31.954991433303423,10.41399999999924,0.82,5163.94,-0.28,-345.76,206.28,0.9430085897445679,850000
|
| 3 |
+
0.0,0.0,-0.04136239362513198,0.010216450224325777,-0.03996281404788762,-0.01077549136879532,31.754723543191332,7.91299999999936,0.88,14314.84,-0.14,-231.34,156.26,0.6541470098495483,900000
|
| 4 |
+
0.0,0.0,-0.04178376027891513,-5.632733224624781e-05,-0.040328969987277107,-0.002996880662274512,33.48145704313381,6.66799999999973,0.96,22099.42,-0.04,-182.1,131.36,0.6086168050765991,950000
|
| 5 |
+
0.0,0.0,-0.025576161963293764,0.017448279491254843,-0.023430029461382132,0.023806483399769336,34.29714923253659,6.984999999999629,0.94,28869.66,-0.1,-208.26,137.7,0.6028055477142334,1000000
|
| 6 |
+
0.0,0.0,-0.04466660208619256,0.025298144239289642,-0.04217346257510956,0.017251235261987945,34.07550746105516,6.1429999999997325,0.98,35299.18,-0.02,-168.08,120.86,0.514926061630249,1050000
|
| 7 |
+
0.0,0.0,-0.0532971265168325,0.029369042822244434,-0.05066930063219372,0.024033016855302746,34.76573983273956,4.6389999999997995,1.0,40939.1,0.0,-131.32,90.78,0.4130169057846069,1100000
|
| 8 |
+
0.0,0.0,-0.043565875036844386,0.053435883829381095,-0.0406731390953118,0.023080594093398726,33.88244454796426,4.743999999999735,1.0,45627.0,0.0,-136.48,92.88,0.4289014530181885,1150000
|
| 9 |
+
0.0,0.0,-0.03746212854542908,0.036921185307463064,-0.03515683812674663,0.02460303294370872,32.22281709079693,5.8399999999996455,0.94,51458.1,-0.06,-183.06,114.8,0.4805546188354492,1200000
|
| 10 |
+
0.0,0.0,-0.06066823217186648,0.03370884396128769,-0.05688451357290281,0.03243632756720202,34.89465642056672,3.600999999999893,1.0,56326.96,0.0,-105.08,70.02,0.3073910903930664,1250000
|
| 11 |
+
0.0,0.0,-0.065843398699879,0.031311326535999974,-0.06250014072131607,0.02895211345430387,34.409031450556874,4.287999999999823,0.98,60520.24,-0.02,-115.38,83.76,0.39982683658599855,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.64530706,151.45154,0.0071283975,0.0039018842,-11.952628,0.19129601,-151.36633,151.64674,1.946989,3.764349,-43.19062,-154.18723,-194.7333,5.711338,1.6045392,-1.5209478,59.659332,805000
|
| 3 |
+
0.64778996,147.44556,0.0077615296,-0.008926482,-13.650093,0.19778866,-147.3396,147.63441,1.9322551,6.253452,-34.117447,-150.06123,-193.53798,8.185707,2.234766,-2.7194905,89.24094,810000
|
| 4 |
+
0.64080274,144.31929,0.008799769,-0.008743407,-13.493595,0.19734813,-144.20053,144.50789,1.6041905,5.17741,-42.39156,-147.24944,-193.16669,6.7816005,0.5052182,-0.85741657,53.693893,815000
|
| 5 |
+
0.6381637,139.14365,0.0091969725,-0.009806095,-13.566231,0.16819853,-139.01889,139.30203,4.3599787,9.68357,-9.43463,-143.37065,-201.3088,14.043549,2.0484245,-2.2449026,130.23145,820000
|
| 6 |
+
0.64582455,138.06465,0.009048228,0.0042560697,-12.029624,0.16679254,-137.95581,138.2357,2.6890614,8.729525,-49.738777,-141.13708,-201.1968,11.418586,0.9534511,-1.0779656,79.04982,825000
|
| 7 |
+
0.646403,136.56752,0.009007165,0.0076863817,-11.646637,0.1743981,-136.46262,136.7496,3.4507592,6.3948073,-32.522446,-139.08946,-197.8874,9.845567,4.955686,-4.5787716,112.66143,830000
|
| 8 |
+
0.6468451,137.1506,0.008984512,0.00013275721,-12.485224,0.17908798,-137.03842,137.32983,3.6096458,6.51197,-8.661832,-139.74847,-197.03651,10.121616,3.6167061,-3.3629735,109.54373,835000
|
| 9 |
+
0.63946056,136.57735,0.009138573,-0.014386287,-14.074238,0.18641861,-136.44873,136.74937,3.4819372,12.248917,-17.559185,-140.29103,-200.11787,15.730854,6.3223586,-6.5211773,140.78856,840000
|
| 10 |
+
0.64497316,135.94107,0.009571445,-0.00041384716,-12.543238,0.16752937,-135.82101,136.10818,3.2366714,6.485897,-16.441423,-138.90538,-198.28952,9.7225685,2.1301107,-1.8733666,90.327194,845000
|
| 11 |
+
0.64214855,136.24722,0.009655323,-0.0054118745,-13.060507,0.17602482,-136.12112,136.41783,3.2837055,9.746523,-1.9645768,-139.34282,-197.28459,13.030229,1.1283288,-1.4893548,121.95651,850000
|
| 12 |
+
0.6387469,130.44458,0.00950909,-0.010884558,-13.644648,0.18512529,-130.31485,130.61882,5.0602493,11.499225,-4.5960817,-134.10628,-197.76358,16.559475,7.569109,-6.915238,202.48105,855000
|
| 13 |
+
0.63597625,131.54105,0.009436453,-0.010416738,-13.603883,0.18895352,-131.41269,131.71957,3.4336464,8.557866,-16.336914,-134.97337,-201.94922,11.991512,2.0119822,-2.0964508,91.50578,860000
|
| 14 |
+
0.6473262,133.5199,0.009659564,-0.0058859284,-13.109337,0.18265426,-133.39325,133.69666,4.5276227,7.6472125,-30.946589,-136.19719,-200.49179,12.174835,2.3002136,-1.7486906,145.02754,865000
|
| 15 |
+
0.6435719,130.24225,0.00954603,-0.0074375346,-13.279123,0.15957046,-130.11548,130.3944,2.6802511,7.0118456,-19.340858,-133.07523,-197.11592,9.692097,1.0593324,-1.0205172,76.793236,870000
|
| 16 |
+
0.64371914,134.16681,0.009646865,-0.008289667,-13.359312,0.15864417,-134.03792,134.31717,2.597853,10.0781355,-23.25231,-137.82315,-202.03552,12.675988,2.8861115,-3.433244,129.47644,875000
|
| 17 |
+
0.6384182,134.73788,0.009523511,-0.0033488723,-12.851643,0.16106829,-134.6155,134.89561,3.6973045,11.6148815,-2.1888685,-138.08067,-200.68903,15.312186,1.9792695,-2.2276893,129.10948,880000
|
| 18 |
+
0.6387728,134.235,0.009341059,-0.0027508384,-12.794489,0.1404204,-134.1155,134.37268,7.8477015,16.63822,-31.722506,-137.32108,-201.50786,24.485922,5.5378027,-5.814643,230.14438,885000
|
| 19 |
+
0.6460577,132.14188,0.009542244,-0.00634399,-13.164832,0.17813972,-132.01625,132.31367,3.0712292,8.073055,-19.706179,-134.57567,-205.83273,11.144284,2.0217018,-2.1197557,103.49298,890000
|
| 20 |
+
0.64369124,128.93604,0.00939073,0.009587433,-11.4790535,0.15425014,-128.82825,129.09987,2.5253081,8.429105,-1.7357129,-131.70494,-200.05612,10.954412,1.892551,-1.8036768,99.3125,895000
|
| 21 |
+
0.6336833,123.64557,0.009638239,-0.0032889978,-12.841245,0.20613681,-123.521805,123.84842,3.1233003,8.807258,0.9685744,-127.155815,-202.76634,11.930558,6.2629633,-5.992218,133.83966,900000
|
| 22 |
+
0.64646703,129.61545,0.009605452,0.004071748,-12.0761,0.17531925,-129.49945,129.79485,3.0743368,11.87222,-10.910489,-133.12503,-201.25401,14.946557,4.1566277,-3.809247,126.87405,905000
|
| 23 |
+
0.6372495,125.97975,0.009509402,-0.01539024,-14.118423,0.15800947,-125.845505,126.122375,4.271411,8.601952,-11.84675,-129.36516,-200.00891,12.873363,4.131432,-2.9272683,127.76545,910000
|
| 24 |
+
0.64200926,124.775406,0.009568,0.0028348062,-12.20372,0.19566771,-124.658646,124.973915,3.6070564,10.992043,0.8751895,-129.14403,-206.85716,14.599099,10.164488,-9.389187,208.66998,915000
|
| 25 |
+
0.6485127,129.24744,0.009567539,0.0047987974,-11.998429,0.16412434,-129.13263,129.41635,3.6843953,12.117945,-2.5786371,-131.88127,-202.6602,15.80234,7.418913,-6.7387333,157.86917,920000
|
| 26 |
+
0.64305043,130.71681,0.009461757,-0.007969109,-13.342244,0.1747335,-130.59058,130.88358,3.8654923,8.022582,-7.6632204,-133.92299,-198.00703,11.888075,3.0206022,-1.4140596,109.01419,925000
|
| 27 |
+
0.6493245,130.2719,0.009417187,0.009829143,-11.456255,0.16706479,-130.164,130.44879,3.7411842,12.047646,-5.378246,-133.74205,-206.01443,15.78883,2.5857537,-3.0816195,140.85968,930000
|
| 28 |
+
0.6352143,127.00627,0.009560685,-0.01243791,-13.800943,0.18414296,-126.87432,127.17798,2.7595425,13.819522,2.1839423,-130.26884,-200.64621,16.579063,3.3815682,-2.7306888,138.87216,935000
|
| 29 |
+
0.6396308,124.88336,0.009243012,-0.0068211043,-13.237974,0.21149899,-124.761,125.08804,4.713974,10.277672,-11.991817,-128.37024,-203.25159,14.991646,4.3375163,-4.846834,156.22133,940000
|
| 30 |
+
0.6549991,127.29137,0.009084781,0.009004571,-11.508829,0.1703541,-127.1868,127.470726,9.574971,10.717213,0.42268813,-130.31137,-202.7935,20.292183,3.623092,-2.4339974,237.89262,945000
|
| 31 |
+
0.648085,129.26913,0.009306116,0.0062638535,-11.82691,0.18396509,-129.15907,129.45937,2.6724584,8.705113,3.3706195,-131.11339,-204.36172,11.377572,6.071621,-6.52353,145.72362,950000
|
| 32 |
+
0.64283085,124.91946,0.009268761,0.00083231594,-12.410202,0.17649093,-124.80443,125.09678,2.33236,9.647229,-4.415162,-128.37865,-203.45605,11.979589,4.295574,-3.9597216,140.09016,955000
|
| 33 |
+
0.6398686,128.10672,0.009197108,0.0050142403,-11.9548025,0.16161518,-127.99678,128.27336,6.19904,14.949328,-7.6854954,-131.22617,-201.9682,21.148369,5.846786,-5.7091455,282.38208,960000
|
| 34 |
+
0.633834,126.51166,0.009270171,-0.014299853,-14.042566,0.1833516,-126.381485,126.68071,5.1353087,13.535263,-2.0781572,-130.38359,-202.05853,18.670572,2.3987296,-2.9906862,173.86717,965000
|
| 35 |
+
0.6526637,129.27945,0.009067093,0.01502206,-10.843233,0.17309235,-129.18112,129.46756,3.8580265,8.908418,-3.8630464,-131.5659,-202.01045,12.766444,2.3070388,-1.9413198,149.11673,970000
|
| 36 |
+
0.6482518,129.09827,0.009242492,0.0073989048,-11.699469,0.15623128,-128.99013,129.2619,4.096471,10.511378,-4.9869633,-132.04176,-204.25061,14.607849,4.293025,-4.1829195,195.66927,975000
|
| 37 |
+
0.648094,127.91079,0.009221876,0.012711811,-11.121559,0.15795715,-127.80823,128.08145,3.0247827,11.743599,1.652974,-129.93605,-202.4037,14.768381,1.5803292,-1.4001548,131.79373,980000
|
| 38 |
+
0.6262717,124.840866,0.009067669,-0.033476185,-16.191818,0.16534077,-124.694046,124.97273,3.6806142,10.304584,-6.5996127,-127.93963,-198.62473,13.985198,2.812267,-3.118621,132.45428,985000
|
| 39 |
+
0.6516476,125.477936,0.009109811,0.0085051665,-11.566373,0.154639,-125.372574,125.64108,3.5983658,12.343293,5.3442435,-127.89007,-196.59073,15.941659,2.4201841,-2.4988332,166.42148,990000
|
| 40 |
+
0.6361518,123.10919,0.008952323,-0.0015794134,-12.676425,0.19172975,-122.995705,123.29934,2.8808472,12.34013,0.9983201,-125.98496,-206.37018,15.220977,2.1284478,-1.272212,110.8873,995000
|
| 41 |
+
0.6419613,128.31447,0.009379377,-0.012819967,-13.866825,0.1425274,-128.1844,128.44418,5.7957516,19.876371,-15.185081,-131.86624,-204.07536,25.672123,2.8091931,-3.1722734,260.10995,1000000
|
| 42 |
+
0.6414403,122.97156,0.009426342,-0.008208405,-13.370794,0.15206194,-122.84552,123.11541,5.6284738,10.551465,-2.8885527,-126.441795,-201.089,16.17994,4.459067,-3.9681387,138.99858,1005000
|
| 43 |
+
0.6335872,124.71059,0.008935046,-0.001847516,-12.706772,0.15157737,-124.597046,124.86032,7.737613,11.251699,-7.9901605,-127.493,-202.00919,18.989313,1.1814945,-1.2889532,158.24274,1010000
|
| 44 |
+
0.6447632,125.38285,0.009036677,0.0007208479,-12.420231,0.15936273,-125.270615,125.54293,2.9831538,11.179778,0.6246758,-128.37756,-201.61462,14.162931,4.2437606,-6.4575915,181.34703,1015000
|
| 45 |
+
0.64373016,122.58633,0.008926134,0.0055760327,-11.875314,0.17193592,-122.480316,122.76384,2.8420384,9.403734,-0.3499058,-125.82975,-202.59935,12.245772,1.783332,-1.7742308,110.437,1020000
|
| 46 |
+
0.63591284,120.34452,0.0090353545,0.011556195,-11.221003,0.18668321,-120.24313,120.54276,3.8062704,12.823054,-5.5159793,-123.62289,-199.35257,16.629324,4.418092,-3.8486297,167.17308,1025000
|
| 47 |
+
0.6417389,125.9348,0.008885633,0.00211528,-12.261944,0.1782994,-125.82584,126.11521,4.2040887,10.489898,0.46938378,-128.62085,-202.40022,14.693987,1.6466022,-1.7262478,129.86987,1030000
|
| 48 |
+
0.64039594,120.50253,0.009109911,-0.003973058,-12.936125,0.19240403,-120.38469,120.69096,6.585654,10.121231,-5.150677,-123.24656,-196.52623,16.706884,3.1107054,-1.7434717,169.26146,1035000
|
| 49 |
+
0.6502667,123.33198,0.008805683,0.0052252333,-11.906607,0.12575838,-123.227135,123.46296,4.753125,14.178517,1.3936784,-126.71087,-201.9305,18.931643,2.9474378,-3.0746727,208.22192,1040000
|
| 50 |
+
0.63774514,126.11377,0.008993127,-0.019801775,-14.701879,0.17314675,-125.98155,126.26712,4.8370676,15.311411,-16.543993,-129.67627,-202.34277,20.14848,4.2073517,-4.7344823,218.67862,1045000
|
| 51 |
+
0.6369139,115.44011,0.008951268,-0.0011627098,-12.629893,0.14698759,-115.32706,115.58594,5.2979927,13.606287,-7.139892,-118.24066,-201.38965,18.90428,4.423138,-4.4940643,185.28714,1050000
|
| 52 |
+
0.64057326,126.43199,0.008806267,-0.009438542,-13.571798,0.1538648,-126.31248,126.576416,6.2865148,10.371971,5.164221,-128.94112,-199.4168,16.658485,1.4401855,-1.4502019,163.82767,1055000
|
| 53 |
+
0.6430394,125.29396,0.008925845,0.0012870842,-12.355803,0.17055085,-125.18368,125.4658,3.2043457,11.045119,3.0528643,-128.31938,-203.51682,14.249465,6.5502353,-7.1335692,159.20297,1060000
|
| 54 |
+
0.6474498,125.9054,0.008829122,0.0033216143,-12.123789,0.16772383,-125.798355,126.07645,3.2896135,9.5638075,-7.2307005,-128.65549,-205.59143,12.853421,2.8234432,-2.1085727,152.23788,1065000
|
| 55 |
+
0.6402246,122.37058,0.008848122,0.006864278,-11.724211,0.18512477,-122.266846,122.56258,4.0216117,11.715304,-6.2930684,-124.680786,-203.51048,15.736916,1.8328145,-1.8222253,140.21796,1070000
|
| 56 |
+
0.64027935,120.727264,0.008951841,-0.00042556794,-12.54754,0.17398402,-120.61493,120.90082,6.4230165,14.102671,-3.5859928,-123.882935,-204.16862,20.525688,2.1335008,-2.516254,224.95184,1075000
|
| 57 |
+
0.63630944,125.0544,0.0090376595,-0.0033149992,-12.866798,0.17456657,-124.93812,125.22565,4.8103943,10.9070425,-2.4047513,-128.5908,-204.87625,15.717437,1.0270673,-1.0001901,115.306854,1080000
|
| 58 |
+
0.63865906,120.21718,0.009000673,-0.004929453,-13.047676,0.16347052,-120.09975,120.37572,4.901005,10.711132,-0.18953872,-122.390335,-200.92003,15.612137,2.5577683,-2.5598915,156.91612,1085000
|
| 59 |
+
0.6325461,112.727295,0.0089335935,-0.004204781,-12.970671,0.13425481,-112.61142,112.857346,10.285979,14.851138,0.33221596,-116.22283,-198.9915,25.137117,4.469312,-4.373122,236.9112,1090000
|
| 60 |
+
0.63822013,118.43169,0.009034493,0.0070778765,-11.716572,0.14792976,-118.325836,118.58669,30.750147,14.182797,1.3088117,-121.33264,-203.51306,44.932945,8.055429,-8.687659,228.93695,1095000
|
| 61 |
+
0.64747125,124.92998,0.009052215,-0.0042077187,-12.964828,0.1582554,-124.81262,125.08402,5.5732903,12.828023,-1.1521324,-127.44454,-199.26945,18.401314,4.5200167,-4.446531,223.49661,1100000
|
| 62 |
+
0.64335465,121.84859,0.009021789,0.0026992422,-12.200809,0.16838184,-121.73852,122.01967,4.8450027,10.828073,-7.1644588,-125.04272,-201.78134,15.673075,1.0276833,-0.8939016,122.46297,1105000
|
| 63 |
+
0.64151627,119.04775,0.009030964,-0.0011368113,-12.625879,0.14925756,-118.93373,119.19587,4.016229,10.710135,-4.4565725,-122.62154,-200.65144,14.726364,2.4761379,-2.431656,122.764626,1110000
|
| 64 |
+
0.63749737,120.244446,0.009051581,0.007823418,-11.635685,0.13484535,-120.13913,120.38711,4.380832,13.570641,-5.1136475,-123.3998,-203.47577,17.951473,3.0773797,-1.9099047,158.98387,1115000
|
| 65 |
+
0.63891244,118.42381,0.009246706,-0.00961116,-13.539414,0.16066878,-118.298615,118.57487,3.365495,12.731094,8.52302,-121.46726,-201.6844,16.09659,4.5901284,-4.738214,179.8122,1120000
|
| 66 |
+
0.6420221,120.63182,0.009095726,-0.0018284336,-12.701021,0.1754812,-120.5163,120.80547,4.330212,12.564938,5.0376577,-123.27093,-202.67134,16.89515,7.4697847,-7.610998,192.14871,1125000
|
| 67 |
+
0.6423286,114.55643,0.009202527,-0.0030562286,-12.832108,0.15021926,-114.43834,114.70359,3.213144,12.205401,-3.7241104,-117.61372,-205.366,15.418546,1.607938,-1.9042472,138.75562,1130000
|
| 68 |
+
0.64889014,114.322876,0.009080649,0.0048412243,-11.966864,0.16816385,-114.21421,114.49589,5.7513933,8.555379,9.515275,-117.60525,-204.43233,14.306772,4.8888164,-5.033836,172.1196,1135000
|
| 69 |
+
0.6442645,117.38443,0.0089912275,0.015409641,-10.786147,0.17976427,-117.287445,117.579605,4.4486814,11.413592,6.9388123,-120.49725,-200.15926,15.862274,4.9661474,-5.67609,176.9141,1140000
|
| 70 |
+
0.6399818,122.85323,0.00931683,-0.008391381,-13.400669,0.16647306,-122.72838,123.011314,3.9086087,11.265607,0.79158896,-126.007996,-199.69624,15.174215,3.1140208,-3.2011726,162.71822,1145000
|
| 71 |
+
0.6359494,114.36154,0.00895561,-0.0076191043,-13.350763,0.13642992,-114.24198,114.49035,11.5581875,12.212228,3.03378,-116.68398,-202.12794,23.770416,3.8421316,-5.139534,261.6341,1150000
|
| 72 |
+
0.6441986,119.64505,0.00900115,0.0061497735,-11.816779,0.16510203,-119.53868,119.8163,8.989821,14.263605,-3.288331,-122.018265,-200.61362,23.253426,2.8998253,-3.264515,213.27899,1155000
|
| 73 |
+
0.63930994,114.34569,0.008958736,-0.008404898,-13.438179,0.17461729,-114.22531,114.511894,5.8479123,12.458501,-0.9938708,-117.41206,-203.66331,18.306414,2.0447383,-2.4165726,185.13705,1160000
|
| 74 |
+
0.6435765,117.71646,0.0092446655,-0.0049175764,-13.031937,0.18249275,-117.59599,117.894035,2.6522443,13.453914,-2.4171164,-120.973564,-204.45055,16.106157,4.7511406,-4.8530803,165.42174,1165000
|
| 75 |
+
0.6441177,115.79048,0.008940378,0.0025394973,-12.215952,0.12301375,-115.68127,115.91604,3.191152,10.792172,3.3246257,-118.97512,-204.66556,13.983324,1.3016728,-0.9511538,120.95566,1170000
|
| 76 |
+
0.63996714,114.658325,0.008945248,-0.006444326,-13.220419,0.13263686,-114.54006,114.784515,5.6182294,12.919925,3.588457,-118.13485,-203.87958,18.538155,2.3675346,-2.4253607,175.35168,1175000
|
| 77 |
+
0.6472302,114.61462,0.008931046,0.008293083,-11.571432,0.16970901,-114.51126,114.79262,4.107263,10.300577,-1.297009,-117.15,-202.4347,14.407841,3.1233022,-2.330678,148.71701,1180000
|
| 78 |
+
0.63812673,117.321655,0.009025415,-0.019413298,-14.650959,0.1528407,-117.18942,117.45508,3.8654854,12.609277,0.16729374,-120.67201,-204.33228,16.474762,2.1686172,-2.2013063,163.2712,1185000
|
| 79 |
+
0.63457733,118.61914,0.008904741,-0.01680014,-14.386651,0.16019544,-118.49103,118.762535,4.7007265,14.521354,-0.11960555,-121.11697,-199.53914,19.22208,2.4849174,-3.4842577,194.86765,1190000
|
| 80 |
+
0.6419711,115.17522,0.009057091,-0.003061783,-12.838054,0.1581711,-115.058945,115.33033,4.0616336,12.323306,2.6754103,-118.43673,-201.73927,16.38494,3.7936509,-3.4912312,179.9932,1195000
|
| 81 |
+
0.6394017,113.08376,0.008952216,0.005153115,-11.924376,0.13653684,-112.97701,113.22545,5.434844,21.786493,-4.744319,-117.58152,-204.23679,27.221336,18.331938,-19.037392,352.15814,1200000
|
| 82 |
+
0.6452251,114.158646,0.009151237,0.0040949713,-12.052523,0.13933654,-114.04835,114.30208,4.7481875,10.679305,-1.9141788,-117.13181,-204.65437,15.427492,1.3316841,-1.379427,136.29532,1205000
|
| 83 |
+
0.6417044,117.31653,0.0088636195,0.0014102319,-12.340897,0.15411162,-117.207146,117.47205,4.457092,9.469447,-2.1437001,-120.07549,-200.9081,13.926538,3.9012382,-2.8173084,158.09586,1210000
|
| 84 |
+
0.6478798,111.687935,0.009085928,0.011598593,-11.223455,0.16143486,-111.58595,111.86097,6.0767236,12.375046,-4.426555,-114.31807,-200.4281,18.451769,3.427331,-2.909831,180.42212,1215000
|
| 85 |
+
0.6425679,113.764046,0.008899554,-0.009781246,-13.5990715,0.19986562,-113.64302,113.95413,5.080354,10.585074,0.78503126,-117.14629,-198.44113,15.665428,2.3134422,-2.6875365,159.91138,1220000
|
| 86 |
+
0.6483133,114.335915,0.008943102,0.004711091,-11.973215,0.15933302,-114.228836,114.499954,5.1511803,14.4333105,-6.565956,-117.49387,-205.42143,19.584492,5.421847,-4.9954576,216.45692,1225000
|
| 87 |
+
0.6500518,114.09095,0.008938311,0.0073450967,-11.678246,0.15606585,-113.986565,114.254364,3.8946435,14.421097,-4.813753,-117.46484,-198.62079,18.31574,3.3998652,-3.3849719,199.30556,1230000
|
| 88 |
+
0.654586,116.65885,0.0090113925,0.023943437,-9.842981,0.17528483,-116.57015,116.85808,4.5858417,12.052828,-10.10899,-117.87087,-204.42686,16.63867,1.6840478,-1.9306474,178.63008,1235000
|
| 89 |
+
0.63838553,107.77483,0.008940681,-0.0022575266,-12.752501,0.15575528,-107.66081,107.92833,5.176726,18.016459,-1.4063989,-110.79207,-204.96379,23.193184,2.993135,-3.0509832,202.66487,1240000
|
| 90 |
+
0.645451,117.234116,0.00907391,0.0056982967,-11.872013,0.14591734,-117.126396,117.385735,6.9706726,15.473946,-5.150408,-120.55778,-200.54639,22.444618,4.710768,-3.8986478,305.13263,1245000
|
| 91 |
+
0.64949185,110.87115,0.009087471,0.006438022,-11.79155,0.14777866,-110.76399,111.02537,5.3136725,13.25802,7.2506413,-113.72986,-208.58847,18.571693,2.6872373,-2.1588652,220.47086,1250000
|
| 92 |
+
0.6372615,117.17987,0.008921282,-0.0024610404,-12.775862,0.17742355,-117.065895,117.35483,5.0350966,12.602782,9.785912,-120.23745,-206.75592,17.637878,3.055278,-4.2225165,166.03589,1255000
|
| 93 |
+
0.65055084,110.43919,0.009024921,0.008213692,-11.589888,0.14858694,-110.334595,110.596,6.6452317,13.530911,-2.5738738,-113.08174,-203.25798,20.176144,5.2041273,-4.761938,221.09059,1260000
|
| 94 |
+
0.6435777,113.13107,0.00903432,-0.0023665358,-12.76195,0.1561312,-113.01578,113.284836,4.91951,14.443294,4.902821,-116.49963,-204.79015,19.362804,2.5970795,-2.689025,209.6231,1265000
|
| 95 |
+
0.64414823,108.17973,0.00913213,0.00499328,-11.953218,0.13622221,-108.07058,108.320946,3.720113,11.68262,2.335027,-110.92887,-200.20403,15.402733,4.2302055,-3.2527492,156.41862,1270000
|
| 96 |
+
0.6392997,110.40303,0.009118833,-0.00067598827,-12.574131,0.19309235,-110.288376,110.59544,6.030208,14.079801,1.1412252,-113.40552,-202.61775,20.110008,3.9566097,-3.446022,196.08131,1275000
|
| 97 |
+
0.6327103,112.52719,0.00886264,-0.004035678,-12.9553585,0.17756154,-112.41238,112.700714,5.0299544,12.811571,2.0910602,-115.87813,-204.64185,17.841526,2.0840948,-1.8709232,153.90244,1280000
|
| 98 |
+
0.63721836,111.99739,0.009156889,-0.00071136496,-12.577686,0.15725172,-111.88222,112.15393,4.3236184,14.843093,4.8121514,-113.69462,-204.43098,19.166712,2.3622663,-1.945218,173.32361,1285000
|
| 99 |
+
0.6413306,109.357574,0.009260495,-0.000783866,-12.584646,0.15024629,-109.241035,109.507034,6.104498,18.207094,-4.0980577,-112.131485,-202.13612,24.311592,6.4269576,-6.5627136,235.332,1290000
|
| 100 |
+
0.63601035,105.85593,0.009156147,-0.009152462,-13.499598,0.16604869,-105.732315,106.01282,9.187842,16.397789,-5.7188263,-109.06525,-208.11346,25.585632,2.1719406,-2.1633742,224.60982,1295000
|
| 101 |
+
0.6370215,105.81694,0.009157164,-0.0072517735,-13.2919235,0.16424513,-105.69522,105.97393,6.200055,13.875284,-2.6775959,-108.841064,-203.3774,20.07534,2.491329,-2.5157256,178.3866,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.64530706,151.45154,0.0071283975,0.0039018842,-11.952628,0.19129601,-151.36633,151.64674,1.946989,3.764349,-43.19062,-154.18723,-194.7333,5.711338,1.6045392,-1.5209478,59.659332,805000
|
| 3 |
+
0.64778996,147.44556,0.0077615296,-0.008926482,-13.650093,0.19778866,-147.3396,147.63441,1.9322551,6.253452,-34.117447,-150.06123,-193.53798,8.185707,2.234766,-2.7194905,89.24094,810000
|
| 4 |
+
0.64080274,144.31929,0.008799769,-0.008743407,-13.493595,0.19734813,-144.20053,144.50789,1.6041905,5.17741,-42.39156,-147.24944,-193.16669,6.7816005,0.5052182,-0.85741657,53.693893,815000
|
| 5 |
+
0.6381637,139.14365,0.0091969725,-0.009806095,-13.566231,0.16819853,-139.01889,139.30203,4.3599787,9.68357,-9.43463,-143.37065,-201.3088,14.043549,2.0484245,-2.2449026,130.23145,820000
|
| 6 |
+
0.64582455,138.06465,0.009048228,0.0042560697,-12.029624,0.16679254,-137.95581,138.2357,2.6890614,8.729525,-49.738777,-141.13708,-201.1968,11.418586,0.9534511,-1.0779656,79.04982,825000
|
| 7 |
+
0.646403,136.56752,0.009007165,0.0076863817,-11.646637,0.1743981,-136.46262,136.7496,3.4507592,6.3948073,-32.522446,-139.08946,-197.8874,9.845567,4.955686,-4.5787716,112.66143,830000
|
| 8 |
+
0.6468451,137.1506,0.008984512,0.00013275721,-12.485224,0.17908798,-137.03842,137.32983,3.6096458,6.51197,-8.661832,-139.74847,-197.03651,10.121616,3.6167061,-3.3629735,109.54373,835000
|
| 9 |
+
0.63946056,136.57735,0.009138573,-0.014386287,-14.074238,0.18641861,-136.44873,136.74937,3.4819372,12.248917,-17.559185,-140.29103,-200.11787,15.730854,6.3223586,-6.5211773,140.78856,840000
|
| 10 |
+
0.64497316,135.94107,0.009571445,-0.00041384716,-12.543238,0.16752937,-135.82101,136.10818,3.2366714,6.485897,-16.441423,-138.90538,-198.28952,9.7225685,2.1301107,-1.8733666,90.327194,845000
|
| 11 |
+
0.64214855,136.24722,0.009655323,-0.0054118745,-13.060507,0.17602482,-136.12112,136.41783,3.2837055,9.746523,-1.9645768,-139.34282,-197.28459,13.030229,1.1283288,-1.4893548,121.95651,850000
|
| 12 |
+
0.6387469,130.44458,0.00950909,-0.010884558,-13.644648,0.18512529,-130.31485,130.61882,5.0602493,11.499225,-4.5960817,-134.10628,-197.76358,16.559475,7.569109,-6.915238,202.48105,855000
|
| 13 |
+
0.63597625,131.54105,0.009436453,-0.010416738,-13.603883,0.18895352,-131.41269,131.71957,3.4336464,8.557866,-16.336914,-134.97337,-201.94922,11.991512,2.0119822,-2.0964508,91.50578,860000
|
| 14 |
+
0.6473262,133.5199,0.009659564,-0.0058859284,-13.109337,0.18265426,-133.39325,133.69666,4.5276227,7.6472125,-30.946589,-136.19719,-200.49179,12.174835,2.3002136,-1.7486906,145.02754,865000
|
| 15 |
+
0.6435719,130.24225,0.00954603,-0.0074375346,-13.279123,0.15957046,-130.11548,130.3944,2.6802511,7.0118456,-19.340858,-133.07523,-197.11592,9.692097,1.0593324,-1.0205172,76.793236,870000
|
| 16 |
+
0.64371914,134.16681,0.009646865,-0.008289667,-13.359312,0.15864417,-134.03792,134.31717,2.597853,10.0781355,-23.25231,-137.82315,-202.03552,12.675988,2.8861115,-3.433244,129.47644,875000
|
| 17 |
+
0.6384182,134.73788,0.009523511,-0.0033488723,-12.851643,0.16106829,-134.6155,134.89561,3.6973045,11.6148815,-2.1888685,-138.08067,-200.68903,15.312186,1.9792695,-2.2276893,129.10948,880000
|
| 18 |
+
0.6387728,134.235,0.009341059,-0.0027508384,-12.794489,0.1404204,-134.1155,134.37268,7.8477015,16.63822,-31.722506,-137.32108,-201.50786,24.485922,5.5378027,-5.814643,230.14438,885000
|
| 19 |
+
0.6460577,132.14188,0.009542244,-0.00634399,-13.164832,0.17813972,-132.01625,132.31367,3.0712292,8.073055,-19.706179,-134.57567,-205.83273,11.144284,2.0217018,-2.1197557,103.49298,890000
|
| 20 |
+
0.64369124,128.93604,0.00939073,0.009587433,-11.4790535,0.15425014,-128.82825,129.09987,2.5253081,8.429105,-1.7357129,-131.70494,-200.05612,10.954412,1.892551,-1.8036768,99.3125,895000
|
| 21 |
+
0.6336833,123.64557,0.009638239,-0.0032889978,-12.841245,0.20613681,-123.521805,123.84842,3.1233003,8.807258,0.9685744,-127.155815,-202.76634,11.930558,6.2629633,-5.992218,133.83966,900000
|
| 22 |
+
0.64646703,129.61545,0.009605452,0.004071748,-12.0761,0.17531925,-129.49945,129.79485,3.0743368,11.87222,-10.910489,-133.12503,-201.25401,14.946557,4.1566277,-3.809247,126.87405,905000
|
| 23 |
+
0.6372495,125.97975,0.009509402,-0.01539024,-14.118423,0.15800947,-125.845505,126.122375,4.271411,8.601952,-11.84675,-129.36516,-200.00891,12.873363,4.131432,-2.9272683,127.76545,910000
|
| 24 |
+
0.64200926,124.775406,0.009568,0.0028348062,-12.20372,0.19566771,-124.658646,124.973915,3.6070564,10.992043,0.8751895,-129.14403,-206.85716,14.599099,10.164488,-9.389187,208.66998,915000
|
| 25 |
+
0.6485127,129.24744,0.009567539,0.0047987974,-11.998429,0.16412434,-129.13263,129.41635,3.6843953,12.117945,-2.5786371,-131.88127,-202.6602,15.80234,7.418913,-6.7387333,157.86917,920000
|
| 26 |
+
0.64305043,130.71681,0.009461757,-0.007969109,-13.342244,0.1747335,-130.59058,130.88358,3.8654923,8.022582,-7.6632204,-133.92299,-198.00703,11.888075,3.0206022,-1.4140596,109.01419,925000
|
| 27 |
+
0.6493245,130.2719,0.009417187,0.009829143,-11.456255,0.16706479,-130.164,130.44879,3.7411842,12.047646,-5.378246,-133.74205,-206.01443,15.78883,2.5857537,-3.0816195,140.85968,930000
|
| 28 |
+
0.6352143,127.00627,0.009560685,-0.01243791,-13.800943,0.18414296,-126.87432,127.17798,2.7595425,13.819522,2.1839423,-130.26884,-200.64621,16.579063,3.3815682,-2.7306888,138.87216,935000
|
| 29 |
+
0.6396308,124.88336,0.009243012,-0.0068211043,-13.237974,0.21149899,-124.761,125.08804,4.713974,10.277672,-11.991817,-128.37024,-203.25159,14.991646,4.3375163,-4.846834,156.22133,940000
|
| 30 |
+
0.6549991,127.29137,0.009084781,0.009004571,-11.508829,0.1703541,-127.1868,127.470726,9.574971,10.717213,0.42268813,-130.31137,-202.7935,20.292183,3.623092,-2.4339974,237.89262,945000
|
| 31 |
+
0.648085,129.26913,0.009306116,0.0062638535,-11.82691,0.18396509,-129.15907,129.45937,2.6724584,8.705113,3.3706195,-131.11339,-204.36172,11.377572,6.071621,-6.52353,145.72362,950000
|
| 32 |
+
0.64283085,124.91946,0.009268761,0.00083231594,-12.410202,0.17649093,-124.80443,125.09678,2.33236,9.647229,-4.415162,-128.37865,-203.45605,11.979589,4.295574,-3.9597216,140.09016,955000
|
| 33 |
+
0.6398686,128.10672,0.009197108,0.0050142403,-11.9548025,0.16161518,-127.99678,128.27336,6.19904,14.949328,-7.6854954,-131.22617,-201.9682,21.148369,5.846786,-5.7091455,282.38208,960000
|
| 34 |
+
0.633834,126.51166,0.009270171,-0.014299853,-14.042566,0.1833516,-126.381485,126.68071,5.1353087,13.535263,-2.0781572,-130.38359,-202.05853,18.670572,2.3987296,-2.9906862,173.86717,965000
|
| 35 |
+
0.6526637,129.27945,0.009067093,0.01502206,-10.843233,0.17309235,-129.18112,129.46756,3.8580265,8.908418,-3.8630464,-131.5659,-202.01045,12.766444,2.3070388,-1.9413198,149.11673,970000
|
| 36 |
+
0.6482518,129.09827,0.009242492,0.0073989048,-11.699469,0.15623128,-128.99013,129.2619,4.096471,10.511378,-4.9869633,-132.04176,-204.25061,14.607849,4.293025,-4.1829195,195.66927,975000
|
| 37 |
+
0.648094,127.91079,0.009221876,0.012711811,-11.121559,0.15795715,-127.80823,128.08145,3.0247827,11.743599,1.652974,-129.93605,-202.4037,14.768381,1.5803292,-1.4001548,131.79373,980000
|
| 38 |
+
0.6262717,124.840866,0.009067669,-0.033476185,-16.191818,0.16534077,-124.694046,124.97273,3.6806142,10.304584,-6.5996127,-127.93963,-198.62473,13.985198,2.812267,-3.118621,132.45428,985000
|
| 39 |
+
0.6516476,125.477936,0.009109811,0.0085051665,-11.566373,0.154639,-125.372574,125.64108,3.5983658,12.343293,5.3442435,-127.89007,-196.59073,15.941659,2.4201841,-2.4988332,166.42148,990000
|
| 40 |
+
0.6361518,123.10919,0.008952323,-0.0015794134,-12.676425,0.19172975,-122.995705,123.29934,2.8808472,12.34013,0.9983201,-125.98496,-206.37018,15.220977,2.1284478,-1.272212,110.8873,995000
|
| 41 |
+
0.6419613,128.31447,0.009379377,-0.012819967,-13.866825,0.1425274,-128.1844,128.44418,5.7957516,19.876371,-15.185081,-131.86624,-204.07536,25.672123,2.8091931,-3.1722734,260.10995,1000000
|
| 42 |
+
0.6414403,122.97156,0.009426342,-0.008208405,-13.370794,0.15206194,-122.84552,123.11541,5.6284738,10.551465,-2.8885527,-126.441795,-201.089,16.17994,4.459067,-3.9681387,138.99858,1005000
|
| 43 |
+
0.6335872,124.71059,0.008935046,-0.001847516,-12.706772,0.15157737,-124.597046,124.86032,7.737613,11.251699,-7.9901605,-127.493,-202.00919,18.989313,1.1814945,-1.2889532,158.24274,1010000
|
| 44 |
+
0.6447632,125.38285,0.009036677,0.0007208479,-12.420231,0.15936273,-125.270615,125.54293,2.9831538,11.179778,0.6246758,-128.37756,-201.61462,14.162931,4.2437606,-6.4575915,181.34703,1015000
|
| 45 |
+
0.64373016,122.58633,0.008926134,0.0055760327,-11.875314,0.17193592,-122.480316,122.76384,2.8420384,9.403734,-0.3499058,-125.82975,-202.59935,12.245772,1.783332,-1.7742308,110.437,1020000
|
| 46 |
+
0.63591284,120.34452,0.0090353545,0.011556195,-11.221003,0.18668321,-120.24313,120.54276,3.8062704,12.823054,-5.5159793,-123.62289,-199.35257,16.629324,4.418092,-3.8486297,167.17308,1025000
|
| 47 |
+
0.6417389,125.9348,0.008885633,0.00211528,-12.261944,0.1782994,-125.82584,126.11521,4.2040887,10.489898,0.46938378,-128.62085,-202.40022,14.693987,1.6466022,-1.7262478,129.86987,1030000
|
| 48 |
+
0.64039594,120.50253,0.009109911,-0.003973058,-12.936125,0.19240403,-120.38469,120.69096,6.585654,10.121231,-5.150677,-123.24656,-196.52623,16.706884,3.1107054,-1.7434717,169.26146,1035000
|
| 49 |
+
0.6502667,123.33198,0.008805683,0.0052252333,-11.906607,0.12575838,-123.227135,123.46296,4.753125,14.178517,1.3936784,-126.71087,-201.9305,18.931643,2.9474378,-3.0746727,208.22192,1040000
|
| 50 |
+
0.63774514,126.11377,0.008993127,-0.019801775,-14.701879,0.17314675,-125.98155,126.26712,4.8370676,15.311411,-16.543993,-129.67627,-202.34277,20.14848,4.2073517,-4.7344823,218.67862,1045000
|
| 51 |
+
0.6369139,115.44011,0.008951268,-0.0011627098,-12.629893,0.14698759,-115.32706,115.58594,5.2979927,13.606287,-7.139892,-118.24066,-201.38965,18.90428,4.423138,-4.4940643,185.28714,1050000
|
| 52 |
+
0.64057326,126.43199,0.008806267,-0.009438542,-13.571798,0.1538648,-126.31248,126.576416,6.2865148,10.371971,5.164221,-128.94112,-199.4168,16.658485,1.4401855,-1.4502019,163.82767,1055000
|
| 53 |
+
0.6430394,125.29396,0.008925845,0.0012870842,-12.355803,0.17055085,-125.18368,125.4658,3.2043457,11.045119,3.0528643,-128.31938,-203.51682,14.249465,6.5502353,-7.1335692,159.20297,1060000
|
| 54 |
+
0.6474498,125.9054,0.008829122,0.0033216143,-12.123789,0.16772383,-125.798355,126.07645,3.2896135,9.5638075,-7.2307005,-128.65549,-205.59143,12.853421,2.8234432,-2.1085727,152.23788,1065000
|
| 55 |
+
0.6402246,122.37058,0.008848122,0.006864278,-11.724211,0.18512477,-122.266846,122.56258,4.0216117,11.715304,-6.2930684,-124.680786,-203.51048,15.736916,1.8328145,-1.8222253,140.21796,1070000
|
| 56 |
+
0.64027935,120.727264,0.008951841,-0.00042556794,-12.54754,0.17398402,-120.61493,120.90082,6.4230165,14.102671,-3.5859928,-123.882935,-204.16862,20.525688,2.1335008,-2.516254,224.95184,1075000
|
| 57 |
+
0.63630944,125.0544,0.0090376595,-0.0033149992,-12.866798,0.17456657,-124.93812,125.22565,4.8103943,10.9070425,-2.4047513,-128.5908,-204.87625,15.717437,1.0270673,-1.0001901,115.306854,1080000
|
| 58 |
+
0.63865906,120.21718,0.009000673,-0.004929453,-13.047676,0.16347052,-120.09975,120.37572,4.901005,10.711132,-0.18953872,-122.390335,-200.92003,15.612137,2.5577683,-2.5598915,156.91612,1085000
|
| 59 |
+
0.6325461,112.727295,0.0089335935,-0.004204781,-12.970671,0.13425481,-112.61142,112.857346,10.285979,14.851138,0.33221596,-116.22283,-198.9915,25.137117,4.469312,-4.373122,236.9112,1090000
|
| 60 |
+
0.63822013,118.43169,0.009034493,0.0070778765,-11.716572,0.14792976,-118.325836,118.58669,30.750147,14.182797,1.3088117,-121.33264,-203.51306,44.932945,8.055429,-8.687659,228.93695,1095000
|
| 61 |
+
0.64747125,124.92998,0.009052215,-0.0042077187,-12.964828,0.1582554,-124.81262,125.08402,5.5732903,12.828023,-1.1521324,-127.44454,-199.26945,18.401314,4.5200167,-4.446531,223.49661,1100000
|
| 62 |
+
0.64335465,121.84859,0.009021789,0.0026992422,-12.200809,0.16838184,-121.73852,122.01967,4.8450027,10.828073,-7.1644588,-125.04272,-201.78134,15.673075,1.0276833,-0.8939016,122.46297,1105000
|
| 63 |
+
0.64151627,119.04775,0.009030964,-0.0011368113,-12.625879,0.14925756,-118.93373,119.19587,4.016229,10.710135,-4.4565725,-122.62154,-200.65144,14.726364,2.4761379,-2.431656,122.764626,1110000
|
| 64 |
+
0.63749737,120.244446,0.009051581,0.007823418,-11.635685,0.13484535,-120.13913,120.38711,4.380832,13.570641,-5.1136475,-123.3998,-203.47577,17.951473,3.0773797,-1.9099047,158.98387,1115000
|
| 65 |
+
0.63891244,118.42381,0.009246706,-0.00961116,-13.539414,0.16066878,-118.298615,118.57487,3.365495,12.731094,8.52302,-121.46726,-201.6844,16.09659,4.5901284,-4.738214,179.8122,1120000
|
| 66 |
+
0.6420221,120.63182,0.009095726,-0.0018284336,-12.701021,0.1754812,-120.5163,120.80547,4.330212,12.564938,5.0376577,-123.27093,-202.67134,16.89515,7.4697847,-7.610998,192.14871,1125000
|
| 67 |
+
0.6423286,114.55643,0.009202527,-0.0030562286,-12.832108,0.15021926,-114.43834,114.70359,3.213144,12.205401,-3.7241104,-117.61372,-205.366,15.418546,1.607938,-1.9042472,138.75562,1130000
|
| 68 |
+
0.64889014,114.322876,0.009080649,0.0048412243,-11.966864,0.16816385,-114.21421,114.49589,5.7513933,8.555379,9.515275,-117.60525,-204.43233,14.306772,4.8888164,-5.033836,172.1196,1135000
|
| 69 |
+
0.6442645,117.38443,0.0089912275,0.015409641,-10.786147,0.17976427,-117.287445,117.579605,4.4486814,11.413592,6.9388123,-120.49725,-200.15926,15.862274,4.9661474,-5.67609,176.9141,1140000
|
| 70 |
+
0.6399818,122.85323,0.00931683,-0.008391381,-13.400669,0.16647306,-122.72838,123.011314,3.9086087,11.265607,0.79158896,-126.007996,-199.69624,15.174215,3.1140208,-3.2011726,162.71822,1145000
|
| 71 |
+
0.6359494,114.36154,0.00895561,-0.0076191043,-13.350763,0.13642992,-114.24198,114.49035,11.5581875,12.212228,3.03378,-116.68398,-202.12794,23.770416,3.8421316,-5.139534,261.6341,1150000
|
| 72 |
+
0.6441986,119.64505,0.00900115,0.0061497735,-11.816779,0.16510203,-119.53868,119.8163,8.989821,14.263605,-3.288331,-122.018265,-200.61362,23.253426,2.8998253,-3.264515,213.27899,1155000
|
| 73 |
+
0.63930994,114.34569,0.008958736,-0.008404898,-13.438179,0.17461729,-114.22531,114.511894,5.8479123,12.458501,-0.9938708,-117.41206,-203.66331,18.306414,2.0447383,-2.4165726,185.13705,1160000
|
| 74 |
+
0.6435765,117.71646,0.0092446655,-0.0049175764,-13.031937,0.18249275,-117.59599,117.894035,2.6522443,13.453914,-2.4171164,-120.973564,-204.45055,16.106157,4.7511406,-4.8530803,165.42174,1165000
|
| 75 |
+
0.6441177,115.79048,0.008940378,0.0025394973,-12.215952,0.12301375,-115.68127,115.91604,3.191152,10.792172,3.3246257,-118.97512,-204.66556,13.983324,1.3016728,-0.9511538,120.95566,1170000
|
| 76 |
+
0.63996714,114.658325,0.008945248,-0.006444326,-13.220419,0.13263686,-114.54006,114.784515,5.6182294,12.919925,3.588457,-118.13485,-203.87958,18.538155,2.3675346,-2.4253607,175.35168,1175000
|
| 77 |
+
0.6472302,114.61462,0.008931046,0.008293083,-11.571432,0.16970901,-114.51126,114.79262,4.107263,10.300577,-1.297009,-117.15,-202.4347,14.407841,3.1233022,-2.330678,148.71701,1180000
|
| 78 |
+
0.63812673,117.321655,0.009025415,-0.019413298,-14.650959,0.1528407,-117.18942,117.45508,3.8654854,12.609277,0.16729374,-120.67201,-204.33228,16.474762,2.1686172,-2.2013063,163.2712,1185000
|
| 79 |
+
0.63457733,118.61914,0.008904741,-0.01680014,-14.386651,0.16019544,-118.49103,118.762535,4.7007265,14.521354,-0.11960555,-121.11697,-199.53914,19.22208,2.4849174,-3.4842577,194.86765,1190000
|
| 80 |
+
0.6419711,115.17522,0.009057091,-0.003061783,-12.838054,0.1581711,-115.058945,115.33033,4.0616336,12.323306,2.6754103,-118.43673,-201.73927,16.38494,3.7936509,-3.4912312,179.9932,1195000
|
| 81 |
+
0.6394017,113.08376,0.008952216,0.005153115,-11.924376,0.13653684,-112.97701,113.22545,5.434844,21.786493,-4.744319,-117.58152,-204.23679,27.221336,18.331938,-19.037392,352.15814,1200000
|
| 82 |
+
0.6452251,114.158646,0.009151237,0.0040949713,-12.052523,0.13933654,-114.04835,114.30208,4.7481875,10.679305,-1.9141788,-117.13181,-204.65437,15.427492,1.3316841,-1.379427,136.29532,1205000
|
| 83 |
+
0.6417044,117.31653,0.0088636195,0.0014102319,-12.340897,0.15411162,-117.207146,117.47205,4.457092,9.469447,-2.1437001,-120.07549,-200.9081,13.926538,3.9012382,-2.8173084,158.09586,1210000
|
| 84 |
+
0.6478798,111.687935,0.009085928,0.011598593,-11.223455,0.16143486,-111.58595,111.86097,6.0767236,12.375046,-4.426555,-114.31807,-200.4281,18.451769,3.427331,-2.909831,180.42212,1215000
|
| 85 |
+
0.6425679,113.764046,0.008899554,-0.009781246,-13.5990715,0.19986562,-113.64302,113.95413,5.080354,10.585074,0.78503126,-117.14629,-198.44113,15.665428,2.3134422,-2.6875365,159.91138,1220000
|
| 86 |
+
0.6483133,114.335915,0.008943102,0.004711091,-11.973215,0.15933302,-114.228836,114.499954,5.1511803,14.4333105,-6.565956,-117.49387,-205.42143,19.584492,5.421847,-4.9954576,216.45692,1225000
|
| 87 |
+
0.6500518,114.09095,0.008938311,0.0073450967,-11.678246,0.15606585,-113.986565,114.254364,3.8946435,14.421097,-4.813753,-117.46484,-198.62079,18.31574,3.3998652,-3.3849719,199.30556,1230000
|
| 88 |
+
0.654586,116.65885,0.0090113925,0.023943437,-9.842981,0.17528483,-116.57015,116.85808,4.5858417,12.052828,-10.10899,-117.87087,-204.42686,16.63867,1.6840478,-1.9306474,178.63008,1235000
|
| 89 |
+
0.63838553,107.77483,0.008940681,-0.0022575266,-12.752501,0.15575528,-107.66081,107.92833,5.176726,18.016459,-1.4063989,-110.79207,-204.96379,23.193184,2.993135,-3.0509832,202.66487,1240000
|
| 90 |
+
0.645451,117.234116,0.00907391,0.0056982967,-11.872013,0.14591734,-117.126396,117.385735,6.9706726,15.473946,-5.150408,-120.55778,-200.54639,22.444618,4.710768,-3.8986478,305.13263,1245000
|
| 91 |
+
0.64949185,110.87115,0.009087471,0.006438022,-11.79155,0.14777866,-110.76399,111.02537,5.3136725,13.25802,7.2506413,-113.72986,-208.58847,18.571693,2.6872373,-2.1588652,220.47086,1250000
|
| 92 |
+
0.6372615,117.17987,0.008921282,-0.0024610404,-12.775862,0.17742355,-117.065895,117.35483,5.0350966,12.602782,9.785912,-120.23745,-206.75592,17.637878,3.055278,-4.2225165,166.03589,1255000
|
| 93 |
+
0.65055084,110.43919,0.009024921,0.008213692,-11.589888,0.14858694,-110.334595,110.596,6.6452317,13.530911,-2.5738738,-113.08174,-203.25798,20.176144,5.2041273,-4.761938,221.09059,1260000
|
| 94 |
+
0.6435777,113.13107,0.00903432,-0.0023665358,-12.76195,0.1561312,-113.01578,113.284836,4.91951,14.443294,4.902821,-116.49963,-204.79015,19.362804,2.5970795,-2.689025,209.6231,1265000
|
| 95 |
+
0.64414823,108.17973,0.00913213,0.00499328,-11.953218,0.13622221,-108.07058,108.320946,3.720113,11.68262,2.335027,-110.92887,-200.20403,15.402733,4.2302055,-3.2527492,156.41862,1270000
|
| 96 |
+
0.6392997,110.40303,0.009118833,-0.00067598827,-12.574131,0.19309235,-110.288376,110.59544,6.030208,14.079801,1.1412252,-113.40552,-202.61775,20.110008,3.9566097,-3.446022,196.08131,1275000
|
| 97 |
+
0.6327103,112.52719,0.00886264,-0.004035678,-12.9553585,0.17756154,-112.41238,112.700714,5.0299544,12.811571,2.0910602,-115.87813,-204.64185,17.841526,2.0840948,-1.8709232,153.90244,1280000
|
| 98 |
+
0.63721836,111.99739,0.009156889,-0.00071136496,-12.577686,0.15725172,-111.88222,112.15393,4.3236184,14.843093,4.8121514,-113.69462,-204.43098,19.166712,2.3622663,-1.945218,173.32361,1285000
|
| 99 |
+
0.6413306,109.357574,0.009260495,-0.000783866,-12.584646,0.15024629,-109.241035,109.507034,6.104498,18.207094,-4.0980577,-112.131485,-202.13612,24.311592,6.4269576,-6.5627136,235.332,1290000
|
| 100 |
+
0.63601035,105.85593,0.009156147,-0.009152462,-13.499598,0.16604869,-105.732315,106.01282,9.187842,16.397789,-5.7188263,-109.06525,-208.11346,25.585632,2.1719406,-2.1633742,224.60982,1295000
|
| 101 |
+
0.6370215,105.81694,0.009157164,-0.0072517735,-13.2919235,0.16424513,-105.69522,105.97393,6.200055,13.875284,-2.6775959,-108.841064,-203.3774,20.07534,2.491329,-2.5157256,178.3866,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48166aeb681e44739cffa79406f05adf204cfa927ec986794847188dbef213ec
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cae334196d1e63212b2fb37c69bc21cff1cbb097f66ea7034530b7ba86ed63d
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c34bdaa77befe98a98a070516c33e1b7e14979154a82dd00a53125fd95c2e21
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f8e3b9d8811da5c1ee8e5082a5cec59dacd7b6bbc55ee5cd5d02d3fb593d443
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09f8b85ff2f43bd1a523bf403b8112066f95cb94a966c51a17950648ed9b41c6
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31430896fd53f0d48b97eb82660448b3d3e2595aa69e008bfa5ab47c1ff8baf2
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_1300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14a74633ec4774b591b4a464e5467675e9fe7fa774e7e4cb644cd3c19593fea3
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5cd781ea19b38017180295b7f997c9a635659c7e082291053d0545da7aa3f30f
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3ced43df9086341492b11325c70209b92892ee9a2d3b50ee0c2fc2ec687ec4f
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:403dd687169192386c65f06e9d5ee1cb9fd2997e308837dc233539590348743a
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_095711/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/flxin00z
|