Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/env.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_450000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_500000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.1028424364196591,0.0006273020790528771,-0.10273438129371823,0.0024887501005695645,15.838186445072933,49.289000000014966,0.02,25337.8,-0.98,-984.44,983.78,2.9349680519104004,450000
|
| 3 |
+
0.0,0.0,-0.10295276606487938,-0.003251146774002188,-0.10308446640593916,-0.0033358566091565454,27.70901364389337,50.10000000001527,0.0,76689.0,-1.0,-1000.0,1000.0,3.180800347328186,500000
|
| 4 |
+
0.0,0.0,-0.09448511884491151,-0.004255320533913187,-0.0947207782006742,-0.004382917356270594,28.200361386107303,49.21000000001495,0.02,127816.8,-1.0,-990.16,982.2,3.15831573009491,550000
|
| 5 |
+
0.0,0.0,-0.11531461727539216,-0.000932228817201221,-0.1153848577947184,-0.0011909701394915812,20.141176545456894,50.10000000001527,0.0,179799.0,-1.1,-1058.54,1000.0,3.140068144798279,600000
|
| 6 |
+
0.0,0.0,-0.10771217592050929,-0.0011199772490169636,-0.10779621596454178,-0.0014005623890072255,25.293958552369077,50.10000000001527,0.0,231799.0,-1.0,-1000.0,1000.0,3.207478232383728,650000
|
| 7 |
+
0.0,0.0,-0.1041154077641363,-0.001565134628380042,-0.10424467148153228,-0.0028695218048973557,27.95941049496263,49.17200000001496,0.02,282926.68,-1.0,-997.04,981.44,3.162386598587036,700000
|
| 8 |
+
0.0,0.0,-0.09960844059118928,-0.0008653899334400333,-0.09965596559983585,-0.001169801064049342,19.619013764817993,50.10000000001527,0.0,334871.0,-1.1,-1042.04,1000.0,3.130853323936462,750000
|
| 9 |
+
0.0,0.0,-0.10089200077659036,-0.0009741722139127479,-0.10094130733478125,-0.0010248350483280395,28.69760435633301,50.10000000001527,0.0,386871.0,-1.02,-1019.64,1000.0,3.224875774383545,800000
|
| 10 |
+
0.0,0.0,-0.11823973629228174,-0.0015011109408926315,-0.11837097787538417,-0.0025984699626976065,27.223505836306494,50.10000000001527,0.0,438871.0,-1.02,-1003.84,1000.0,3.210327482223511,850000
|
| 11 |
+
0.0,0.0,-0.12678478700237106,-0.0012893313403210893,-0.12685057239090872,-0.001341709767863316,22.824835970341667,49.34300000001498,0.02,490431.94,-1.04,-1024.48,984.86,3.1338221502304076,900000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.1028424364196591,0.0006273020790528771,-0.10273438129371823,0.0024887501005695645,15.838186445072933,49.289000000014966,0.02,25337.8,-0.98,-984.44,983.78,2.9349680519104004,450000
|
| 3 |
+
0.0,0.0,-0.10295276606487938,-0.003251146774002188,-0.10308446640593916,-0.0033358566091565454,27.70901364389337,50.10000000001527,0.0,76689.0,-1.0,-1000.0,1000.0,3.180800347328186,500000
|
| 4 |
+
0.0,0.0,-0.09448511884491151,-0.004255320533913187,-0.0947207782006742,-0.004382917356270594,28.200361386107303,49.21000000001495,0.02,127816.8,-1.0,-990.16,982.2,3.15831573009491,550000
|
| 5 |
+
0.0,0.0,-0.11531461727539216,-0.000932228817201221,-0.1153848577947184,-0.0011909701394915812,20.141176545456894,50.10000000001527,0.0,179799.0,-1.1,-1058.54,1000.0,3.140068144798279,600000
|
| 6 |
+
0.0,0.0,-0.10771217592050929,-0.0011199772490169636,-0.10779621596454178,-0.0014005623890072255,25.293958552369077,50.10000000001527,0.0,231799.0,-1.0,-1000.0,1000.0,3.207478232383728,650000
|
| 7 |
+
0.0,0.0,-0.1041154077641363,-0.001565134628380042,-0.10424467148153228,-0.0028695218048973557,27.95941049496263,49.17200000001496,0.02,282926.68,-1.0,-997.04,981.44,3.162386598587036,700000
|
| 8 |
+
0.0,0.0,-0.09960844059118928,-0.0008653899334400333,-0.09965596559983585,-0.001169801064049342,19.619013764817993,50.10000000001527,0.0,334871.0,-1.1,-1042.04,1000.0,3.130853323936462,750000
|
| 9 |
+
0.0,0.0,-0.10089200077659036,-0.0009741722139127479,-0.10094130733478125,-0.0010248350483280395,28.69760435633301,50.10000000001527,0.0,386871.0,-1.02,-1019.64,1000.0,3.224875774383545,800000
|
| 10 |
+
0.0,0.0,-0.11823973629228174,-0.0015011109408926315,-0.11837097787538417,-0.0025984699626976065,27.223505836306494,50.10000000001527,0.0,438871.0,-1.02,-1003.84,1000.0,3.210327482223511,850000
|
| 11 |
+
0.0,0.0,-0.12678478700237106,-0.0012893313403210893,-0.12685057239090872,-0.001341709767863316,22.824835970341667,49.34300000001498,0.02,490431.94,-1.04,-1024.48,984.86,3.1338221502304076,900000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.65777576,286.2387,0.0043688696,-0.0058244374,-13.833168,0.19124553,-286.17825,286.42413,4.602918,37.411324,-113.48078,-287.4548,-302.93402,42.01424,9.782691,-9.395115,332.65448,405000
|
| 3 |
+
0.66484314,283.14642,0.004531941,0.0043779872,-11.533971,0.18151787,-283.09412,283.3323,2.4132216,5.800167,-153.34193,-283.94492,-302.7867,8.213388,4.3679423,-3.061497,165.07124,410000
|
| 4 |
+
0.643561,279.89133,0.004328691,-0.0022389041,-13.017224,0.22689164,-279.83496,280.116,1.9741777,5.404739,-103.43752,-280.62515,-302.8149,7.3789167,0.5338774,-0.6207844,76.24657,415000
|
| 5 |
+
0.6515242,285.9378,0.004074832,0.00044677674,-12.390357,0.17150408,-285.88727,286.10977,2.0441465,4.975637,-172.43262,-287.1694,-302.6491,7.0197835,2.021884,-1.6794242,97.16882,420000
|
| 6 |
+
0.6425659,282.19733,0.004221519,-0.009844476,-14.831975,0.21109831,-282.13474,282.39856,1.7567666,4.736975,-105.97365,-283.63388,-302.80106,6.493742,0.65635586,-0.5470581,71.83242,425000
|
| 7 |
+
0.66511166,282.87598,0.0040940875,0.0060505406,-11.022127,0.20757331,-282.83087,283.0896,1.5211914,3.6555498,1.2542198,-283.83527,-302.59045,5.176741,0.68858814,-0.69464165,66.58798,430000
|
| 8 |
+
0.66057,287.1335,0.0040622465,0.0049433047,-11.283111,0.17368807,-287.0877,287.31213,1.5880116,5.4547105,-103.27681,-287.57407,-302.7342,7.042722,0.7526107,-0.8434743,93.1994,435000
|
| 9 |
+
0.6639598,282.2492,0.0044977623,0.0016852883,-12.125305,0.20861104,-282.19464,282.4595,1.7928759,7.9227877,-101.89276,-282.68555,-302.28278,9.715664,3.8086073,-3.652063,120.84007,440000
|
| 10 |
+
0.6579338,282.69128,0.0043312325,0.0016745145,-12.113386,0.19922689,-282.6388,282.89218,1.3764117,3.9846294,-99.808365,-283.4558,-302.87305,5.361041,0.406014,-0.47376734,67.75493,445000
|
| 11 |
+
0.6635614,281.38623,0.004240995,0.006134044,-11.053631,0.1747652,-281.33936,281.56714,1.3687917,4.217381,-101.21222,-282.17776,-303.3144,5.5861726,0.6727085,-0.5703892,68.9735,450000
|
| 12 |
+
0.6473163,281.2316,0.0042631337,-0.0010573512,-12.748022,0.17549762,-281.17725,281.40604,2.03662,4.2015047,-101.570625,-282.40558,-302.8451,6.238125,1.9957787,-1.8035789,104.21101,455000
|
| 13 |
+
0.6588652,281.46906,0.004131644,-0.001490058,-12.860645,0.20731878,-281.41592,281.67487,1.9008435,4.5409293,-101.35432,-282.48178,-302.74652,6.441773,1.2861012,-0.83129036,90.13878,460000
|
| 14 |
+
0.6555925,283.30344,0.0040887324,0.00067760027,-12.334276,0.1872018,-283.253,283.4913,1.6134785,4.8648124,-101.340965,-284.35455,-302.71185,6.478291,0.65421987,-0.5702749,81.90708,465000
|
| 15 |
+
0.64430267,275.83557,0.0039874366,-0.00028204743,-12.570734,0.1989052,-275.78546,276.0342,2.2736754,4.6226892,-99.96793,-276.99918,-303.04764,6.8963647,1.0704606,-0.77871346,84.70085,470000
|
| 16 |
+
0.6424428,274.75723,0.0043020886,-0.015211099,-16.035748,0.19362412,-274.68826,274.93567,4.8248057,8.5596,-37.053986,-275.88913,-302.26834,13.384405,2.7987986,-2.733929,185.2145,475000
|
| 17 |
+
0.6428447,276.01517,0.0041619227,-0.017834926,-16.785261,0.19927755,-275.9453,276.19662,2.0736983,4.9688888,-101.277885,-277.2692,-302.4938,7.0425873,0.5188356,-0.48158282,74.978134,480000
|
| 18 |
+
0.6527853,278.3581,0.004348925,-0.00037986983,-12.587348,0.16083136,-278.30338,278.51855,1.9322634,6.7203,-69.89604,-279.1411,-302.2465,8.652563,1.1990683,-0.81142724,94.71803,485000
|
| 19 |
+
0.64392287,278.38773,0.004257482,-0.002514538,-13.090616,0.18314369,-278.33197,278.56836,1.7886165,7.594345,-100.31534,-279.3383,-302.15817,9.382961,0.5245527,-0.5821067,74.75274,490000
|
| 20 |
+
0.65475404,278.48904,0.0042512827,-0.0004662733,-12.609678,0.18878198,-278.43542,278.67737,1.6314347,3.5924385,-100.64765,-279.44278,-302.53516,5.223873,0.51113063,-0.43821287,66.75864,495000
|
| 21 |
+
0.6398633,275.591,0.0041859993,-0.011196487,-15.1747465,0.1862495,-275.5275,275.76605,1.813138,6.487021,-101.16662,-277.05942,-302.3382,8.300159,2.4702225,-2.3254802,98.488754,500000
|
| 22 |
+
0.66557217,278.42065,0.0043634693,0.004410434,-11.489237,0.21572632,-278.37054,278.6408,1.9359106,4.155012,-101.23635,-279.59732,-302.62888,6.090923,0.69092953,-0.87205356,69.88994,505000
|
| 23 |
+
0.6497343,278.6211,0.0042842436,-0.004876799,-13.63831,0.21381727,-278.56268,278.83002,1.9659092,4.518036,-100.417725,-279.53452,-302.22247,6.483945,0.44262838,-0.4729781,70.45741,510000
|
| 24 |
+
0.6316272,275.14636,0.0041847,-0.010805198,-15.082072,0.18401146,-275.08325,275.31958,1.8957462,14.241051,-100.4533,-276.48874,-302.17874,16.136797,3.9939694,-4.0240393,142.66756,515000
|
| 25 |
+
0.65047467,272.76514,0.0041568116,0.0049227513,-11.315739,0.17586342,-272.71808,272.94592,1.5557191,4.8189883,-100.545845,-273.17023,-302.53656,6.374707,0.64840984,-0.64553905,84.06355,520000
|
| 26 |
+
0.6751094,279.9757,0.00397356,0.012152452,-9.441671,0.17466286,-279.93817,280.1625,2.0324066,4.5430946,-100.53836,-280.56866,-302.55136,6.5755014,2.9621282,-1.4267627,104.70213,525000
|
| 27 |
+
0.6623017,276.56177,0.0041829324,0.0044278903,-11.441439,0.20019893,-276.51392,276.7664,1.417243,3.9836583,-100.28535,-277.8501,-302.89606,5.4009013,0.46793902,-0.62123984,66.47359,530000
|
| 28 |
+
0.65802926,277.88666,0.003913545,0.0060008494,-10.966646,0.20672569,-277.84375,278.0994,1.4917208,3.6354127,-100.80983,-278.83075,-302.65198,5.1271334,0.75008625,-0.37577063,67.51988,535000
|
| 29 |
+
0.6569367,274.08795,0.004175057,0.0038323451,-11.582086,0.17079502,-274.03958,274.2626,1.3122361,3.0053673,-100.66043,-274.64902,-302.482,4.317603,0.3310232,-0.46320003,52.036034,540000
|
| 30 |
+
0.65817845,271.922,0.00382845,0.0068464377,-10.711695,0.18750855,-271.88098,272.11633,1.6439565,5.2958293,-100.547646,-272.92545,-302.5723,6.939786,0.50153345,-0.4963703,76.523926,545000
|
| 31 |
+
0.65229857,277.7599,0.0038073722,0.0019307988,-11.992879,0.17290005,-277.71423,277.93472,2.6405149,5.448932,-100.531136,-278.3386,-302.37842,8.089447,2.4758358,-2.406524,127.93605,550000
|
| 32 |
+
0.6614218,275.8272,0.0042680884,-0.00076824095,-12.6799965,0.19097953,-275.77307,276.01743,1.4471179,4.802998,-100.81175,-276.54965,-302.13907,6.250116,0.42075124,-0.3630106,64.66987,555000
|
| 33 |
+
0.6545285,270.812,0.0037861483,0.0015348442,-12.094616,0.18350247,-270.76617,270.99704,1.4305108,5.1155167,-100.44838,-271.8216,-302.9296,6.546027,0.6285704,-0.38880485,70.41169,560000
|
| 34 |
+
0.6525392,271.52573,0.0038975405,0.0021965667,-11.936422,0.18933354,-271.47925,271.71725,2.0557783,4.466287,-100.448814,-272.64352,-302.3297,6.522065,0.8171565,-0.46863696,79.12474,565000
|
| 35 |
+
0.6585264,271.02734,0.0040647658,0.008208976,-10.480455,0.186795,-270.98474,271.22235,4.145801,7.472179,-100.539024,-272.04388,-302.25824,11.61798,2.0519223,-2.4369524,108.6438,570000
|
| 36 |
+
0.65001523,272.44867,0.003920929,0.00097212923,-12.252067,0.20315096,-272.40063,272.6528,1.5633615,11.126044,-100.60723,-273.54147,-302.484,12.689405,3.3422155,-3.1536455,159.47836,575000
|
| 37 |
+
0.6409866,273.25018,0.0038908762,-0.0117652975,-15.523817,0.17622308,-273.18976,273.4146,1.2775005,3.8822,-100.74821,-274.26022,-303.3022,5.1597004,0.47107258,-0.3467852,61.2726,580000
|
| 38 |
+
0.65693295,267.84805,0.004030488,-0.00027664402,-12.568638,0.1804011,-267.79736,268.02817,1.7190441,3.7835464,-99.949,-268.3449,-302.4153,5.5025907,0.6766064,-0.5834172,67.20445,585000
|
| 39 |
+
0.6527162,268.68372,0.0039267815,0.0026871618,-11.815683,0.18157864,-268.63733,268.86798,1.1164014,4.0748825,-100.643005,-269.39127,-302.13397,5.191284,0.71636075,-0.6906779,66.9693,590000
|
| 40 |
+
0.6490048,275.9734,0.003846571,-0.005001079,-13.800139,0.1799522,-275.9203,276.14835,1.3044199,3.7203126,-100.53833,-276.7446,-302.30365,5.0247326,0.47455654,-0.35491484,54.020584,595000
|
| 41 |
+
0.6517196,268.56226,0.0038112083,-0.003648754,-13.457375,0.20605221,-268.511,268.76465,2.0356777,4.4876266,-100.305046,-268.9824,-302.174,6.523304,0.8562514,-0.82949954,89.4772,600000
|
| 42 |
+
0.64766836,267.204,0.003849377,-0.0017338342,-12.950419,0.18489233,-267.15414,267.38718,1.2699257,4.0045724,-100.58731,-267.83936,-302.1232,5.274498,0.6556224,-0.6897132,68.82459,605000
|
| 43 |
+
0.64823544,270.76212,0.0038195702,-0.00084718375,-12.721801,0.18055418,-270.71353,270.9418,1.3690509,4.654655,-100.53259,-271.8281,-302.02383,6.023706,0.7471346,-0.43228492,65.30638,610000
|
| 44 |
+
0.65005064,267.5726,0.0036858406,-0.0011888848,-12.822555,0.1709446,-267.52536,267.74237,1.1079116,20.612848,-100.15631,-268.2735,-302.13718,21.72076,1.4232594,-1.3864632,83.2501,615000
|
| 45 |
+
0.6538719,272.15735,0.0037565322,0.00036914166,-12.401733,0.17873988,-272.11075,272.33646,1.1421475,3.6426377,-100.512474,-272.8609,-302.1668,4.7847853,0.42237765,-0.48748362,54.842216,620000
|
| 46 |
+
0.6558896,273.50537,0.00387492,-0.0005050039,-12.630326,0.16236824,-273.45642,273.6672,1.1954454,3.6211011,-100.5661,-274.34946,-302.34454,4.8165464,0.34171605,-0.34527758,52.290237,625000
|
| 47 |
+
0.66177267,273.48633,0.003974191,-0.0013489515,-12.839428,0.15773506,-273.4353,273.64273,1.7578983,4.0835757,-99.97734,-274.7754,-302.42227,5.841474,0.44704354,-0.38047028,62.909954,630000
|
| 48 |
+
0.65872467,271.05377,0.003778132,0.008597666,-10.22436,0.16912341,-271.01517,271.2315,1.9143807,6.115305,-38.161705,-271.2909,-302.16403,8.029686,0.6697246,-0.72154343,99.265594,635000
|
| 49 |
+
0.65310025,273.35004,0.003728637,-0.0055427602,-13.986538,0.181842,-273.29785,273.52634,1.4231325,4.4647956,-100.741554,-274.40698,-302.48495,5.887928,0.52856183,-0.52045035,70.89748,640000
|
| 50 |
+
0.6523478,266.24347,0.003839018,-0.00015777092,-12.541097,0.1744662,-266.1953,266.4178,0.86750776,3.2324586,-100.2193,-266.71497,-302.16107,4.0999665,0.41854823,-0.7575118,58.506126,645000
|
| 51 |
+
0.6763391,275.19373,0.0037004182,0.008222245,-10.278023,0.19382495,-275.1557,275.39575,1.5847858,4.114941,-100.56127,-276.22803,-302.33795,5.699727,4.124382,-3.8501616,118.24188,650000
|
| 52 |
+
0.64919144,268.31848,0.0036250544,0.0013892372,-12.116768,0.19212562,-268.27454,268.51202,1.1010379,3.3499253,-100.654236,-269.2237,-302.44778,4.450963,0.55497086,-0.38480103,53.815643,655000
|
| 53 |
+
0.6563669,267.503,0.0037328051,0.0034577048,-11.573698,0.19734704,-267.4598,267.7038,1.3870534,9.1251135,-100.504524,-267.77884,-302.3812,10.512167,3.486534,-3.1588726,183.43533,660000
|
| 54 |
+
0.6524409,268.08008,0.003985536,-0.0036084177,-13.405378,0.18119828,-268.02664,268.2577,1.1264433,3.8177202,-100.65399,-269.4706,-302.13928,4.9441633,0.5961592,-0.4595372,62.192085,665000
|
| 55 |
+
0.65943694,273.08978,0.00391928,-0.0048394836,-13.734789,0.18334374,-273.03598,273.26828,1.503837,4.8108644,-100.29718,-273.9697,-302.34665,6.3147016,3.633148,-4.1283636,116.25984,670000
|
| 56 |
+
0.656742,265.07684,0.0037997148,0.00010089804,-12.473446,0.1899961,-265.02945,265.26694,1.2707785,5.387325,-48.535477,-266.2669,-302.3441,6.6581035,0.70949894,-0.4192162,64.572556,675000
|
| 57 |
+
0.6697962,265.18674,0.003803253,0.008380855,-10.296398,0.16795674,-265.14758,265.3631,0.9197872,3.450071,-100.51791,-266.16718,-302.23373,4.3698583,0.42152536,-0.3579899,50.63488,680000
|
| 58 |
+
0.6440201,270.4571,0.003869318,-0.0042481036,-13.597895,0.16984355,-270.40448,270.62268,1.1417674,11.121091,-100.32641,-271.36017,-302.17673,12.262858,1.364107,-1.1989826,106.812035,685000
|
| 59 |
+
0.6490077,263.78864,0.0040109647,-0.002149289,-13.035853,0.17247106,-263.7364,263.95898,1.7137526,3.6669495,-100.10452,-264.78525,-302.10388,5.380702,0.41188216,-0.65329564,62.04017,690000
|
| 60 |
+
0.66502243,271.4598,0.0038012879,0.0036772846,-11.532621,0.19362207,-271.41602,271.6571,1.149114,3.1761587,-100.3217,-272.1019,-302.4118,4.3252726,0.5353682,-0.6744158,59.68843,695000
|
| 61 |
+
0.6628389,265.97748,0.0037018105,0.011503729,-9.392405,0.20553851,-265.94272,266.19452,1.1232303,6.082333,-100.14306,-266.96494,-302.2301,7.2055635,1.2801148,-0.54911005,79.049805,700000
|
| 62 |
+
0.66792524,265.12756,0.0038155124,0.005728883,-10.9985285,0.18945515,-265.08557,265.32275,1.2316157,3.2707543,-98.32225,-265.76373,-302.69815,4.50237,0.3399579,-0.3367729,51.45264,705000
|
| 63 |
+
0.65584743,262.99445,0.0037476528,-0.00095978705,-12.7561035,0.16650872,-262.94666,263.16,1.2919266,3.3655548,-55.11795,-263.8392,-302.3269,4.657481,0.34141415,-0.3343301,50.006203,710000
|
| 64 |
+
0.65781385,259.23697,0.004057475,0.002293327,-11.93479,0.17323872,-259.18857,259.4125,1.7178026,5.7142224,-100.24843,-259.86807,-302.07547,7.432025,0.5878282,-0.7405029,72.844025,715000
|
| 65 |
+
0.6600269,255.67462,0.0036932188,0.007837795,-10.377788,0.16907993,-255.63629,255.85155,1.1016797,3.278366,-100.42798,-256.34814,-302.1751,4.380046,0.32970732,-0.37303326,48.506794,720000
|
| 66 |
+
0.6439877,267.15875,0.0035645133,-0.004540674,-13.773855,0.16080952,-267.10965,267.315,2.9271188,11.985636,-100.37282,-268.24445,-302.2857,14.912754,0.8882229,-1.1268097,98.02903,725000
|
| 67 |
+
0.6611746,262.95074,0.003585592,0.0007371388,-12.294416,0.18381852,-262.90665,263.13528,2.0847604,6.941232,-100.59156,-264.19943,-302.11478,9.025992,4.4490647,-4.5494156,198.22101,730000
|
| 68 |
+
0.6635295,260.92734,0.0036617604,-0.00085690507,-12.7340145,0.17437458,-260.88068,261.10086,1.3609599,5.3552785,-100.43349,-261.47186,-301.94196,6.7162385,1.2968422,-1.1850786,80.013275,735000
|
| 69 |
+
0.66503507,268.88138,0.0035477157,0.0075655635,-10.367483,0.15755492,-268.8446,269.0465,1.1212142,2.8344,-100.381294,-269.72745,-302.0661,3.955614,0.39808416,-0.3757504,48.217247,740000
|
| 70 |
+
0.6468453,269.77673,0.0034535185,-0.0055961586,-14.120422,0.1690745,-269.72797,269.94022,1.3196585,3.320074,-100.22369,-270.5367,-302.3597,4.6397324,0.42696238,-0.5635065,60.867455,745000
|
| 71 |
+
0.66062003,262.29077,0.003431902,0.0031096244,-11.593906,0.14026155,-262.25098,262.43414,1.1611735,6.9319696,-100.48274,-263.16385,-302.89093,8.093143,2.4940248,-2.4175303,91.06827,750000
|
| 72 |
+
0.6521812,263.2069,0.0035675808,-0.0037251487,-13.544167,0.17847559,-263.1586,263.38165,1.6038483,4.2804146,-100.21178,-264.4099,-302.04803,5.884263,0.50776553,-0.69809747,63.90651,755000
|
| 73 |
+
0.6550729,263.37164,0.0034771895,0.0007491084,-12.284565,0.19373032,-263.32892,263.56613,3.674694,5.508619,-100.48436,-264.32257,-302.1228,9.183313,1.1618555,-1.0039964,101.96025,760000
|
| 74 |
+
0.6751434,265.93674,0.0037625018,0.0064296117,-10.791134,0.16954145,-265.89612,266.11273,1.2753996,2.9756002,-100.59431,-266.753,-302.2741,4.251,0.4560074,-0.5010601,51.591515,765000
|
| 75 |
+
0.6569673,257.816,0.003460145,-0.0013516918,-12.890646,0.17219272,-257.77142,257.98685,1.1579093,3.263764,-100.44112,-258.47635,-302.20847,4.4216733,0.34097916,-0.31973374,53.43991,770000
|
| 76 |
+
0.65126264,267.30176,0.0035468938,-0.005020387,-13.915432,0.1724834,-267.25238,267.4692,1.2050211,6.4175262,-100.31884,-268.16153,-302.67633,7.622547,1.3974489,-0.5807275,61.15274,775000
|
| 77 |
+
0.64933974,262.57587,0.0036670705,0.002783687,-11.740896,0.1734583,-262.5328,262.7521,0.99861974,3.0345356,-100.5672,-263.18887,-302.0209,4.0331554,0.454913,-0.3298229,46.647137,780000
|
| 78 |
+
0.6530802,263.2072,0.0036270118,-0.0060099917,-14.157009,0.18896875,-263.15588,263.39017,1.3061988,4.6743255,-50.955795,-263.9532,-301.96115,5.980524,1.8295739,-1.6879585,64.47211,785000
|
| 79 |
+
0.6821132,257.26736,0.0037291618,0.010791679,-9.606138,0.18600953,-257.23157,257.46417,1.5925318,2.982882,-97.68749,-258.27206,-301.97418,4.5754137,0.42074943,-0.3942139,64.96476,790000
|
| 80 |
+
0.656937,262.6109,0.0035105157,0.0003288129,-12.406335,0.18733752,-262.56732,262.79858,1.3665179,3.3723373,-100.41332,-263.10297,-302.53564,4.7388554,0.41259122,-0.44608298,52.46952,795000
|
| 81 |
+
0.6651002,260.74304,0.0034826105,0.005621977,-10.8857,0.16495104,-260.70514,260.9136,1.1262925,3.447675,-100.48271,-261.54596,-302.26355,4.5739675,0.46754345,-0.42198122,56.593094,800000
|
| 82 |
+
0.6626007,262.56537,0.0034492463,0.009028436,-9.88249,0.17096968,-262.5313,262.74536,2.4560494,5.883519,-100.42192,-263.0576,-302.40768,8.339569,1.3391376,-1.5317918,108.66876,805000
|
| 83 |
+
0.65040284,262.90195,0.0036657767,-0.0066518276,-14.314575,0.18906927,-262.8495,263.08435,1.1653712,4.4891753,-100.32879,-264.2189,-302.20874,5.6545467,0.8205674,-0.49737954,59.52724,810000
|
| 84 |
+
0.66200024,254.8385,0.003358908,0.0029729162,-11.614916,0.17502092,-254.7995,255.0165,0.9564673,2.942375,-100.374916,-255.47868,-302.43347,3.8988423,0.38844615,-0.32686037,45.500137,815000
|
| 85 |
+
0.65247387,262.62796,0.003554384,-0.0023381982,-13.157835,0.17206821,-262.58118,262.79767,1.200571,3.5139275,-100.24698,-263.30447,-301.80292,4.7144985,0.50287116,-0.49398282,53.022915,820000
|
| 86 |
+
0.6472079,263.6805,0.0033900887,-0.0062039527,-14.330027,0.16103868,-263.63193,263.83536,1.0829505,3.4031022,-100.408646,-263.9637,-302.3506,4.4860525,0.545757,-0.8175769,69.36981,825000
|
| 87 |
+
0.6432897,259.8344,0.003343529,-0.007055955,-14.610332,0.16791373,-259.78558,259.99527,1.8657563,3.976806,-98.170586,-260.77182,-302.03766,5.842562,0.43746844,-0.4325712,62.178513,830000
|
| 88 |
+
0.65876114,257.61987,0.0035624162,0.0042539877,-11.30587,0.17628302,-257.5796,257.80038,1.4900447,3.5727441,-100.20424,-258.4614,-302.05002,5.062789,0.4323218,-0.4354363,59.789566,835000
|
| 89 |
+
0.6576915,256.4889,0.003284452,0.0041109747,-11.248353,0.17862049,-256.4519,256.67163,1.7968464,3.984544,-100.33307,-257.19537,-302.53012,5.78139,2.0300677,-3.127503,100.52718,840000
|
| 90 |
+
0.6739897,252.99161,0.0033698154,0.0039745094,-11.320556,0.16195339,-252.95346,253.15753,1.1821458,4.618448,-99.14985,-253.56815,-301.97662,5.8005934,0.5924565,-0.66367555,63.65896,845000
|
| 91 |
+
0.66595256,257.6371,0.0034139904,0.00392248,-11.351057,0.17194971,-257.59833,257.81296,0.9062449,5.726176,-100.10459,-258.43427,-301.95712,6.6324205,2.23449,-1.72801,76.319954,850000
|
| 92 |
+
0.6640179,259.6067,0.003487054,0.002478489,-11.789231,0.17143318,-259.56555,259.7806,1.03579,3.0446954,-100.39171,-260.4625,-302.19894,4.0804853,0.9403114,-0.9726518,57.67702,855000
|
| 93 |
+
0.663341,250.28857,0.0034744728,0.0029309767,-11.656425,0.15970895,-250.24808,250.45122,1.4705893,3.185194,-99.42021,-250.98824,-302.0316,4.655783,0.5012129,-0.3778851,57.934307,860000
|
| 94 |
+
0.65888673,254.44775,0.003422969,-0.0002585925,-12.575546,0.15801167,-254.4047,254.6055,1.1894253,3.4097638,-100.119316,-255.22978,-302.65915,4.5991893,0.52387774,-0.36910158,58.49611,865000
|
| 95 |
+
0.6471192,258.5127,0.0033797089,-0.004302591,-13.773066,0.1407532,-258.46616,258.64914,1.4127803,3.504381,-100.12853,-259.47037,-302.04263,4.917161,0.9715753,-0.9156258,58.372993,870000
|
| 96 |
+
0.66123503,253.9089,0.0033372215,-0.0042367354,-13.76954,0.15046579,-253.86293,254.05513,1.3206987,4.9679832,-100.22023,-254.50928,-302.02277,6.288682,1.6275266,-1.6369475,69.68054,875000
|
| 97 |
+
0.65092635,263.01294,0.0032300008,0.0026197336,-11.688937,0.19279438,-262.9752,263.20834,1.1386191,4.1485515,-100.345436,-264.04007,-302.20316,5.2871704,0.6521909,-0.69188774,68.239586,880000
|
| 98 |
+
0.6439127,262.289,0.0031453823,-0.003293008,-13.546934,0.14439304,-262.2464,262.43008,2.1266446,5.9532905,-100.359276,-263.0424,-302.15247,8.079935,2.1435452,-1.5300612,89.26518,885000
|
| 99 |
+
0.64830166,254.85828,0.0034362331,-0.006326792,-14.3412,0.17169482,-254.809,255.02364,1.0895646,6.4481707,-100.50789,-255.82706,-302.17038,7.537735,0.5981569,-1.183158,70.63412,890000
|
| 100 |
+
0.6574274,253.92728,0.0033766546,-0.0039003282,-13.6550865,0.15111661,-253.88116,254.0745,1.3703245,4.2046866,-100.36088,-254.9893,-301.72754,5.5750113,0.5531093,-0.39045647,63.31022,895000
|
| 101 |
+
0.6542596,260.48315,0.0033274668,-0.006377982,-14.416768,0.18010712,-260.43518,260.6569,1.3362123,4.3864913,-100.25507,-261.5942,-301.93683,5.7227035,0.45228893,-0.43879944,59.584667,900000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.65777576,286.2387,0.0043688696,-0.0058244374,-13.833168,0.19124553,-286.17825,286.42413,4.602918,37.411324,-113.48078,-287.4548,-302.93402,42.01424,9.782691,-9.395115,332.65448,405000
|
| 3 |
+
0.66484314,283.14642,0.004531941,0.0043779872,-11.533971,0.18151787,-283.09412,283.3323,2.4132216,5.800167,-153.34193,-283.94492,-302.7867,8.213388,4.3679423,-3.061497,165.07124,410000
|
| 4 |
+
0.643561,279.89133,0.004328691,-0.0022389041,-13.017224,0.22689164,-279.83496,280.116,1.9741777,5.404739,-103.43752,-280.62515,-302.8149,7.3789167,0.5338774,-0.6207844,76.24657,415000
|
| 5 |
+
0.6515242,285.9378,0.004074832,0.00044677674,-12.390357,0.17150408,-285.88727,286.10977,2.0441465,4.975637,-172.43262,-287.1694,-302.6491,7.0197835,2.021884,-1.6794242,97.16882,420000
|
| 6 |
+
0.6425659,282.19733,0.004221519,-0.009844476,-14.831975,0.21109831,-282.13474,282.39856,1.7567666,4.736975,-105.97365,-283.63388,-302.80106,6.493742,0.65635586,-0.5470581,71.83242,425000
|
| 7 |
+
0.66511166,282.87598,0.0040940875,0.0060505406,-11.022127,0.20757331,-282.83087,283.0896,1.5211914,3.6555498,1.2542198,-283.83527,-302.59045,5.176741,0.68858814,-0.69464165,66.58798,430000
|
| 8 |
+
0.66057,287.1335,0.0040622465,0.0049433047,-11.283111,0.17368807,-287.0877,287.31213,1.5880116,5.4547105,-103.27681,-287.57407,-302.7342,7.042722,0.7526107,-0.8434743,93.1994,435000
|
| 9 |
+
0.6639598,282.2492,0.0044977623,0.0016852883,-12.125305,0.20861104,-282.19464,282.4595,1.7928759,7.9227877,-101.89276,-282.68555,-302.28278,9.715664,3.8086073,-3.652063,120.84007,440000
|
| 10 |
+
0.6579338,282.69128,0.0043312325,0.0016745145,-12.113386,0.19922689,-282.6388,282.89218,1.3764117,3.9846294,-99.808365,-283.4558,-302.87305,5.361041,0.406014,-0.47376734,67.75493,445000
|
| 11 |
+
0.6635614,281.38623,0.004240995,0.006134044,-11.053631,0.1747652,-281.33936,281.56714,1.3687917,4.217381,-101.21222,-282.17776,-303.3144,5.5861726,0.6727085,-0.5703892,68.9735,450000
|
| 12 |
+
0.6473163,281.2316,0.0042631337,-0.0010573512,-12.748022,0.17549762,-281.17725,281.40604,2.03662,4.2015047,-101.570625,-282.40558,-302.8451,6.238125,1.9957787,-1.8035789,104.21101,455000
|
| 13 |
+
0.6588652,281.46906,0.004131644,-0.001490058,-12.860645,0.20731878,-281.41592,281.67487,1.9008435,4.5409293,-101.35432,-282.48178,-302.74652,6.441773,1.2861012,-0.83129036,90.13878,460000
|
| 14 |
+
0.6555925,283.30344,0.0040887324,0.00067760027,-12.334276,0.1872018,-283.253,283.4913,1.6134785,4.8648124,-101.340965,-284.35455,-302.71185,6.478291,0.65421987,-0.5702749,81.90708,465000
|
| 15 |
+
0.64430267,275.83557,0.0039874366,-0.00028204743,-12.570734,0.1989052,-275.78546,276.0342,2.2736754,4.6226892,-99.96793,-276.99918,-303.04764,6.8963647,1.0704606,-0.77871346,84.70085,470000
|
| 16 |
+
0.6424428,274.75723,0.0043020886,-0.015211099,-16.035748,0.19362412,-274.68826,274.93567,4.8248057,8.5596,-37.053986,-275.88913,-302.26834,13.384405,2.7987986,-2.733929,185.2145,475000
|
| 17 |
+
0.6428447,276.01517,0.0041619227,-0.017834926,-16.785261,0.19927755,-275.9453,276.19662,2.0736983,4.9688888,-101.277885,-277.2692,-302.4938,7.0425873,0.5188356,-0.48158282,74.978134,480000
|
| 18 |
+
0.6527853,278.3581,0.004348925,-0.00037986983,-12.587348,0.16083136,-278.30338,278.51855,1.9322634,6.7203,-69.89604,-279.1411,-302.2465,8.652563,1.1990683,-0.81142724,94.71803,485000
|
| 19 |
+
0.64392287,278.38773,0.004257482,-0.002514538,-13.090616,0.18314369,-278.33197,278.56836,1.7886165,7.594345,-100.31534,-279.3383,-302.15817,9.382961,0.5245527,-0.5821067,74.75274,490000
|
| 20 |
+
0.65475404,278.48904,0.0042512827,-0.0004662733,-12.609678,0.18878198,-278.43542,278.67737,1.6314347,3.5924385,-100.64765,-279.44278,-302.53516,5.223873,0.51113063,-0.43821287,66.75864,495000
|
| 21 |
+
0.6398633,275.591,0.0041859993,-0.011196487,-15.1747465,0.1862495,-275.5275,275.76605,1.813138,6.487021,-101.16662,-277.05942,-302.3382,8.300159,2.4702225,-2.3254802,98.488754,500000
|
| 22 |
+
0.66557217,278.42065,0.0043634693,0.004410434,-11.489237,0.21572632,-278.37054,278.6408,1.9359106,4.155012,-101.23635,-279.59732,-302.62888,6.090923,0.69092953,-0.87205356,69.88994,505000
|
| 23 |
+
0.6497343,278.6211,0.0042842436,-0.004876799,-13.63831,0.21381727,-278.56268,278.83002,1.9659092,4.518036,-100.417725,-279.53452,-302.22247,6.483945,0.44262838,-0.4729781,70.45741,510000
|
| 24 |
+
0.6316272,275.14636,0.0041847,-0.010805198,-15.082072,0.18401146,-275.08325,275.31958,1.8957462,14.241051,-100.4533,-276.48874,-302.17874,16.136797,3.9939694,-4.0240393,142.66756,515000
|
| 25 |
+
0.65047467,272.76514,0.0041568116,0.0049227513,-11.315739,0.17586342,-272.71808,272.94592,1.5557191,4.8189883,-100.545845,-273.17023,-302.53656,6.374707,0.64840984,-0.64553905,84.06355,520000
|
| 26 |
+
0.6751094,279.9757,0.00397356,0.012152452,-9.441671,0.17466286,-279.93817,280.1625,2.0324066,4.5430946,-100.53836,-280.56866,-302.55136,6.5755014,2.9621282,-1.4267627,104.70213,525000
|
| 27 |
+
0.6623017,276.56177,0.0041829324,0.0044278903,-11.441439,0.20019893,-276.51392,276.7664,1.417243,3.9836583,-100.28535,-277.8501,-302.89606,5.4009013,0.46793902,-0.62123984,66.47359,530000
|
| 28 |
+
0.65802926,277.88666,0.003913545,0.0060008494,-10.966646,0.20672569,-277.84375,278.0994,1.4917208,3.6354127,-100.80983,-278.83075,-302.65198,5.1271334,0.75008625,-0.37577063,67.51988,535000
|
| 29 |
+
0.6569367,274.08795,0.004175057,0.0038323451,-11.582086,0.17079502,-274.03958,274.2626,1.3122361,3.0053673,-100.66043,-274.64902,-302.482,4.317603,0.3310232,-0.46320003,52.036034,540000
|
| 30 |
+
0.65817845,271.922,0.00382845,0.0068464377,-10.711695,0.18750855,-271.88098,272.11633,1.6439565,5.2958293,-100.547646,-272.92545,-302.5723,6.939786,0.50153345,-0.4963703,76.523926,545000
|
| 31 |
+
0.65229857,277.7599,0.0038073722,0.0019307988,-11.992879,0.17290005,-277.71423,277.93472,2.6405149,5.448932,-100.531136,-278.3386,-302.37842,8.089447,2.4758358,-2.406524,127.93605,550000
|
| 32 |
+
0.6614218,275.8272,0.0042680884,-0.00076824095,-12.6799965,0.19097953,-275.77307,276.01743,1.4471179,4.802998,-100.81175,-276.54965,-302.13907,6.250116,0.42075124,-0.3630106,64.66987,555000
|
| 33 |
+
0.6545285,270.812,0.0037861483,0.0015348442,-12.094616,0.18350247,-270.76617,270.99704,1.4305108,5.1155167,-100.44838,-271.8216,-302.9296,6.546027,0.6285704,-0.38880485,70.41169,560000
|
| 34 |
+
0.6525392,271.52573,0.0038975405,0.0021965667,-11.936422,0.18933354,-271.47925,271.71725,2.0557783,4.466287,-100.448814,-272.64352,-302.3297,6.522065,0.8171565,-0.46863696,79.12474,565000
|
| 35 |
+
0.6585264,271.02734,0.0040647658,0.008208976,-10.480455,0.186795,-270.98474,271.22235,4.145801,7.472179,-100.539024,-272.04388,-302.25824,11.61798,2.0519223,-2.4369524,108.6438,570000
|
| 36 |
+
0.65001523,272.44867,0.003920929,0.00097212923,-12.252067,0.20315096,-272.40063,272.6528,1.5633615,11.126044,-100.60723,-273.54147,-302.484,12.689405,3.3422155,-3.1536455,159.47836,575000
|
| 37 |
+
0.6409866,273.25018,0.0038908762,-0.0117652975,-15.523817,0.17622308,-273.18976,273.4146,1.2775005,3.8822,-100.74821,-274.26022,-303.3022,5.1597004,0.47107258,-0.3467852,61.2726,580000
|
| 38 |
+
0.65693295,267.84805,0.004030488,-0.00027664402,-12.568638,0.1804011,-267.79736,268.02817,1.7190441,3.7835464,-99.949,-268.3449,-302.4153,5.5025907,0.6766064,-0.5834172,67.20445,585000
|
| 39 |
+
0.6527162,268.68372,0.0039267815,0.0026871618,-11.815683,0.18157864,-268.63733,268.86798,1.1164014,4.0748825,-100.643005,-269.39127,-302.13397,5.191284,0.71636075,-0.6906779,66.9693,590000
|
| 40 |
+
0.6490048,275.9734,0.003846571,-0.005001079,-13.800139,0.1799522,-275.9203,276.14835,1.3044199,3.7203126,-100.53833,-276.7446,-302.30365,5.0247326,0.47455654,-0.35491484,54.020584,595000
|
| 41 |
+
0.6517196,268.56226,0.0038112083,-0.003648754,-13.457375,0.20605221,-268.511,268.76465,2.0356777,4.4876266,-100.305046,-268.9824,-302.174,6.523304,0.8562514,-0.82949954,89.4772,600000
|
| 42 |
+
0.64766836,267.204,0.003849377,-0.0017338342,-12.950419,0.18489233,-267.15414,267.38718,1.2699257,4.0045724,-100.58731,-267.83936,-302.1232,5.274498,0.6556224,-0.6897132,68.82459,605000
|
| 43 |
+
0.64823544,270.76212,0.0038195702,-0.00084718375,-12.721801,0.18055418,-270.71353,270.9418,1.3690509,4.654655,-100.53259,-271.8281,-302.02383,6.023706,0.7471346,-0.43228492,65.30638,610000
|
| 44 |
+
0.65005064,267.5726,0.0036858406,-0.0011888848,-12.822555,0.1709446,-267.52536,267.74237,1.1079116,20.612848,-100.15631,-268.2735,-302.13718,21.72076,1.4232594,-1.3864632,83.2501,615000
|
| 45 |
+
0.6538719,272.15735,0.0037565322,0.00036914166,-12.401733,0.17873988,-272.11075,272.33646,1.1421475,3.6426377,-100.512474,-272.8609,-302.1668,4.7847853,0.42237765,-0.48748362,54.842216,620000
|
| 46 |
+
0.6558896,273.50537,0.00387492,-0.0005050039,-12.630326,0.16236824,-273.45642,273.6672,1.1954454,3.6211011,-100.5661,-274.34946,-302.34454,4.8165464,0.34171605,-0.34527758,52.290237,625000
|
| 47 |
+
0.66177267,273.48633,0.003974191,-0.0013489515,-12.839428,0.15773506,-273.4353,273.64273,1.7578983,4.0835757,-99.97734,-274.7754,-302.42227,5.841474,0.44704354,-0.38047028,62.909954,630000
|
| 48 |
+
0.65872467,271.05377,0.003778132,0.008597666,-10.22436,0.16912341,-271.01517,271.2315,1.9143807,6.115305,-38.161705,-271.2909,-302.16403,8.029686,0.6697246,-0.72154343,99.265594,635000
|
| 49 |
+
0.65310025,273.35004,0.003728637,-0.0055427602,-13.986538,0.181842,-273.29785,273.52634,1.4231325,4.4647956,-100.741554,-274.40698,-302.48495,5.887928,0.52856183,-0.52045035,70.89748,640000
|
| 50 |
+
0.6523478,266.24347,0.003839018,-0.00015777092,-12.541097,0.1744662,-266.1953,266.4178,0.86750776,3.2324586,-100.2193,-266.71497,-302.16107,4.0999665,0.41854823,-0.7575118,58.506126,645000
|
| 51 |
+
0.6763391,275.19373,0.0037004182,0.008222245,-10.278023,0.19382495,-275.1557,275.39575,1.5847858,4.114941,-100.56127,-276.22803,-302.33795,5.699727,4.124382,-3.8501616,118.24188,650000
|
| 52 |
+
0.64919144,268.31848,0.0036250544,0.0013892372,-12.116768,0.19212562,-268.27454,268.51202,1.1010379,3.3499253,-100.654236,-269.2237,-302.44778,4.450963,0.55497086,-0.38480103,53.815643,655000
|
| 53 |
+
0.6563669,267.503,0.0037328051,0.0034577048,-11.573698,0.19734704,-267.4598,267.7038,1.3870534,9.1251135,-100.504524,-267.77884,-302.3812,10.512167,3.486534,-3.1588726,183.43533,660000
|
| 54 |
+
0.6524409,268.08008,0.003985536,-0.0036084177,-13.405378,0.18119828,-268.02664,268.2577,1.1264433,3.8177202,-100.65399,-269.4706,-302.13928,4.9441633,0.5961592,-0.4595372,62.192085,665000
|
| 55 |
+
0.65943694,273.08978,0.00391928,-0.0048394836,-13.734789,0.18334374,-273.03598,273.26828,1.503837,4.8108644,-100.29718,-273.9697,-302.34665,6.3147016,3.633148,-4.1283636,116.25984,670000
|
| 56 |
+
0.656742,265.07684,0.0037997148,0.00010089804,-12.473446,0.1899961,-265.02945,265.26694,1.2707785,5.387325,-48.535477,-266.2669,-302.3441,6.6581035,0.70949894,-0.4192162,64.572556,675000
|
| 57 |
+
0.6697962,265.18674,0.003803253,0.008380855,-10.296398,0.16795674,-265.14758,265.3631,0.9197872,3.450071,-100.51791,-266.16718,-302.23373,4.3698583,0.42152536,-0.3579899,50.63488,680000
|
| 58 |
+
0.6440201,270.4571,0.003869318,-0.0042481036,-13.597895,0.16984355,-270.40448,270.62268,1.1417674,11.121091,-100.32641,-271.36017,-302.17673,12.262858,1.364107,-1.1989826,106.812035,685000
|
| 59 |
+
0.6490077,263.78864,0.0040109647,-0.002149289,-13.035853,0.17247106,-263.7364,263.95898,1.7137526,3.6669495,-100.10452,-264.78525,-302.10388,5.380702,0.41188216,-0.65329564,62.04017,690000
|
| 60 |
+
0.66502243,271.4598,0.0038012879,0.0036772846,-11.532621,0.19362207,-271.41602,271.6571,1.149114,3.1761587,-100.3217,-272.1019,-302.4118,4.3252726,0.5353682,-0.6744158,59.68843,695000
|
| 61 |
+
0.6628389,265.97748,0.0037018105,0.011503729,-9.392405,0.20553851,-265.94272,266.19452,1.1232303,6.082333,-100.14306,-266.96494,-302.2301,7.2055635,1.2801148,-0.54911005,79.049805,700000
|
| 62 |
+
0.66792524,265.12756,0.0038155124,0.005728883,-10.9985285,0.18945515,-265.08557,265.32275,1.2316157,3.2707543,-98.32225,-265.76373,-302.69815,4.50237,0.3399579,-0.3367729,51.45264,705000
|
| 63 |
+
0.65584743,262.99445,0.0037476528,-0.00095978705,-12.7561035,0.16650872,-262.94666,263.16,1.2919266,3.3655548,-55.11795,-263.8392,-302.3269,4.657481,0.34141415,-0.3343301,50.006203,710000
|
| 64 |
+
0.65781385,259.23697,0.004057475,0.002293327,-11.93479,0.17323872,-259.18857,259.4125,1.7178026,5.7142224,-100.24843,-259.86807,-302.07547,7.432025,0.5878282,-0.7405029,72.844025,715000
|
| 65 |
+
0.6600269,255.67462,0.0036932188,0.007837795,-10.377788,0.16907993,-255.63629,255.85155,1.1016797,3.278366,-100.42798,-256.34814,-302.1751,4.380046,0.32970732,-0.37303326,48.506794,720000
|
| 66 |
+
0.6439877,267.15875,0.0035645133,-0.004540674,-13.773855,0.16080952,-267.10965,267.315,2.9271188,11.985636,-100.37282,-268.24445,-302.2857,14.912754,0.8882229,-1.1268097,98.02903,725000
|
| 67 |
+
0.6611746,262.95074,0.003585592,0.0007371388,-12.294416,0.18381852,-262.90665,263.13528,2.0847604,6.941232,-100.59156,-264.19943,-302.11478,9.025992,4.4490647,-4.5494156,198.22101,730000
|
| 68 |
+
0.6635295,260.92734,0.0036617604,-0.00085690507,-12.7340145,0.17437458,-260.88068,261.10086,1.3609599,5.3552785,-100.43349,-261.47186,-301.94196,6.7162385,1.2968422,-1.1850786,80.013275,735000
|
| 69 |
+
0.66503507,268.88138,0.0035477157,0.0075655635,-10.367483,0.15755492,-268.8446,269.0465,1.1212142,2.8344,-100.381294,-269.72745,-302.0661,3.955614,0.39808416,-0.3757504,48.217247,740000
|
| 70 |
+
0.6468453,269.77673,0.0034535185,-0.0055961586,-14.120422,0.1690745,-269.72797,269.94022,1.3196585,3.320074,-100.22369,-270.5367,-302.3597,4.6397324,0.42696238,-0.5635065,60.867455,745000
|
| 71 |
+
0.66062003,262.29077,0.003431902,0.0031096244,-11.593906,0.14026155,-262.25098,262.43414,1.1611735,6.9319696,-100.48274,-263.16385,-302.89093,8.093143,2.4940248,-2.4175303,91.06827,750000
|
| 72 |
+
0.6521812,263.2069,0.0035675808,-0.0037251487,-13.544167,0.17847559,-263.1586,263.38165,1.6038483,4.2804146,-100.21178,-264.4099,-302.04803,5.884263,0.50776553,-0.69809747,63.90651,755000
|
| 73 |
+
0.6550729,263.37164,0.0034771895,0.0007491084,-12.284565,0.19373032,-263.32892,263.56613,3.674694,5.508619,-100.48436,-264.32257,-302.1228,9.183313,1.1618555,-1.0039964,101.96025,760000
|
| 74 |
+
0.6751434,265.93674,0.0037625018,0.0064296117,-10.791134,0.16954145,-265.89612,266.11273,1.2753996,2.9756002,-100.59431,-266.753,-302.2741,4.251,0.4560074,-0.5010601,51.591515,765000
|
| 75 |
+
0.6569673,257.816,0.003460145,-0.0013516918,-12.890646,0.17219272,-257.77142,257.98685,1.1579093,3.263764,-100.44112,-258.47635,-302.20847,4.4216733,0.34097916,-0.31973374,53.43991,770000
|
| 76 |
+
0.65126264,267.30176,0.0035468938,-0.005020387,-13.915432,0.1724834,-267.25238,267.4692,1.2050211,6.4175262,-100.31884,-268.16153,-302.67633,7.622547,1.3974489,-0.5807275,61.15274,775000
|
| 77 |
+
0.64933974,262.57587,0.0036670705,0.002783687,-11.740896,0.1734583,-262.5328,262.7521,0.99861974,3.0345356,-100.5672,-263.18887,-302.0209,4.0331554,0.454913,-0.3298229,46.647137,780000
|
| 78 |
+
0.6530802,263.2072,0.0036270118,-0.0060099917,-14.157009,0.18896875,-263.15588,263.39017,1.3061988,4.6743255,-50.955795,-263.9532,-301.96115,5.980524,1.8295739,-1.6879585,64.47211,785000
|
| 79 |
+
0.6821132,257.26736,0.0037291618,0.010791679,-9.606138,0.18600953,-257.23157,257.46417,1.5925318,2.982882,-97.68749,-258.27206,-301.97418,4.5754137,0.42074943,-0.3942139,64.96476,790000
|
| 80 |
+
0.656937,262.6109,0.0035105157,0.0003288129,-12.406335,0.18733752,-262.56732,262.79858,1.3665179,3.3723373,-100.41332,-263.10297,-302.53564,4.7388554,0.41259122,-0.44608298,52.46952,795000
|
| 81 |
+
0.6651002,260.74304,0.0034826105,0.005621977,-10.8857,0.16495104,-260.70514,260.9136,1.1262925,3.447675,-100.48271,-261.54596,-302.26355,4.5739675,0.46754345,-0.42198122,56.593094,800000
|
| 82 |
+
0.6626007,262.56537,0.0034492463,0.009028436,-9.88249,0.17096968,-262.5313,262.74536,2.4560494,5.883519,-100.42192,-263.0576,-302.40768,8.339569,1.3391376,-1.5317918,108.66876,805000
|
| 83 |
+
0.65040284,262.90195,0.0036657767,-0.0066518276,-14.314575,0.18906927,-262.8495,263.08435,1.1653712,4.4891753,-100.32879,-264.2189,-302.20874,5.6545467,0.8205674,-0.49737954,59.52724,810000
|
| 84 |
+
0.66200024,254.8385,0.003358908,0.0029729162,-11.614916,0.17502092,-254.7995,255.0165,0.9564673,2.942375,-100.374916,-255.47868,-302.43347,3.8988423,0.38844615,-0.32686037,45.500137,815000
|
| 85 |
+
0.65247387,262.62796,0.003554384,-0.0023381982,-13.157835,0.17206821,-262.58118,262.79767,1.200571,3.5139275,-100.24698,-263.30447,-301.80292,4.7144985,0.50287116,-0.49398282,53.022915,820000
|
| 86 |
+
0.6472079,263.6805,0.0033900887,-0.0062039527,-14.330027,0.16103868,-263.63193,263.83536,1.0829505,3.4031022,-100.408646,-263.9637,-302.3506,4.4860525,0.545757,-0.8175769,69.36981,825000
|
| 87 |
+
0.6432897,259.8344,0.003343529,-0.007055955,-14.610332,0.16791373,-259.78558,259.99527,1.8657563,3.976806,-98.170586,-260.77182,-302.03766,5.842562,0.43746844,-0.4325712,62.178513,830000
|
| 88 |
+
0.65876114,257.61987,0.0035624162,0.0042539877,-11.30587,0.17628302,-257.5796,257.80038,1.4900447,3.5727441,-100.20424,-258.4614,-302.05002,5.062789,0.4323218,-0.4354363,59.789566,835000
|
| 89 |
+
0.6576915,256.4889,0.003284452,0.0041109747,-11.248353,0.17862049,-256.4519,256.67163,1.7968464,3.984544,-100.33307,-257.19537,-302.53012,5.78139,2.0300677,-3.127503,100.52718,840000
|
| 90 |
+
0.6739897,252.99161,0.0033698154,0.0039745094,-11.320556,0.16195339,-252.95346,253.15753,1.1821458,4.618448,-99.14985,-253.56815,-301.97662,5.8005934,0.5924565,-0.66367555,63.65896,845000
|
| 91 |
+
0.66595256,257.6371,0.0034139904,0.00392248,-11.351057,0.17194971,-257.59833,257.81296,0.9062449,5.726176,-100.10459,-258.43427,-301.95712,6.6324205,2.23449,-1.72801,76.319954,850000
|
| 92 |
+
0.6640179,259.6067,0.003487054,0.002478489,-11.789231,0.17143318,-259.56555,259.7806,1.03579,3.0446954,-100.39171,-260.4625,-302.19894,4.0804853,0.9403114,-0.9726518,57.67702,855000
|
| 93 |
+
0.663341,250.28857,0.0034744728,0.0029309767,-11.656425,0.15970895,-250.24808,250.45122,1.4705893,3.185194,-99.42021,-250.98824,-302.0316,4.655783,0.5012129,-0.3778851,57.934307,860000
|
| 94 |
+
0.65888673,254.44775,0.003422969,-0.0002585925,-12.575546,0.15801167,-254.4047,254.6055,1.1894253,3.4097638,-100.119316,-255.22978,-302.65915,4.5991893,0.52387774,-0.36910158,58.49611,865000
|
| 95 |
+
0.6471192,258.5127,0.0033797089,-0.004302591,-13.773066,0.1407532,-258.46616,258.64914,1.4127803,3.504381,-100.12853,-259.47037,-302.04263,4.917161,0.9715753,-0.9156258,58.372993,870000
|
| 96 |
+
0.66123503,253.9089,0.0033372215,-0.0042367354,-13.76954,0.15046579,-253.86293,254.05513,1.3206987,4.9679832,-100.22023,-254.50928,-302.02277,6.288682,1.6275266,-1.6369475,69.68054,875000
|
| 97 |
+
0.65092635,263.01294,0.0032300008,0.0026197336,-11.688937,0.19279438,-262.9752,263.20834,1.1386191,4.1485515,-100.345436,-264.04007,-302.20316,5.2871704,0.6521909,-0.69188774,68.239586,880000
|
| 98 |
+
0.6439127,262.289,0.0031453823,-0.003293008,-13.546934,0.14439304,-262.2464,262.43008,2.1266446,5.9532905,-100.359276,-263.0424,-302.15247,8.079935,2.1435452,-1.5300612,89.26518,885000
|
| 99 |
+
0.64830166,254.85828,0.0034362331,-0.006326792,-14.3412,0.17169482,-254.809,255.02364,1.0895646,6.4481707,-100.50789,-255.82706,-302.17038,7.537735,0.5981569,-1.183158,70.63412,890000
|
| 100 |
+
0.6574274,253.92728,0.0033766546,-0.0039003282,-13.6550865,0.15111661,-253.88116,254.0745,1.3703245,4.2046866,-100.36088,-254.9893,-301.72754,5.5750113,0.5531093,-0.39045647,63.31022,895000
|
| 101 |
+
0.6542596,260.48315,0.0033274668,-0.006377982,-14.416768,0.18010712,-260.43518,260.6569,1.3362123,4.3864913,-100.25507,-261.5942,-301.93683,5.7227035,0.45228893,-0.43879944,59.584667,900000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c15870a265c25acfaf1e44612363394caf8d3327f2b3e4bbfd3b52bc875fc3e
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:73ef513260b1732d346813f3cfa474e328337cae96cdbc5a8c4d90c0a23dd9e5
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfc779b87fb90d2a5eb289bd54485b401fe05dad187e54a310fb90957875e5c9
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:efde82ccf3f1e6bfe411ba95d010d844495cf516e39242c21fe1dbfaf92f4386
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec5023f2ae4bb8e0f3fb55cb4f9d894701c8f6bf340d2a96f3033bcd4419fb0a
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d4523e45e624fd67272b9824eec117f5c7fd627b2d3685942426e790c9d1ebd
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22ee419a91afd8d09cd6e41ea22b3315b43d0d55f63c587c4480adf3d72858e6
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd32852526a5ff6fb755939c8741515da80905e9b7e69b863344e057ee832cbb
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0300481777fc5f73e5aa19704f2995bb78a1031bd821e943e62d6649d01a40c9
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eabb1790a6ce071516b52f61f2b177087f17ce43edb0da04c49582698cda43c6
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_191355/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/j59u12xv
|