Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_250000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_300000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_350000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_400000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_450000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_500000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,0.0014015566573819932,0.02052476967208715,0.0035025450959028227,0.019398999113287324,30.941310163748703,8.30699999999943,0.86,3463.4,-0.18,-243.62,164.14,0.5115316534042358,250000
|
| 3 |
+
0.0,0.0,-0.02966561831333487,0.04710352845868965,-0.026904833631437027,0.04322143727623007,33.58057536575843,8.441999999999174,0.76,12367.72,-0.36,-253.8,166.84,0.5299467945098877,300000
|
| 4 |
+
0.0,0.0,-0.04387316084189692,0.054718134072248806,-0.040823872770228344,0.05689418850939529,35.785069315917184,4.118999999999739,0.94,19368.48,-0.06,-106.02,80.38,0.2605641937255859,350000
|
| 5 |
+
0.0,0.0,-0.03917428484565,0.05676132131494888,-0.0360178351356399,0.05992959914842817,35.06914915861033,3.46499999999982,0.96,22755.1,-0.04,-91.16,67.3,0.22735042572021485,400000
|
| 6 |
+
0.0,0.0,-0.04776688943403392,0.04270178574866578,-0.04452682464262707,0.06286286185044081,35.562580437021985,3.4909999999998496,0.98,26244.66,-0.04,-104.88,67.82,0.21967871189117433,450000
|
| 7 |
+
0.0,0.0,-0.049762012316352716,0.054874463916925284,-0.04644272774357189,0.0637822828863226,35.257924694016545,2.764999999999985,1.0,29453.4,0.0,-75.84,53.3,0.18054044246673584,500000
|
| 8 |
+
0.0,0.0,-0.06310706781789552,0.06194610184912978,-0.05899542510803357,0.08293804157885132,35.44843206946023,2.515999999999954,1.0,32121.42,0.0,-71.06,48.32,0.16247326850891114,550000
|
| 9 |
+
0.0,0.0,-0.04865124927804081,0.06782622245895502,-0.04457879093637416,0.06947242354627023,35.67831907414461,2.570999999999951,1.0,34620.56,0.0,-71.82,49.42,0.169788236618042,600000
|
| 10 |
+
0.0,0.0,-0.055689566696783224,0.0683202499068078,-0.05207282419852225,0.074293100622177,35.53113129283498,2.358999999999962,1.0,37102.0,0.0,-65.88,45.18,0.15302257537841796,650000
|
| 11 |
+
0.0,0.0,-0.0531353159367734,0.07121595133544967,-0.04970122343568861,0.06747991650429126,35.82145737605262,2.3559999999999617,1.0,39457.16,0.0,-67.62,45.12,0.15097173690795898,700000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,0.0014015566573819932,0.02052476967208715,0.0035025450959028227,0.019398999113287324,30.941310163748703,8.30699999999943,0.86,3463.4,-0.18,-243.62,164.14,0.5115316534042358,250000
|
| 3 |
+
0.0,0.0,-0.02966561831333487,0.04710352845868965,-0.026904833631437027,0.04322143727623007,33.58057536575843,8.441999999999174,0.76,12367.72,-0.36,-253.8,166.84,0.5299467945098877,300000
|
| 4 |
+
0.0,0.0,-0.04387316084189692,0.054718134072248806,-0.040823872770228344,0.05689418850939529,35.785069315917184,4.118999999999739,0.94,19368.48,-0.06,-106.02,80.38,0.2605641937255859,350000
|
| 5 |
+
0.0,0.0,-0.03917428484565,0.05676132131494888,-0.0360178351356399,0.05992959914842817,35.06914915861033,3.46499999999982,0.96,22755.1,-0.04,-91.16,67.3,0.22735042572021485,400000
|
| 6 |
+
0.0,0.0,-0.04776688943403392,0.04270178574866578,-0.04452682464262707,0.06286286185044081,35.562580437021985,3.4909999999998496,0.98,26244.66,-0.04,-104.88,67.82,0.21967871189117433,450000
|
| 7 |
+
0.0,0.0,-0.049762012316352716,0.054874463916925284,-0.04644272774357189,0.0637822828863226,35.257924694016545,2.764999999999985,1.0,29453.4,0.0,-75.84,53.3,0.18054044246673584,500000
|
| 8 |
+
0.0,0.0,-0.06310706781789552,0.06194610184912978,-0.05899542510803357,0.08293804157885132,35.44843206946023,2.515999999999954,1.0,32121.42,0.0,-71.06,48.32,0.16247326850891114,550000
|
| 9 |
+
0.0,0.0,-0.04865124927804081,0.06782622245895502,-0.04457879093637416,0.06947242354627023,35.67831907414461,2.570999999999951,1.0,34620.56,0.0,-71.82,49.42,0.169788236618042,600000
|
| 10 |
+
0.0,0.0,-0.055689566696783224,0.0683202499068078,-0.05207282419852225,0.074293100622177,35.53113129283498,2.358999999999962,1.0,37102.0,0.0,-65.88,45.18,0.15302257537841796,650000
|
| 11 |
+
0.0,0.0,-0.0531353159367734,0.07121595133544967,-0.04970122343568861,0.06747991650429126,35.82145737605262,2.3559999999999617,1.0,39457.16,0.0,-67.62,45.12,0.15097173690795898,700000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0000001,0.028237823,2.8237824,1.0282379,0.66316956,-24.114088,-99.010544,-158.92021,0.19089164,-0.1537139,13.731147,205000
|
| 3 |
+
1.0,1.0,0.028011397,2.8011396,1.0280114,0.9473737,-20.321049,-98.287224,-168.86946,0.3800224,-0.38110262,18.082298,210000
|
| 4 |
+
1.0,1.0,0.024017302,2.40173,1.0240173,0.846563,-24.1487,-101.90232,-169.20532,0.3580949,-0.36109248,15.390954,215000
|
| 5 |
+
1.0,1.0,0.023988463,2.3988466,1.0239885,0.9432165,-25.823854,-104.32532,-183.4562,0.10772827,-0.14399529,12.792468,220000
|
| 6 |
+
1.0,1.0,0.022929244,2.2929244,1.0229292,1.0359716,-39.229965,-105.217896,-179.09558,0.3903123,-0.4820905,16.293993,225000
|
| 7 |
+
1.0,0.9999999,0.024026452,2.402645,1.0240263,1.5170143,-35.098557,-103.4611,-190.57439,0.72623146,-0.74213964,33.10499,230000
|
| 8 |
+
1.0,1.0,0.025758851,2.5758853,1.0257589,2.8633013,-29.984985,-102.90188,-169.55783,1.1638793,-1.3744454,65.34968,235000
|
| 9 |
+
1.0,1.0,0.025393795,2.5393796,1.0253938,1.6541151,-22.41477,-103.01426,-181.84538,1.4299624,-1.4990445,37.636105,240000
|
| 10 |
+
1.0,1.0,0.02456621,2.4566212,1.0245662,2.9396322,-35.534832,-101.55543,-187.57126,0.5376804,-1.1131678,41.22278,245000
|
| 11 |
+
1.0,1.0000001,0.029431429,2.943143,1.0294316,1.5928487,-17.117231,-98.55435,-172.03717,0.21365374,-0.22733942,21.787903,250000
|
| 12 |
+
1.0,1.0,0.030107807,3.0107808,1.0301079,2.117268,-4.4961233,-93.345695,-166.74638,0.48368698,-0.5037136,29.670536,255000
|
| 13 |
+
1.0,0.99999994,0.030912865,3.0912867,1.0309128,1.4224459,-5.862222,-90.192825,-178.5348,0.29063138,-0.26539072,18.896208,260000
|
| 14 |
+
1.0,1.0,0.027938595,2.7938595,1.0279386,1.4941605,-19.29959,-91.40295,-171.41371,0.25194705,-0.17658952,17.755468,265000
|
| 15 |
+
1.0,0.99999994,0.028364057,2.8364058,1.028364,1.592652,-8.800746,-87.25762,-177.06198,0.40454867,-0.39241785,19.484688,270000
|
| 16 |
+
1.0,0.9999999,0.030967845,3.0967844,1.0309677,1.7804024,-13.1575,-90.37158,-177.78185,0.27705732,-0.30576286,22.971075,275000
|
| 17 |
+
1.0,1.0000001,0.03131074,3.1310744,1.0313109,1.622537,-12.604931,-93.57477,-181.69759,0.26672593,-0.26115063,21.342302,280000
|
| 18 |
+
1.0,1.0000001,0.027982794,2.7982793,1.027983,1.9554188,-7.3077335,-91.92236,-191.05193,2.8497999,-2.7193234,40.078842,285000
|
| 19 |
+
1.0,1.0,0.029831456,2.983146,1.0298314,1.4923588,-16.098644,-92.11515,-186.36896,0.27173916,-0.26700053,21.62629,290000
|
| 20 |
+
1.0,1.0,0.030770885,3.0770884,1.0307709,1.4149591,-2.5354047,-89.58128,-175.81635,0.14671545,-0.15590051,14.810236,295000
|
| 21 |
+
1.0,1.0,0.029182572,2.9182572,1.0291826,1.7665471,-13.768302,-85.88307,-169.19826,0.23156632,-0.22199973,20.418362,300000
|
| 22 |
+
1.0,1.0,0.0310952,3.10952,1.0310951,1.3509604,-15.288047,-88.21416,-171.25534,0.17965423,-0.18550757,17.549274,305000
|
| 23 |
+
1.0,1.0,0.030315215,3.0315213,1.0303152,1.1506014,1.1589068,-86.28311,-156.07329,0.11453954,-0.25547102,14.41164,310000
|
| 24 |
+
1.0,1.0,0.029898759,2.9898758,1.0298988,1.5525779,0.8788389,-83.84837,-144.56448,0.35088143,-0.65530694,28.915222,315000
|
| 25 |
+
1.0,1.0000001,0.02968375,2.968375,1.0296838,1.4294354,-8.43236,-84.83683,-154.93753,0.22706248,-0.2162217,19.789997,320000
|
| 26 |
+
1.0,1.0,0.030058917,3.0058918,1.0300589,4.016275,-8.297227,-87.06612,-157.45317,0.47152498,-0.4306037,30.67752,325000
|
| 27 |
+
1.0,0.99999994,0.03162483,3.1624832,1.0316248,2.5495198,-0.4668678,-87.170586,-170.32596,0.41146114,-0.39988688,28.577013,330000
|
| 28 |
+
1.0,0.999882,0.030983685,3.0983686,1.0308657,1.439372,2.0077972,-84.715996,-160.85765,0.16595757,-0.12607631,14.372553,335000
|
| 29 |
+
1.0,0.99999994,0.03135385,3.1353853,1.0313538,1.2581819,-5.2099924,-80.98067,-164.40395,0.29189864,-0.25556502,17.011326,340000
|
| 30 |
+
1.0,1.0,0.030606613,3.0606613,1.0306066,1.52421,-5.65726,-85.59112,-185.86285,0.1847412,-0.1578846,17.110273,345000
|
| 31 |
+
1.0,1.0,0.030419141,3.0419145,1.0304191,1.0420033,-1.032603,-83.69224,-173.63013,0.16154385,-0.15844333,14.108566,350000
|
| 32 |
+
1.0,0.9999999,0.02825858,2.825858,1.0282584,1.5701602,-2.1982,-83.540276,-155.67047,0.3553234,-0.43377733,27.373854,355000
|
| 33 |
+
1.0,1.0000001,0.030708548,3.0708547,1.0307087,2.7066224,-6.375726,-86.650345,-170.5454,0.24326141,-0.26679805,24.431252,360000
|
| 34 |
+
1.0,1.0,0.0313686,3.1368601,1.0313686,2.010262,-1.4613363,-82.9186,-162.98332,1.3600547,-1.9170982,52.401047,365000
|
| 35 |
+
1.0,0.9999999,0.031865686,3.1865687,1.0318656,1.4794757,-3.4631205,-81.06778,-171.31438,0.17847642,-0.21953419,15.585812,370000
|
| 36 |
+
1.0,0.99999994,0.031859558,3.185956,1.0318595,1.4113823,-9.186458,-86.55242,-174.09804,0.22517544,-0.27733824,15.403831,375000
|
| 37 |
+
1.0,0.9998389,0.028534498,2.8534498,1.0283734,0.96002,2.0992067,-84.09124,-170.04305,0.27200183,-0.1399847,15.832279,380000
|
| 38 |
+
1.0,1.0,0.032457925,3.2457924,1.032458,0.94503844,-1.4423074,-79.10052,-153.97305,0.15170301,-0.13842091,12.846035,385000
|
| 39 |
+
1.0,1.0,0.02996755,2.9967551,1.0299675,1.388177,0.45671183,-78.989944,-178.66641,0.33632442,-0.22878036,17.576515,390000
|
| 40 |
+
1.0,0.99999994,0.031292018,3.129202,1.031292,1.5452943,-6.01936,-81.77672,-177.22888,0.1991866,-0.22193602,17.710115,395000
|
| 41 |
+
1.0,1.0,0.032431312,3.2431316,1.0324314,1.4310498,-7.347571,-81.336136,-175.8729,0.25619677,-0.3611488,23.24096,400000
|
| 42 |
+
1.0,1.0,0.031377323,3.1377323,1.0313773,2.0568502,-5.8056054,-79.498856,-153.69475,0.36365044,-0.2579865,22.086159,405000
|
| 43 |
+
1.0,1.0,0.031281937,3.1281939,1.031282,4.416882,-0.21645977,-81.918045,-150.53535,0.87985706,-0.62387985,49.661217,410000
|
| 44 |
+
1.0,0.99999994,0.03140043,3.1400433,1.0314003,2.437575,-4.874737,-79.85715,-155.60728,0.2608129,-0.21628079,21.9558,415000
|
| 45 |
+
1.0,1.0,0.029253673,2.9253674,1.0292537,1.4437917,-2.4806716,-78.35574,-164.71419,0.3538501,-0.3460322,21.493078,420000
|
| 46 |
+
1.0,1.0000001,0.030844264,3.0844264,1.0308443,1.9985535,0.17460492,-77.36448,-147.09822,0.25033838,-0.25439447,22.448338,425000
|
| 47 |
+
1.0,1.0,0.03249896,3.2498956,1.032499,1.2129637,1.498961,-79.555084,-154.13965,0.19304352,-0.13261087,16.055042,430000
|
| 48 |
+
1.0,1.0,0.030828552,3.0828552,1.0308286,4.714972,-1.3205184,-77.06228,-156.75659,1.676339,-1.5143799,38.707706,435000
|
| 49 |
+
1.0,0.9999306,0.031609453,3.1609452,1.03154,1.20639,1.93135,-80.23257,-166.95975,0.17797227,-0.1668192,14.7962055,440000
|
| 50 |
+
1.0,1.0,0.032491907,3.2491913,1.0324919,1.4200523,-7.276107,-80.71316,-154.08221,0.31965247,-0.27857754,21.08955,445000
|
| 51 |
+
1.0,0.99999994,0.031203512,3.1203513,1.0312035,1.6781937,-1.9573224,-76.51711,-149.87233,0.3371867,-0.31978476,19.001892,450000
|
| 52 |
+
1.0,0.99999994,0.03108197,3.108197,1.0310819,1.3605283,1.4478425,-81.41493,-162.99773,0.13524778,-0.20028152,16.046515,455000
|
| 53 |
+
1.0,1.0,0.031850424,3.1850424,1.0318505,1.046276,1.9963506,-77.70357,-169.09915,0.2322996,-0.29529703,14.1539545,460000
|
| 54 |
+
1.0,0.99999994,0.032808132,3.2808135,1.0328081,1.2183393,-2.5496738,-80.08202,-169.62915,0.37365752,-0.28200012,18.139694,465000
|
| 55 |
+
1.0,1.0,0.030085307,3.0085306,1.0300853,1.5790929,0.25371307,-79.29227,-147.82382,0.8710084,-0.6934527,30.535254,470000
|
| 56 |
+
1.0,1.0,0.029145379,2.914538,1.0291454,1.3395525,-3.441834,-78.65687,-171.25876,0.22008543,-0.21538225,14.86774,475000
|
| 57 |
+
1.0,0.9999999,0.030149072,3.0149074,1.030149,1.1539869,-7.141144,-80.71755,-162.89246,0.13832076,-0.30301645,16.009424,480000
|
| 58 |
+
1.0,1.0,0.029961033,2.9961033,1.029961,1.351595,-5.912219,-78.11903,-155.67294,0.2800072,-0.35694912,18.65776,485000
|
| 59 |
+
1.0,1.0000001,0.028795846,2.8795848,1.028796,1.3220056,-1.6795725,-75.43495,-167.94781,1.1372762,-1.1556201,22.081915,490000
|
| 60 |
+
1.0,0.9999904,0.029855046,2.9855046,1.0298455,1.2013062,0.5268147,-77.88159,-160.6494,0.23556311,-0.36117846,17.15471,495000
|
| 61 |
+
1.0,1.0,0.030500736,3.0500739,1.0305008,1.5332049,0.89389586,-80.64691,-160.6646,0.3213295,-0.36695215,22.557518,500000
|
| 62 |
+
1.0,1.0,0.032274663,3.2274666,1.0322747,2.3817253,1.117083,-80.818825,-159.21274,0.847115,-0.89207494,35.32521,505000
|
| 63 |
+
1.0,1.0,0.033299163,3.329916,1.0332992,1.2369092,0.077856764,-76.87699,-163.98514,0.2465963,-0.21333976,17.779009,510000
|
| 64 |
+
1.0,1.0,0.029012252,2.9012256,1.0290122,1.4509493,-2.3543015,-76.43716,-145.6221,0.5598326,-0.52984536,20.263166,515000
|
| 65 |
+
1.0,1.0000001,0.029145047,2.9145048,1.0291451,0.8698225,-1.7509633,-76.437256,-155.71065,0.21443285,-0.20390035,14.075952,520000
|
| 66 |
+
1.0,1.0,0.030380925,3.0380926,1.030381,1.41098,-2.1640887,-76.760254,-154.9049,0.20193774,-0.3221006,18.748135,525000
|
| 67 |
+
1.0,1.0,0.031988166,3.1988168,1.0319881,2.0473852,1.5490704,-75.80947,-140.50632,0.38068146,-0.31706455,25.437197,530000
|
| 68 |
+
1.0,1.0,0.031145304,3.1145306,1.0311453,1.3522594,-3.277514,-75.67664,-171.92535,0.24615896,-0.25093386,17.20178,535000
|
| 69 |
+
1.0,1.0,0.031993404,3.1993406,1.0319934,1.1810012,5.8862963,-76.341354,-151.70148,0.4211687,-0.45292774,16.360771,540000
|
| 70 |
+
1.0,1.0,0.030577129,3.0577128,1.0305772,1.3209032,0.33546966,-78.91277,-154.12442,0.34312364,-0.2994794,18.571129,545000
|
| 71 |
+
1.0,1.0,0.028948756,2.8948758,1.0289488,1.0591663,-3.2787068,-73.11145,-155.65604,0.13465649,-0.16850844,13.42425,550000
|
| 72 |
+
1.0,0.9998354,0.03053857,3.0538573,1.0303739,1.0975431,5.798842,-77.73905,-160.53787,0.32339287,-0.33805028,19.085014,555000
|
| 73 |
+
1.0,1.0,0.029981364,2.9981365,1.0299814,1.6146172,-0.41024968,-72.040245,-165.08347,0.44545317,-0.63966453,23.904284,560000
|
| 74 |
+
1.0,0.9999999,0.03144631,3.1446314,1.0314462,0.82964957,-6.1339846,-76.61248,-153.78323,0.1169815,-0.11413987,9.68123,565000
|
| 75 |
+
1.0,1.0000001,0.030358613,3.0358613,1.0303588,0.97058624,-2.4853566,-73.18885,-142.02686,0.29847685,-0.25728807,13.64438,570000
|
| 76 |
+
1.0,0.99999994,0.030620087,3.0620086,1.03062,0.94892883,0.60441864,-72.66813,-163.75407,0.2465959,-0.1878143,14.36038,575000
|
| 77 |
+
1.0,1.0,0.029339537,2.933954,1.0293396,1.4069014,-1.9012929,-74.35607,-145.04733,4.2590013,-4.2132053,45.364952,580000
|
| 78 |
+
1.0,0.99999994,0.030276276,3.027628,1.0302762,1.1617506,-3.9985723,-74.426186,-146.62067,0.35909027,-0.28260678,19.451,585000
|
| 79 |
+
1.0,0.9999999,0.034184806,3.4184804,1.0341847,0.946505,-0.7771944,-74.23197,-155.59006,0.2975629,-0.30618468,14.081929,590000
|
| 80 |
+
1.0,1.0,0.031023877,3.1023874,1.0310239,0.8744917,-3.4328,-73.45901,-139.10728,0.11035528,-0.22243449,9.545625,595000
|
| 81 |
+
1.0,0.9999999,0.02987929,2.987929,1.0298792,0.8614351,-5.6872096,-71.7231,-141.25444,0.14974447,-0.22954665,12.751015,600000
|
| 82 |
+
1.0,0.9999999,0.030979244,3.0979247,1.0309792,1.107437,-2.9265149,-71.743835,-146.82838,0.22294378,-0.14600557,14.812841,605000
|
| 83 |
+
1.0,1.0,0.03224872,3.224872,1.0322487,1.0618403,-2.364348,-73.65596,-146.10487,0.245281,-0.24714561,14.892716,610000
|
| 84 |
+
1.0,0.9999998,0.030732192,3.0732193,1.030732,0.8814149,0.09992102,-72.30663,-142.08357,0.1543987,-0.21309137,12.655043,615000
|
| 85 |
+
1.0,1.0,0.03180063,3.180063,1.0318006,0.88567686,-2.5908768,-70.88125,-154.24501,1.1901262,-0.80033875,17.818352,620000
|
| 86 |
+
1.0,1.0,0.031212986,3.1212986,1.031213,0.9174347,-1.4725027,-69.43783,-171.77214,0.1344833,-0.22509411,12.827198,625000
|
| 87 |
+
1.0,1.0,0.030416552,3.041655,1.0304166,1.0232195,-3.5521512,-70.19109,-147.21318,0.22218212,-0.23218468,13.394439,630000
|
| 88 |
+
1.0,1.0,0.033170365,3.3170366,1.0331703,1.1533549,-1.7205235,-75.30202,-163.02487,0.3090855,-0.2025495,15.671915,635000
|
| 89 |
+
1.0,1.0,0.030691935,3.0691934,1.030692,1.8229395,-1.737347,-68.387474,-154.5168,0.31494543,-0.32493997,20.730549,640000
|
| 90 |
+
1.0,0.9999999,0.031163484,3.1163483,1.0311633,1.6407639,-1.3121344,-74.000145,-134.80934,0.32862943,-0.37480047,23.223103,645000
|
| 91 |
+
1.0,0.99999994,0.02963058,2.9630582,1.0296305,1.0199043,-4.8180795,-68.83584,-153.2892,0.19796856,-0.30410412,15.534991,650000
|
| 92 |
+
1.0,0.99999994,0.03284984,3.2849844,1.0328498,0.9752413,2.1423984,-73.300224,-154.44049,0.22596359,-0.22738943,13.355074,655000
|
| 93 |
+
1.0,1.0,0.0313209,3.13209,1.0313209,1.2997421,-2.5187285,-71.497696,-135.1802,0.33221573,-0.39862326,20.132072,660000
|
| 94 |
+
1.0,1.0,0.03345702,3.3457017,1.033457,1.3776156,-0.63896596,-70.39292,-138.54129,0.2614699,-0.2071697,15.138164,665000
|
| 95 |
+
1.0,1.0000001,0.032534555,3.2534554,1.0325347,0.89035696,-2.6658297,-69.52831,-129.90323,0.305494,-0.27815568,12.584045,670000
|
| 96 |
+
1.0,1.0,0.03000249,3.0002491,1.0300025,0.9322708,-2.5420017,-69.8063,-155.13002,0.12459258,-0.21550915,13.242807,675000
|
| 97 |
+
1.0,0.999959,0.033283103,3.32831,1.0332421,1.8211697,0.9922099,-72.17238,-147.34123,1.4635212,-1.3936031,30.857166,680000
|
| 98 |
+
1.0,0.99999994,0.03253537,3.253537,1.0325353,0.7820879,-2.3383803,-68.995804,-163.51712,0.21477246,-0.284114,11.978713,685000
|
| 99 |
+
1.0,1.0,0.030495383,3.0495381,1.0304954,1.041303,-0.39875978,-69.799515,-149.21193,0.34633097,-0.38598168,17.749357,690000
|
| 100 |
+
1.0,1.0,0.029893875,2.9893875,1.0298939,1.3992919,-3.222465,-66.52111,-161.41667,0.81703764,-0.8086956,22.862597,695000
|
| 101 |
+
1.0,0.99999994,0.028871637,2.8871639,1.0288715,1.1437153,-0.8859671,-67.24562,-151.3075,0.97736984,-1.0099361,19.322903,700000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0000001,0.028237823,2.8237824,1.0282379,0.66316956,-24.114088,-99.010544,-158.92021,0.19089164,-0.1537139,13.731147,205000
|
| 3 |
+
1.0,1.0,0.028011397,2.8011396,1.0280114,0.9473737,-20.321049,-98.287224,-168.86946,0.3800224,-0.38110262,18.082298,210000
|
| 4 |
+
1.0,1.0,0.024017302,2.40173,1.0240173,0.846563,-24.1487,-101.90232,-169.20532,0.3580949,-0.36109248,15.390954,215000
|
| 5 |
+
1.0,1.0,0.023988463,2.3988466,1.0239885,0.9432165,-25.823854,-104.32532,-183.4562,0.10772827,-0.14399529,12.792468,220000
|
| 6 |
+
1.0,1.0,0.022929244,2.2929244,1.0229292,1.0359716,-39.229965,-105.217896,-179.09558,0.3903123,-0.4820905,16.293993,225000
|
| 7 |
+
1.0,0.9999999,0.024026452,2.402645,1.0240263,1.5170143,-35.098557,-103.4611,-190.57439,0.72623146,-0.74213964,33.10499,230000
|
| 8 |
+
1.0,1.0,0.025758851,2.5758853,1.0257589,2.8633013,-29.984985,-102.90188,-169.55783,1.1638793,-1.3744454,65.34968,235000
|
| 9 |
+
1.0,1.0,0.025393795,2.5393796,1.0253938,1.6541151,-22.41477,-103.01426,-181.84538,1.4299624,-1.4990445,37.636105,240000
|
| 10 |
+
1.0,1.0,0.02456621,2.4566212,1.0245662,2.9396322,-35.534832,-101.55543,-187.57126,0.5376804,-1.1131678,41.22278,245000
|
| 11 |
+
1.0,1.0000001,0.029431429,2.943143,1.0294316,1.5928487,-17.117231,-98.55435,-172.03717,0.21365374,-0.22733942,21.787903,250000
|
| 12 |
+
1.0,1.0,0.030107807,3.0107808,1.0301079,2.117268,-4.4961233,-93.345695,-166.74638,0.48368698,-0.5037136,29.670536,255000
|
| 13 |
+
1.0,0.99999994,0.030912865,3.0912867,1.0309128,1.4224459,-5.862222,-90.192825,-178.5348,0.29063138,-0.26539072,18.896208,260000
|
| 14 |
+
1.0,1.0,0.027938595,2.7938595,1.0279386,1.4941605,-19.29959,-91.40295,-171.41371,0.25194705,-0.17658952,17.755468,265000
|
| 15 |
+
1.0,0.99999994,0.028364057,2.8364058,1.028364,1.592652,-8.800746,-87.25762,-177.06198,0.40454867,-0.39241785,19.484688,270000
|
| 16 |
+
1.0,0.9999999,0.030967845,3.0967844,1.0309677,1.7804024,-13.1575,-90.37158,-177.78185,0.27705732,-0.30576286,22.971075,275000
|
| 17 |
+
1.0,1.0000001,0.03131074,3.1310744,1.0313109,1.622537,-12.604931,-93.57477,-181.69759,0.26672593,-0.26115063,21.342302,280000
|
| 18 |
+
1.0,1.0000001,0.027982794,2.7982793,1.027983,1.9554188,-7.3077335,-91.92236,-191.05193,2.8497999,-2.7193234,40.078842,285000
|
| 19 |
+
1.0,1.0,0.029831456,2.983146,1.0298314,1.4923588,-16.098644,-92.11515,-186.36896,0.27173916,-0.26700053,21.62629,290000
|
| 20 |
+
1.0,1.0,0.030770885,3.0770884,1.0307709,1.4149591,-2.5354047,-89.58128,-175.81635,0.14671545,-0.15590051,14.810236,295000
|
| 21 |
+
1.0,1.0,0.029182572,2.9182572,1.0291826,1.7665471,-13.768302,-85.88307,-169.19826,0.23156632,-0.22199973,20.418362,300000
|
| 22 |
+
1.0,1.0,0.0310952,3.10952,1.0310951,1.3509604,-15.288047,-88.21416,-171.25534,0.17965423,-0.18550757,17.549274,305000
|
| 23 |
+
1.0,1.0,0.030315215,3.0315213,1.0303152,1.1506014,1.1589068,-86.28311,-156.07329,0.11453954,-0.25547102,14.41164,310000
|
| 24 |
+
1.0,1.0,0.029898759,2.9898758,1.0298988,1.5525779,0.8788389,-83.84837,-144.56448,0.35088143,-0.65530694,28.915222,315000
|
| 25 |
+
1.0,1.0000001,0.02968375,2.968375,1.0296838,1.4294354,-8.43236,-84.83683,-154.93753,0.22706248,-0.2162217,19.789997,320000
|
| 26 |
+
1.0,1.0,0.030058917,3.0058918,1.0300589,4.016275,-8.297227,-87.06612,-157.45317,0.47152498,-0.4306037,30.67752,325000
|
| 27 |
+
1.0,0.99999994,0.03162483,3.1624832,1.0316248,2.5495198,-0.4668678,-87.170586,-170.32596,0.41146114,-0.39988688,28.577013,330000
|
| 28 |
+
1.0,0.999882,0.030983685,3.0983686,1.0308657,1.439372,2.0077972,-84.715996,-160.85765,0.16595757,-0.12607631,14.372553,335000
|
| 29 |
+
1.0,0.99999994,0.03135385,3.1353853,1.0313538,1.2581819,-5.2099924,-80.98067,-164.40395,0.29189864,-0.25556502,17.011326,340000
|
| 30 |
+
1.0,1.0,0.030606613,3.0606613,1.0306066,1.52421,-5.65726,-85.59112,-185.86285,0.1847412,-0.1578846,17.110273,345000
|
| 31 |
+
1.0,1.0,0.030419141,3.0419145,1.0304191,1.0420033,-1.032603,-83.69224,-173.63013,0.16154385,-0.15844333,14.108566,350000
|
| 32 |
+
1.0,0.9999999,0.02825858,2.825858,1.0282584,1.5701602,-2.1982,-83.540276,-155.67047,0.3553234,-0.43377733,27.373854,355000
|
| 33 |
+
1.0,1.0000001,0.030708548,3.0708547,1.0307087,2.7066224,-6.375726,-86.650345,-170.5454,0.24326141,-0.26679805,24.431252,360000
|
| 34 |
+
1.0,1.0,0.0313686,3.1368601,1.0313686,2.010262,-1.4613363,-82.9186,-162.98332,1.3600547,-1.9170982,52.401047,365000
|
| 35 |
+
1.0,0.9999999,0.031865686,3.1865687,1.0318656,1.4794757,-3.4631205,-81.06778,-171.31438,0.17847642,-0.21953419,15.585812,370000
|
| 36 |
+
1.0,0.99999994,0.031859558,3.185956,1.0318595,1.4113823,-9.186458,-86.55242,-174.09804,0.22517544,-0.27733824,15.403831,375000
|
| 37 |
+
1.0,0.9998389,0.028534498,2.8534498,1.0283734,0.96002,2.0992067,-84.09124,-170.04305,0.27200183,-0.1399847,15.832279,380000
|
| 38 |
+
1.0,1.0,0.032457925,3.2457924,1.032458,0.94503844,-1.4423074,-79.10052,-153.97305,0.15170301,-0.13842091,12.846035,385000
|
| 39 |
+
1.0,1.0,0.02996755,2.9967551,1.0299675,1.388177,0.45671183,-78.989944,-178.66641,0.33632442,-0.22878036,17.576515,390000
|
| 40 |
+
1.0,0.99999994,0.031292018,3.129202,1.031292,1.5452943,-6.01936,-81.77672,-177.22888,0.1991866,-0.22193602,17.710115,395000
|
| 41 |
+
1.0,1.0,0.032431312,3.2431316,1.0324314,1.4310498,-7.347571,-81.336136,-175.8729,0.25619677,-0.3611488,23.24096,400000
|
| 42 |
+
1.0,1.0,0.031377323,3.1377323,1.0313773,2.0568502,-5.8056054,-79.498856,-153.69475,0.36365044,-0.2579865,22.086159,405000
|
| 43 |
+
1.0,1.0,0.031281937,3.1281939,1.031282,4.416882,-0.21645977,-81.918045,-150.53535,0.87985706,-0.62387985,49.661217,410000
|
| 44 |
+
1.0,0.99999994,0.03140043,3.1400433,1.0314003,2.437575,-4.874737,-79.85715,-155.60728,0.2608129,-0.21628079,21.9558,415000
|
| 45 |
+
1.0,1.0,0.029253673,2.9253674,1.0292537,1.4437917,-2.4806716,-78.35574,-164.71419,0.3538501,-0.3460322,21.493078,420000
|
| 46 |
+
1.0,1.0000001,0.030844264,3.0844264,1.0308443,1.9985535,0.17460492,-77.36448,-147.09822,0.25033838,-0.25439447,22.448338,425000
|
| 47 |
+
1.0,1.0,0.03249896,3.2498956,1.032499,1.2129637,1.498961,-79.555084,-154.13965,0.19304352,-0.13261087,16.055042,430000
|
| 48 |
+
1.0,1.0,0.030828552,3.0828552,1.0308286,4.714972,-1.3205184,-77.06228,-156.75659,1.676339,-1.5143799,38.707706,435000
|
| 49 |
+
1.0,0.9999306,0.031609453,3.1609452,1.03154,1.20639,1.93135,-80.23257,-166.95975,0.17797227,-0.1668192,14.7962055,440000
|
| 50 |
+
1.0,1.0,0.032491907,3.2491913,1.0324919,1.4200523,-7.276107,-80.71316,-154.08221,0.31965247,-0.27857754,21.08955,445000
|
| 51 |
+
1.0,0.99999994,0.031203512,3.1203513,1.0312035,1.6781937,-1.9573224,-76.51711,-149.87233,0.3371867,-0.31978476,19.001892,450000
|
| 52 |
+
1.0,0.99999994,0.03108197,3.108197,1.0310819,1.3605283,1.4478425,-81.41493,-162.99773,0.13524778,-0.20028152,16.046515,455000
|
| 53 |
+
1.0,1.0,0.031850424,3.1850424,1.0318505,1.046276,1.9963506,-77.70357,-169.09915,0.2322996,-0.29529703,14.1539545,460000
|
| 54 |
+
1.0,0.99999994,0.032808132,3.2808135,1.0328081,1.2183393,-2.5496738,-80.08202,-169.62915,0.37365752,-0.28200012,18.139694,465000
|
| 55 |
+
1.0,1.0,0.030085307,3.0085306,1.0300853,1.5790929,0.25371307,-79.29227,-147.82382,0.8710084,-0.6934527,30.535254,470000
|
| 56 |
+
1.0,1.0,0.029145379,2.914538,1.0291454,1.3395525,-3.441834,-78.65687,-171.25876,0.22008543,-0.21538225,14.86774,475000
|
| 57 |
+
1.0,0.9999999,0.030149072,3.0149074,1.030149,1.1539869,-7.141144,-80.71755,-162.89246,0.13832076,-0.30301645,16.009424,480000
|
| 58 |
+
1.0,1.0,0.029961033,2.9961033,1.029961,1.351595,-5.912219,-78.11903,-155.67294,0.2800072,-0.35694912,18.65776,485000
|
| 59 |
+
1.0,1.0000001,0.028795846,2.8795848,1.028796,1.3220056,-1.6795725,-75.43495,-167.94781,1.1372762,-1.1556201,22.081915,490000
|
| 60 |
+
1.0,0.9999904,0.029855046,2.9855046,1.0298455,1.2013062,0.5268147,-77.88159,-160.6494,0.23556311,-0.36117846,17.15471,495000
|
| 61 |
+
1.0,1.0,0.030500736,3.0500739,1.0305008,1.5332049,0.89389586,-80.64691,-160.6646,0.3213295,-0.36695215,22.557518,500000
|
| 62 |
+
1.0,1.0,0.032274663,3.2274666,1.0322747,2.3817253,1.117083,-80.818825,-159.21274,0.847115,-0.89207494,35.32521,505000
|
| 63 |
+
1.0,1.0,0.033299163,3.329916,1.0332992,1.2369092,0.077856764,-76.87699,-163.98514,0.2465963,-0.21333976,17.779009,510000
|
| 64 |
+
1.0,1.0,0.029012252,2.9012256,1.0290122,1.4509493,-2.3543015,-76.43716,-145.6221,0.5598326,-0.52984536,20.263166,515000
|
| 65 |
+
1.0,1.0000001,0.029145047,2.9145048,1.0291451,0.8698225,-1.7509633,-76.437256,-155.71065,0.21443285,-0.20390035,14.075952,520000
|
| 66 |
+
1.0,1.0,0.030380925,3.0380926,1.030381,1.41098,-2.1640887,-76.760254,-154.9049,0.20193774,-0.3221006,18.748135,525000
|
| 67 |
+
1.0,1.0,0.031988166,3.1988168,1.0319881,2.0473852,1.5490704,-75.80947,-140.50632,0.38068146,-0.31706455,25.437197,530000
|
| 68 |
+
1.0,1.0,0.031145304,3.1145306,1.0311453,1.3522594,-3.277514,-75.67664,-171.92535,0.24615896,-0.25093386,17.20178,535000
|
| 69 |
+
1.0,1.0,0.031993404,3.1993406,1.0319934,1.1810012,5.8862963,-76.341354,-151.70148,0.4211687,-0.45292774,16.360771,540000
|
| 70 |
+
1.0,1.0,0.030577129,3.0577128,1.0305772,1.3209032,0.33546966,-78.91277,-154.12442,0.34312364,-0.2994794,18.571129,545000
|
| 71 |
+
1.0,1.0,0.028948756,2.8948758,1.0289488,1.0591663,-3.2787068,-73.11145,-155.65604,0.13465649,-0.16850844,13.42425,550000
|
| 72 |
+
1.0,0.9998354,0.03053857,3.0538573,1.0303739,1.0975431,5.798842,-77.73905,-160.53787,0.32339287,-0.33805028,19.085014,555000
|
| 73 |
+
1.0,1.0,0.029981364,2.9981365,1.0299814,1.6146172,-0.41024968,-72.040245,-165.08347,0.44545317,-0.63966453,23.904284,560000
|
| 74 |
+
1.0,0.9999999,0.03144631,3.1446314,1.0314462,0.82964957,-6.1339846,-76.61248,-153.78323,0.1169815,-0.11413987,9.68123,565000
|
| 75 |
+
1.0,1.0000001,0.030358613,3.0358613,1.0303588,0.97058624,-2.4853566,-73.18885,-142.02686,0.29847685,-0.25728807,13.64438,570000
|
| 76 |
+
1.0,0.99999994,0.030620087,3.0620086,1.03062,0.94892883,0.60441864,-72.66813,-163.75407,0.2465959,-0.1878143,14.36038,575000
|
| 77 |
+
1.0,1.0,0.029339537,2.933954,1.0293396,1.4069014,-1.9012929,-74.35607,-145.04733,4.2590013,-4.2132053,45.364952,580000
|
| 78 |
+
1.0,0.99999994,0.030276276,3.027628,1.0302762,1.1617506,-3.9985723,-74.426186,-146.62067,0.35909027,-0.28260678,19.451,585000
|
| 79 |
+
1.0,0.9999999,0.034184806,3.4184804,1.0341847,0.946505,-0.7771944,-74.23197,-155.59006,0.2975629,-0.30618468,14.081929,590000
|
| 80 |
+
1.0,1.0,0.031023877,3.1023874,1.0310239,0.8744917,-3.4328,-73.45901,-139.10728,0.11035528,-0.22243449,9.545625,595000
|
| 81 |
+
1.0,0.9999999,0.02987929,2.987929,1.0298792,0.8614351,-5.6872096,-71.7231,-141.25444,0.14974447,-0.22954665,12.751015,600000
|
| 82 |
+
1.0,0.9999999,0.030979244,3.0979247,1.0309792,1.107437,-2.9265149,-71.743835,-146.82838,0.22294378,-0.14600557,14.812841,605000
|
| 83 |
+
1.0,1.0,0.03224872,3.224872,1.0322487,1.0618403,-2.364348,-73.65596,-146.10487,0.245281,-0.24714561,14.892716,610000
|
| 84 |
+
1.0,0.9999998,0.030732192,3.0732193,1.030732,0.8814149,0.09992102,-72.30663,-142.08357,0.1543987,-0.21309137,12.655043,615000
|
| 85 |
+
1.0,1.0,0.03180063,3.180063,1.0318006,0.88567686,-2.5908768,-70.88125,-154.24501,1.1901262,-0.80033875,17.818352,620000
|
| 86 |
+
1.0,1.0,0.031212986,3.1212986,1.031213,0.9174347,-1.4725027,-69.43783,-171.77214,0.1344833,-0.22509411,12.827198,625000
|
| 87 |
+
1.0,1.0,0.030416552,3.041655,1.0304166,1.0232195,-3.5521512,-70.19109,-147.21318,0.22218212,-0.23218468,13.394439,630000
|
| 88 |
+
1.0,1.0,0.033170365,3.3170366,1.0331703,1.1533549,-1.7205235,-75.30202,-163.02487,0.3090855,-0.2025495,15.671915,635000
|
| 89 |
+
1.0,1.0,0.030691935,3.0691934,1.030692,1.8229395,-1.737347,-68.387474,-154.5168,0.31494543,-0.32493997,20.730549,640000
|
| 90 |
+
1.0,0.9999999,0.031163484,3.1163483,1.0311633,1.6407639,-1.3121344,-74.000145,-134.80934,0.32862943,-0.37480047,23.223103,645000
|
| 91 |
+
1.0,0.99999994,0.02963058,2.9630582,1.0296305,1.0199043,-4.8180795,-68.83584,-153.2892,0.19796856,-0.30410412,15.534991,650000
|
| 92 |
+
1.0,0.99999994,0.03284984,3.2849844,1.0328498,0.9752413,2.1423984,-73.300224,-154.44049,0.22596359,-0.22738943,13.355074,655000
|
| 93 |
+
1.0,1.0,0.0313209,3.13209,1.0313209,1.2997421,-2.5187285,-71.497696,-135.1802,0.33221573,-0.39862326,20.132072,660000
|
| 94 |
+
1.0,1.0,0.03345702,3.3457017,1.033457,1.3776156,-0.63896596,-70.39292,-138.54129,0.2614699,-0.2071697,15.138164,665000
|
| 95 |
+
1.0,1.0000001,0.032534555,3.2534554,1.0325347,0.89035696,-2.6658297,-69.52831,-129.90323,0.305494,-0.27815568,12.584045,670000
|
| 96 |
+
1.0,1.0,0.03000249,3.0002491,1.0300025,0.9322708,-2.5420017,-69.8063,-155.13002,0.12459258,-0.21550915,13.242807,675000
|
| 97 |
+
1.0,0.999959,0.033283103,3.32831,1.0332421,1.8211697,0.9922099,-72.17238,-147.34123,1.4635212,-1.3936031,30.857166,680000
|
| 98 |
+
1.0,0.99999994,0.03253537,3.253537,1.0325353,0.7820879,-2.3383803,-68.995804,-163.51712,0.21477246,-0.284114,11.978713,685000
|
| 99 |
+
1.0,1.0,0.030495383,3.0495381,1.0304954,1.041303,-0.39875978,-69.799515,-149.21193,0.34633097,-0.38598168,17.749357,690000
|
| 100 |
+
1.0,1.0,0.029893875,2.9893875,1.0298939,1.3992919,-3.222465,-66.52111,-161.41667,0.81703764,-0.8086956,22.862597,695000
|
| 101 |
+
1.0,0.99999994,0.028871637,2.8871639,1.0288715,1.1437153,-0.8859671,-67.24562,-151.3075,0.97736984,-1.0099361,19.322903,700000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33b16d02eab2cb7726884132890d000a30345526c6a3e20292e827a87bc8ac2e
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48021c43fde0bbb1e6d60792efd045314f2096ee18cad08804b61d7373fab01e
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eabbd9587de32b106c562b3584e36a928ae604f13a454cc31174672a09c51320
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5ac34b0923a82761d1d8d3e717861a076ad10f6ea9f9df7f6a05a2e4bff9dce
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02cafd5642dc31c62d967bcf14865d42d22aba75d52547aed8a760b6af01caaf
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8cae412a9e687e75bd51dd444e299a0a4467b0ba60260e92691d8fbb2998e5fa
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17d6d41122e312bf371ec9f046708a791bfa9d6c728c2d47b236536e6cd0931d
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:683cbf510cabbc5d00e37679a5f9c6bfa34019a46a51020c5f7e0d99d0b550ee
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3598160ba95a187fc00b6e6dc6d1237cd118be22e3fb9df9b17e50718ff65c0
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cdb49e99fe88732bcb30767b77eccbc16b657e509c9bc959912742da2576c6e8
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_114631/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/j39vnpzh
|