Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/env.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_450000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_500000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.0720483544418701,-0.007832861388471227,-0.07227476112194019,-0.002911800945123014,14.362979967191913,46.850000000013424,0.16,23891.7,-0.84,-934.84,935.0,2.7934979152679444,450000
|
| 3 |
+
0.0,0.0,-0.041538476758114666,0.0042099328609521754,-0.0416547366410843,0.010947004600947276,21.50025648731857,25.84200000000581,0.62,61898.34,-0.38,-514.92,514.84,1.5659972286224366,500000
|
| 4 |
+
0.0,0.0,-0.03719252682595383,0.004268656883505968,-0.03700847765204509,-0.004466428212133387,33.40482437441269,8.146000000000436,0.96,77992.36,-0.06,-176.04,160.92,0.5236720752716064,550000
|
| 5 |
+
0.0,0.0,-0.04271051578529558,0.012151720516081274,-0.041867918483182213,0.010377784568603325,34.488838910358666,4.433000000000206,0.98,84239.74,-0.02,-85.68,86.66,0.2934707546234131,600000
|
| 6 |
+
0.0,0.0,-0.02851539258587288,0.015257449457215001,-0.027017316926088098,0.024392104478190794,35.5296336135383,2.8939999999999064,1.0,88404.38,0.0,-54.88,55.88,0.19071667671203613,650000
|
| 7 |
+
0.0,0.0,-0.009667553151716666,0.03564057516089196,-0.007646341018357526,0.027959770346825327,35.39076246506454,2.0519999999999725,1.0,90805.22,0.0,-38.04,39.04,0.1409156560897827,700000
|
| 8 |
+
0.0,0.0,-0.029346058425957087,0.02682453774361936,-0.02690629992124704,0.027184906374803683,35.732380720864,1.7049999999999932,1.0,92704.04,0.0,-31.1,32.1,0.11353589057922363,750000
|
| 9 |
+
0.0,0.0,-0.024844851790122535,0.04560113449132418,-0.022334756086866678,0.03470270834568964,35.68203752358479,1.816999999999982,1.0,94462.1,0.0,-33.34,34.34,0.12291325092315673,800000
|
| 10 |
+
0.0,0.0,-0.031153031408898007,0.02495373230135104,-0.02858738757011633,0.03149044188234423,35.70873849196752,1.8929999999999731,1.0,96238.5,0.0,-34.86,35.86,0.12667259693145752,850000
|
| 11 |
+
0.0,0.0,-0.03052214310230714,0.030734818823542228,-0.02812344038976095,0.031450083353465975,35.71881600215001,1.6599999999999908,1.0,97969.38,0.0,-30.2,31.2,0.11233081817626953,900000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.0720483544418701,-0.007832861388471227,-0.07227476112194019,-0.002911800945123014,14.362979967191913,46.850000000013424,0.16,23891.7,-0.84,-934.84,935.0,2.7934979152679444,450000
|
| 3 |
+
0.0,0.0,-0.041538476758114666,0.0042099328609521754,-0.0416547366410843,0.010947004600947276,21.50025648731857,25.84200000000581,0.62,61898.34,-0.38,-514.92,514.84,1.5659972286224366,500000
|
| 4 |
+
0.0,0.0,-0.03719252682595383,0.004268656883505968,-0.03700847765204509,-0.004466428212133387,33.40482437441269,8.146000000000436,0.96,77992.36,-0.06,-176.04,160.92,0.5236720752716064,550000
|
| 5 |
+
0.0,0.0,-0.04271051578529558,0.012151720516081274,-0.041867918483182213,0.010377784568603325,34.488838910358666,4.433000000000206,0.98,84239.74,-0.02,-85.68,86.66,0.2934707546234131,600000
|
| 6 |
+
0.0,0.0,-0.02851539258587288,0.015257449457215001,-0.027017316926088098,0.024392104478190794,35.5296336135383,2.8939999999999064,1.0,88404.38,0.0,-54.88,55.88,0.19071667671203613,650000
|
| 7 |
+
0.0,0.0,-0.009667553151716666,0.03564057516089196,-0.007646341018357526,0.027959770346825327,35.39076246506454,2.0519999999999725,1.0,90805.22,0.0,-38.04,39.04,0.1409156560897827,700000
|
| 8 |
+
0.0,0.0,-0.029346058425957087,0.02682453774361936,-0.02690629992124704,0.027184906374803683,35.732380720864,1.7049999999999932,1.0,92704.04,0.0,-31.1,32.1,0.11353589057922363,750000
|
| 9 |
+
0.0,0.0,-0.024844851790122535,0.04560113449132418,-0.022334756086866678,0.03470270834568964,35.68203752358479,1.816999999999982,1.0,94462.1,0.0,-33.34,34.34,0.12291325092315673,800000
|
| 10 |
+
0.0,0.0,-0.031153031408898007,0.02495373230135104,-0.02858738757011633,0.03149044188234423,35.70873849196752,1.8929999999999731,1.0,96238.5,0.0,-34.86,35.86,0.12667259693145752,850000
|
| 11 |
+
0.0,0.0,-0.03052214310230714,0.030734818823542228,-0.02812344038976095,0.031450083353465975,35.71881600215001,1.6599999999999908,1.0,97969.38,0.0,-30.2,31.2,0.11233081817626953,900000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,0.9999999,0.0075371885,0.75371885,1.0075371,8.804116,-136.16286,-279.61572,-309.2374,7.477375,-8.966198,242.77518,405000
|
| 3 |
+
1.0,1.0000001,0.008307735,0.8307735,1.0083078,2.0147722,-144.61073,-275.715,-307.2552,0.6177016,-0.5612673,34.67003,410000
|
| 4 |
+
1.0,0.99999994,0.007912666,0.79126656,1.0079126,2.7492387,-118.673004,-271.33984,-308.74542,0.5057316,-0.40208173,39.80538,415000
|
| 5 |
+
1.0,1.0,0.007912949,0.7912948,1.007913,2.0826356,-179.05956,-277.69214,-307.19434,0.42232287,-0.41593993,32.285774,420000
|
| 6 |
+
1.0,0.99999994,0.008476924,0.8476924,1.0084769,2.5299077,-107.38079,-276.9732,-307.3062,0.85589796,-0.44947162,39.310867,425000
|
| 7 |
+
1.0,0.9999991,0.007198694,0.7198695,1.0071979,3.8247774,1.5644128,-275.9047,-307.93256,1.4052582,-1.5237988,62.87347,430000
|
| 8 |
+
1.0,1.0,0.007906193,0.7906194,1.0079062,2.4705577,-108.61214,-280.05856,-309.66638,0.48355687,-0.79832506,38.149853,435000
|
| 9 |
+
1.0,0.99999994,0.007300273,0.7300273,1.0073003,2.4220579,-102.41321,-275.8031,-308.76932,0.46381015,-0.341703,35.93393,440000
|
| 10 |
+
1.0,1.0,0.00722488,0.722488,1.0072249,2.544745,-99.800865,-277.74527,-309.10513,0.8388834,-0.69998467,38.187077,445000
|
| 11 |
+
1.0,0.9999999,0.0074577597,0.74577594,1.0074576,2.4919195,-98.00548,-275.04153,-307.65906,1.4642631,-1.2336649,40.787346,450000
|
| 12 |
+
1.0,0.99999994,0.007308078,0.73080784,1.007308,2.6536205,-68.32049,-273.361,-307.66617,4.0406175,-2.2214725,88.87776,455000
|
| 13 |
+
1.0,0.9999999,0.008279532,0.82795334,1.0082794,2.6241271,-94.72681,-274.67627,-308.3493,0.5529263,-0.6048801,37.467434,460000
|
| 14 |
+
1.0,1.0,0.008258792,0.82587916,1.0082588,2.5106723,-92.27951,-275.76367,-307.58383,0.47676104,-0.33911347,35.18519,465000
|
| 15 |
+
1.0,0.9999999,0.008401507,0.8401508,1.0084014,2.2271535,-51.270573,-268.577,-307.20065,0.5276741,-0.7419578,38.15906,470000
|
| 16 |
+
1.0,1.0,0.008391898,0.8391898,1.0083919,5.9858985,-33.901955,-266.08652,-308.6454,1.9789487,-4.3275185,79.98523,475000
|
| 17 |
+
1.0,1.0,0.008095154,0.80951536,1.0080951,2.288417,-72.09792,-269.01865,-307.91522,0.6794299,-0.5667628,37.840424,480000
|
| 18 |
+
1.0,1.0,0.007999852,0.7999852,1.0079999,2.2910988,-30.085194,-269.9833,-307.7342,0.41820097,-0.9101933,31.906025,485000
|
| 19 |
+
1.0,1.0,0.007985253,0.79852533,1.0079852,2.0801237,-25.166191,-271.12524,-307.9849,0.81459606,-0.35865238,32.650158,490000
|
| 20 |
+
1.0,1.0,0.008632393,0.8632393,1.0086324,2.4584491,-86.098724,-272.14322,-307.77673,0.4578223,-0.3743875,33.83605,495000
|
| 21 |
+
1.0,0.99999994,0.0077570984,0.7757099,1.0077571,3.5420837,-58.347874,-268.51498,-309.04855,0.859331,-0.4814654,42.73734,500000
|
| 22 |
+
1.0,1.0,0.007545411,0.7545411,1.0075454,2.2040184,-68.3101,-272.72827,-307.3644,0.37440926,-0.4534275,30.785961,505000
|
| 23 |
+
1.0,1.0,0.008026194,0.8026194,1.0080262,2.5938084,-88.33059,-273.79245,-307.84232,0.41693807,-0.7503741,38.45096,510000
|
| 24 |
+
1.0,1.0,0.007641554,0.7641554,1.0076416,3.7341907,-91.67455,-267.49496,-308.97873,3.7559807,-3.7064714,98.69859,515000
|
| 25 |
+
1.0,1.0,0.0073474785,0.73474777,1.0073475,2.2396297,-23.073711,-266.50192,-308.5673,0.732958,-0.5799924,35.929356,520000
|
| 26 |
+
1.0,1.0,0.007384839,0.7384839,1.0073849,2.1181195,-35.877552,-273.7413,-308.51407,0.28396916,-0.3545977,30.797735,525000
|
| 27 |
+
1.0,1.0,0.008004375,0.80043745,1.0080044,2.2736263,-57.29007,-270.78107,-307.1764,0.63767684,-0.38428637,36.04249,530000
|
| 28 |
+
1.0,1.0,0.007465025,0.7465025,1.007465,2.275249,-35.764786,-270.70218,-308.8162,0.9312223,-0.49816266,37.83214,535000
|
| 29 |
+
1.0,1.0,0.008083385,0.8083385,1.0080833,2.2709186,-45.977722,-267.42667,-307.54547,0.31867647,-0.32634625,32.82846,540000
|
| 30 |
+
1.0,0.99999994,0.00884212,0.884212,1.0088421,4.1511154,-11.263016,-264.54544,-307.5731,0.9739139,-1.5708456,67.681335,545000
|
| 31 |
+
1.0,1.0,0.007511528,0.7511528,1.0075115,2.7305412,-45.872612,-268.142,-308.07687,0.42674088,-0.74540734,39.190067,550000
|
| 32 |
+
1.0,1.0,0.0075206165,0.7520616,1.0075207,2.6304412,-30.164999,-267.7431,-308.15912,0.6330496,-0.60486275,38.1336,555000
|
| 33 |
+
1.0,0.99999994,0.0074166814,0.7416681,1.0074166,3.1296885,-21.433508,-261.17465,-307.6649,1.1308553,-0.7159438,43.121758,560000
|
| 34 |
+
1.0,1.0,0.009143475,0.9143476,1.0091435,2.8267958,-9.907264,-263.89987,-307.60928,0.84809005,-0.6009834,40.363026,565000
|
| 35 |
+
1.0,0.9999999,0.008725996,0.87259966,1.0087259,13.210422,-23.439804,-262.85822,-308.28546,6.635368,-7.897646,174.04889,570000
|
| 36 |
+
1.0,1.0,0.008862739,0.8862739,1.0088627,3.0883477,-22.421421,-262.80704,-307.57898,0.7028522,-0.6880181,38.753395,575000
|
| 37 |
+
1.0,0.99999994,0.009809884,0.98098844,1.0098099,3.501876,-14.666053,-260.4222,-307.07556,0.84632844,-1.2550993,45.105362,580000
|
| 38 |
+
1.0,1.0,0.008687713,0.8687714,1.0086877,2.9225852,-5.280142,-255.54509,-307.2899,1.016813,-0.68104845,42.073982,585000
|
| 39 |
+
1.0,1.0,0.008994706,0.8994707,1.0089947,3.21231,-6.493118,-258.519,-307.63596,0.88565016,-0.8787372,40.96319,590000
|
| 40 |
+
1.0,1.0000002,0.008838522,0.88385224,1.0088388,3.1019216,-10.446144,-263.79514,-307.70297,0.5184799,-0.4668311,40.79864,595000
|
| 41 |
+
1.0,0.9999999,0.009470777,0.94707763,1.0094707,3.0672586,-11.090955,-255.44307,-307.58072,1.4189162,-0.9099077,49.483185,600000
|
| 42 |
+
1.0,1.0,0.009494083,0.9494083,1.0094941,3.663075,-3.7921438,-254.75108,-307.67828,0.5371804,-0.89748305,47.68012,605000
|
| 43 |
+
1.0,1.0,0.00913631,0.913631,1.0091363,3.684562,-9.829289,-259.3906,-307.0688,0.61904067,-1.2402115,50.8039,610000
|
| 44 |
+
1.0,1.0,0.009497518,0.9497518,1.0094975,3.4426477,-13.345113,-253.28304,-307.9609,1.1658486,-0.8539448,43.07381,615000
|
| 45 |
+
1.0,1.0,0.009140712,0.9140712,1.0091407,2.900712,-8.66068,-259.39304,-307.8105,0.8455602,-0.7994654,40.11459,620000
|
| 46 |
+
1.0,1.0,0.008558932,0.8558932,1.008559,3.7162864,-32.452965,-260.61337,-308.20023,1.1547204,-0.9542992,60.921345,625000
|
| 47 |
+
1.0,0.99999994,0.008544074,0.8544074,1.008544,4.351953,-2.4908764,-260.31845,-307.02954,0.7100177,-0.6380743,45.447075,630000
|
| 48 |
+
1.0,0.99999994,0.0088301785,0.8830178,1.0088301,3.0590522,-7.065516,-257.1711,-307.60156,0.549687,-0.68348956,42.69752,635000
|
| 49 |
+
1.0,0.99999994,0.008895757,0.8895757,1.0088958,3.149722,2.183459,-260.1868,-307.1506,0.6675361,-0.6173196,39.78515,640000
|
| 50 |
+
1.0,1.0,0.009119523,0.9119524,1.0091195,2.9689758,-6.454413,-249.67735,-308.3753,1.2173822,-0.45205998,35.31079,645000
|
| 51 |
+
1.0,0.99999994,0.008274682,0.82746816,1.0082747,2.9171805,-17.015848,-265.28604,-308.02216,0.9155754,-0.52114546,39.079647,650000
|
| 52 |
+
1.0,0.99999994,0.007990601,0.79906,1.0079906,2.767384,-1.875886,-255.1339,-307.66687,2.4051063,-0.6302196,41.345627,655000
|
| 53 |
+
1.0,1.0,0.008048507,0.8048508,1.0080485,3.15551,-5.156154,-255.19066,-307.50827,0.44888836,-1.0424998,44.150978,660000
|
| 54 |
+
1.0,1.0000001,0.008950197,0.89501965,1.0089504,2.625269,-21.185123,-254.47803,-307.6118,0.6128526,-0.3598295,33.97355,665000
|
| 55 |
+
1.0,0.99999994,0.008051534,0.8051535,1.0080515,5.5787215,-1.9301211,-259.14606,-307.4623,0.86058766,-0.6840587,50.53833,670000
|
| 56 |
+
1.0,1.0,0.009255779,0.92557794,1.0092558,3.0602438,-3.500426,-251.29903,-308.64294,0.6307951,-0.64002144,42.863,675000
|
| 57 |
+
1.0,1.0,0.008747215,0.8747215,1.0087472,2.968475,-2.886275,-250.81023,-307.2983,0.48780566,-1.1428099,39.671673,680000
|
| 58 |
+
1.0,0.9999964,0.008679053,0.86790526,1.0086755,3.1438272,-1.8047241,-256.55005,-308.0631,1.5878187,-0.7237828,41.416885,685000
|
| 59 |
+
1.0,1.0,0.009471723,0.9471723,1.0094718,2.8201,-6.707945,-250.37077,-307.93817,0.88042355,-0.5424162,37.06327,690000
|
| 60 |
+
1.0,1.0,0.009392712,0.9392712,1.0093927,2.6455216,-3.4888673,-255.60283,-307.97797,0.50139034,-0.79106396,36.976532,695000
|
| 61 |
+
1.0,1.0,0.009307079,0.93070793,1.009307,2.7210693,-3.8907652,-249.12007,-306.4418,0.25776422,-0.6909638,33.668934,700000
|
| 62 |
+
1.0,1.0,0.008639046,0.86390465,1.0086391,3.0304112,-4.398509,-249.3042,-307.58887,0.60789335,-0.71860456,38.372658,705000
|
| 63 |
+
1.0,1.0,0.009788712,0.9788712,1.0097888,2.7660172,-2.4322379,-246.54887,-307.98456,0.60826105,-0.80303854,37.513832,710000
|
| 64 |
+
1.0,1.0,0.010442007,1.0442008,1.010442,3.7351906,-7.6642466,-243.91971,-308.98355,0.7382628,-0.7811479,46.781075,715000
|
| 65 |
+
1.0,1.0,0.0091466755,0.91466755,1.0091467,3.1320705,-1.2335199,-235.88048,-308.40427,1.1022093,-0.6438372,40.234848,720000
|
| 66 |
+
1.0,1.0,0.009574369,0.9574368,1.0095744,3.1697752,-6.932367,-252.7105,-307.91623,1.1003408,-1.1767387,48.15818,725000
|
| 67 |
+
1.0,1.0,0.009259114,0.9259114,1.0092591,8.474109,-4.373792,-245.846,-307.2827,2.8319578,-0.45792696,55.595184,730000
|
| 68 |
+
1.0,0.99999994,0.008862907,0.8862907,1.0088629,4.391243,-2.4060652,-245.01704,-308.52942,1.2658547,-1.4087075,73.59408,735000
|
| 69 |
+
1.0,1.0,0.009543539,0.9543539,1.0095435,3.099223,-5.298288,-254.021,-307.23965,1.317567,-0.7592999,42.755386,740000
|
| 70 |
+
1.0,1.0,0.009315068,0.93150675,1.009315,3.6008668,-1.9423596,-254.35155,-307.59903,1.4934357,-0.6010085,54.140484,745000
|
| 71 |
+
1.0,1.0,0.0095509235,0.95509243,1.0095509,3.1122046,-11.321481,-246.34146,-307.23193,0.99046785,-0.5857379,37.18862,750000
|
| 72 |
+
1.0,0.99999994,0.009886675,0.9886675,1.0098866,2.8299253,-6.0156755,-248.78413,-308.44064,1.0840632,-0.45442763,37.55433,755000
|
| 73 |
+
1.0,1.0,0.008714982,0.8714982,1.008715,2.7457807,-0.69346255,-245.99239,-308.09766,0.4916335,-1.1787713,38.498825,760000
|
| 74 |
+
1.0,1.0,0.008400511,0.8400511,1.0084006,2.2721257,-6.6372232,-251.65445,-308.59906,0.7530451,-0.30459473,30.822662,765000
|
| 75 |
+
1.0,1.0,0.009784812,0.97848123,1.0097848,2.860456,-1.4035528,-241.23145,-307.73242,0.32827288,-1.1131787,37.222916,770000
|
| 76 |
+
1.0,0.99999994,0.008529015,0.8529015,1.008529,2.6391308,-4.953211,-251.39746,-308.4528,0.63448036,-0.8762113,35.83683,775000
|
| 77 |
+
1.0,1.0,0.008909285,0.8909286,1.0089092,3.0746734,-6.574179,-249.98888,-307.47787,0.3867192,-0.5603934,40.131523,780000
|
| 78 |
+
1.0,1.0,0.009142568,0.91425675,1.0091425,5.1503253,-2.1533194,-245.84676,-307.37424,1.7731184,-2.9483483,79.52136,785000
|
| 79 |
+
1.0,1.0,0.009776278,0.9776279,1.0097762,3.047451,-5.841293,-241.13647,-307.537,0.492688,-0.60441256,37.255596,790000
|
| 80 |
+
1.0,1.0,0.009254726,0.9254726,1.0092547,2.5417485,-5.9839573,-246.2539,-307.48663,0.2843491,-0.4746151,31.542938,795000
|
| 81 |
+
1.0,0.99999994,0.008649866,0.86498666,1.0086498,2.619959,-3.7659504,-242.32475,-307.75513,0.5297734,-1.2077831,40.61086,800000
|
| 82 |
+
1.0,1.0,0.009507526,0.9507527,1.0095075,3.2308183,-5.3417463,-245.38219,-306.69476,0.65546644,-0.6191979,40.833096,805000
|
| 83 |
+
1.0,1.0,0.009562053,0.95620525,1.009562,3.258284,-11.516997,-247.59166,-308.45926,0.5813041,-0.5238812,40.414577,810000
|
| 84 |
+
1.0,1.0000001,0.009565238,0.9565238,1.0095654,2.841657,-6.4221787,-237.19254,-306.85892,0.6254442,-0.81315684,37.47847,815000
|
| 85 |
+
1.0,1.0,0.008763332,0.87633324,1.0087633,2.0802786,-3.5383482,-243.41264,-307.54022,0.9949417,-0.97801596,32.016743,820000
|
| 86 |
+
1.0,1.0,0.008473445,0.8473445,1.0084734,2.2332714,-4.4190598,-247.60205,-306.9306,0.764868,-1.3930085,33.308403,825000
|
| 87 |
+
1.0,1.0,0.009892008,0.98920083,1.009892,3.464914,-7.5283475,-242.56665,-306.69608,0.8076664,-0.58986396,51.80994,830000
|
| 88 |
+
1.0,0.99999994,0.009157394,0.9157394,1.0091573,3.0091398,-3.9246833,-239.52568,-307.21777,0.9317335,-0.54630107,43.19123,835000
|
| 89 |
+
1.0,1.0,0.010350676,1.0350677,1.0103507,2.991179,-5.1866746,-237.10657,-307.23233,0.7023873,-1.4605534,45.242634,840000
|
| 90 |
+
1.0,0.99999994,0.009961155,0.99611557,1.0099611,2.3743963,-5.752917,-233.60179,-307.7667,0.59666336,-1.2129953,38.484108,845000
|
| 91 |
+
1.0,1.0000001,0.009624566,0.96245664,1.0096247,3.2845333,-2.9909983,-237.74438,-307.26672,0.57658434,-0.6425176,37.305473,850000
|
| 92 |
+
1.0,1.0,0.009192642,0.9192642,1.0091926,2.1907663,-6.167241,-242.81163,-307.97598,0.47544798,-0.35868263,30.062199,855000
|
| 93 |
+
1.0,1.0,0.009896228,0.9896228,1.0098963,3.675367,-5.475681,-229.78154,-307.36053,0.59080786,-0.7050901,38.95228,860000
|
| 94 |
+
1.0,1.0,0.008546922,0.85469234,1.008547,2.3650327,-0.53156006,-237.03133,-306.3292,0.5865322,-0.5113578,32.527225,865000
|
| 95 |
+
1.0,1.0,0.009792127,0.97921276,1.0097921,3.7731118,-4.6430154,-240.75337,-307.1514,1.0479032,-1.5528116,52.485065,870000
|
| 96 |
+
1.0,0.9999999,0.00972306,0.97230595,1.009723,2.709153,0.4024132,-236.12169,-307.02734,0.40845686,-1.0713315,36.835606,875000
|
| 97 |
+
1.0,1.0,0.009305179,0.93051785,1.0093052,3.377398,-3.606733,-247.49486,-306.5257,1.554063,-0.5819482,50.971165,880000
|
| 98 |
+
1.0,0.99999994,0.0084706135,0.84706146,1.0084705,2.550502,-7.616336,-245.20618,-308.1611,0.73761606,-0.9317355,42.56286,885000
|
| 99 |
+
1.0,1.0,0.009894727,0.9894727,1.0098947,2.906594,1.252499,-234.6022,-307.79874,2.4188478,-0.5889175,42.283504,890000
|
| 100 |
+
1.0,0.9999999,0.009056546,0.90565455,1.0090564,2.7734036,-1.0601113,-234.41338,-307.77637,0.72177786,-0.9175116,36.23427,895000
|
| 101 |
+
1.0,1.0,0.009332472,0.93324727,1.0093324,3.4309938,-5.1093593,-243.06116,-306.9879,1.0355103,-1.0717793,58.04723,900000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,0.9999999,0.0075371885,0.75371885,1.0075371,8.804116,-136.16286,-279.61572,-309.2374,7.477375,-8.966198,242.77518,405000
|
| 3 |
+
1.0,1.0000001,0.008307735,0.8307735,1.0083078,2.0147722,-144.61073,-275.715,-307.2552,0.6177016,-0.5612673,34.67003,410000
|
| 4 |
+
1.0,0.99999994,0.007912666,0.79126656,1.0079126,2.7492387,-118.673004,-271.33984,-308.74542,0.5057316,-0.40208173,39.80538,415000
|
| 5 |
+
1.0,1.0,0.007912949,0.7912948,1.007913,2.0826356,-179.05956,-277.69214,-307.19434,0.42232287,-0.41593993,32.285774,420000
|
| 6 |
+
1.0,0.99999994,0.008476924,0.8476924,1.0084769,2.5299077,-107.38079,-276.9732,-307.3062,0.85589796,-0.44947162,39.310867,425000
|
| 7 |
+
1.0,0.9999991,0.007198694,0.7198695,1.0071979,3.8247774,1.5644128,-275.9047,-307.93256,1.4052582,-1.5237988,62.87347,430000
|
| 8 |
+
1.0,1.0,0.007906193,0.7906194,1.0079062,2.4705577,-108.61214,-280.05856,-309.66638,0.48355687,-0.79832506,38.149853,435000
|
| 9 |
+
1.0,0.99999994,0.007300273,0.7300273,1.0073003,2.4220579,-102.41321,-275.8031,-308.76932,0.46381015,-0.341703,35.93393,440000
|
| 10 |
+
1.0,1.0,0.00722488,0.722488,1.0072249,2.544745,-99.800865,-277.74527,-309.10513,0.8388834,-0.69998467,38.187077,445000
|
| 11 |
+
1.0,0.9999999,0.0074577597,0.74577594,1.0074576,2.4919195,-98.00548,-275.04153,-307.65906,1.4642631,-1.2336649,40.787346,450000
|
| 12 |
+
1.0,0.99999994,0.007308078,0.73080784,1.007308,2.6536205,-68.32049,-273.361,-307.66617,4.0406175,-2.2214725,88.87776,455000
|
| 13 |
+
1.0,0.9999999,0.008279532,0.82795334,1.0082794,2.6241271,-94.72681,-274.67627,-308.3493,0.5529263,-0.6048801,37.467434,460000
|
| 14 |
+
1.0,1.0,0.008258792,0.82587916,1.0082588,2.5106723,-92.27951,-275.76367,-307.58383,0.47676104,-0.33911347,35.18519,465000
|
| 15 |
+
1.0,0.9999999,0.008401507,0.8401508,1.0084014,2.2271535,-51.270573,-268.577,-307.20065,0.5276741,-0.7419578,38.15906,470000
|
| 16 |
+
1.0,1.0,0.008391898,0.8391898,1.0083919,5.9858985,-33.901955,-266.08652,-308.6454,1.9789487,-4.3275185,79.98523,475000
|
| 17 |
+
1.0,1.0,0.008095154,0.80951536,1.0080951,2.288417,-72.09792,-269.01865,-307.91522,0.6794299,-0.5667628,37.840424,480000
|
| 18 |
+
1.0,1.0,0.007999852,0.7999852,1.0079999,2.2910988,-30.085194,-269.9833,-307.7342,0.41820097,-0.9101933,31.906025,485000
|
| 19 |
+
1.0,1.0,0.007985253,0.79852533,1.0079852,2.0801237,-25.166191,-271.12524,-307.9849,0.81459606,-0.35865238,32.650158,490000
|
| 20 |
+
1.0,1.0,0.008632393,0.8632393,1.0086324,2.4584491,-86.098724,-272.14322,-307.77673,0.4578223,-0.3743875,33.83605,495000
|
| 21 |
+
1.0,0.99999994,0.0077570984,0.7757099,1.0077571,3.5420837,-58.347874,-268.51498,-309.04855,0.859331,-0.4814654,42.73734,500000
|
| 22 |
+
1.0,1.0,0.007545411,0.7545411,1.0075454,2.2040184,-68.3101,-272.72827,-307.3644,0.37440926,-0.4534275,30.785961,505000
|
| 23 |
+
1.0,1.0,0.008026194,0.8026194,1.0080262,2.5938084,-88.33059,-273.79245,-307.84232,0.41693807,-0.7503741,38.45096,510000
|
| 24 |
+
1.0,1.0,0.007641554,0.7641554,1.0076416,3.7341907,-91.67455,-267.49496,-308.97873,3.7559807,-3.7064714,98.69859,515000
|
| 25 |
+
1.0,1.0,0.0073474785,0.73474777,1.0073475,2.2396297,-23.073711,-266.50192,-308.5673,0.732958,-0.5799924,35.929356,520000
|
| 26 |
+
1.0,1.0,0.007384839,0.7384839,1.0073849,2.1181195,-35.877552,-273.7413,-308.51407,0.28396916,-0.3545977,30.797735,525000
|
| 27 |
+
1.0,1.0,0.008004375,0.80043745,1.0080044,2.2736263,-57.29007,-270.78107,-307.1764,0.63767684,-0.38428637,36.04249,530000
|
| 28 |
+
1.0,1.0,0.007465025,0.7465025,1.007465,2.275249,-35.764786,-270.70218,-308.8162,0.9312223,-0.49816266,37.83214,535000
|
| 29 |
+
1.0,1.0,0.008083385,0.8083385,1.0080833,2.2709186,-45.977722,-267.42667,-307.54547,0.31867647,-0.32634625,32.82846,540000
|
| 30 |
+
1.0,0.99999994,0.00884212,0.884212,1.0088421,4.1511154,-11.263016,-264.54544,-307.5731,0.9739139,-1.5708456,67.681335,545000
|
| 31 |
+
1.0,1.0,0.007511528,0.7511528,1.0075115,2.7305412,-45.872612,-268.142,-308.07687,0.42674088,-0.74540734,39.190067,550000
|
| 32 |
+
1.0,1.0,0.0075206165,0.7520616,1.0075207,2.6304412,-30.164999,-267.7431,-308.15912,0.6330496,-0.60486275,38.1336,555000
|
| 33 |
+
1.0,0.99999994,0.0074166814,0.7416681,1.0074166,3.1296885,-21.433508,-261.17465,-307.6649,1.1308553,-0.7159438,43.121758,560000
|
| 34 |
+
1.0,1.0,0.009143475,0.9143476,1.0091435,2.8267958,-9.907264,-263.89987,-307.60928,0.84809005,-0.6009834,40.363026,565000
|
| 35 |
+
1.0,0.9999999,0.008725996,0.87259966,1.0087259,13.210422,-23.439804,-262.85822,-308.28546,6.635368,-7.897646,174.04889,570000
|
| 36 |
+
1.0,1.0,0.008862739,0.8862739,1.0088627,3.0883477,-22.421421,-262.80704,-307.57898,0.7028522,-0.6880181,38.753395,575000
|
| 37 |
+
1.0,0.99999994,0.009809884,0.98098844,1.0098099,3.501876,-14.666053,-260.4222,-307.07556,0.84632844,-1.2550993,45.105362,580000
|
| 38 |
+
1.0,1.0,0.008687713,0.8687714,1.0086877,2.9225852,-5.280142,-255.54509,-307.2899,1.016813,-0.68104845,42.073982,585000
|
| 39 |
+
1.0,1.0,0.008994706,0.8994707,1.0089947,3.21231,-6.493118,-258.519,-307.63596,0.88565016,-0.8787372,40.96319,590000
|
| 40 |
+
1.0,1.0000002,0.008838522,0.88385224,1.0088388,3.1019216,-10.446144,-263.79514,-307.70297,0.5184799,-0.4668311,40.79864,595000
|
| 41 |
+
1.0,0.9999999,0.009470777,0.94707763,1.0094707,3.0672586,-11.090955,-255.44307,-307.58072,1.4189162,-0.9099077,49.483185,600000
|
| 42 |
+
1.0,1.0,0.009494083,0.9494083,1.0094941,3.663075,-3.7921438,-254.75108,-307.67828,0.5371804,-0.89748305,47.68012,605000
|
| 43 |
+
1.0,1.0,0.00913631,0.913631,1.0091363,3.684562,-9.829289,-259.3906,-307.0688,0.61904067,-1.2402115,50.8039,610000
|
| 44 |
+
1.0,1.0,0.009497518,0.9497518,1.0094975,3.4426477,-13.345113,-253.28304,-307.9609,1.1658486,-0.8539448,43.07381,615000
|
| 45 |
+
1.0,1.0,0.009140712,0.9140712,1.0091407,2.900712,-8.66068,-259.39304,-307.8105,0.8455602,-0.7994654,40.11459,620000
|
| 46 |
+
1.0,1.0,0.008558932,0.8558932,1.008559,3.7162864,-32.452965,-260.61337,-308.20023,1.1547204,-0.9542992,60.921345,625000
|
| 47 |
+
1.0,0.99999994,0.008544074,0.8544074,1.008544,4.351953,-2.4908764,-260.31845,-307.02954,0.7100177,-0.6380743,45.447075,630000
|
| 48 |
+
1.0,0.99999994,0.0088301785,0.8830178,1.0088301,3.0590522,-7.065516,-257.1711,-307.60156,0.549687,-0.68348956,42.69752,635000
|
| 49 |
+
1.0,0.99999994,0.008895757,0.8895757,1.0088958,3.149722,2.183459,-260.1868,-307.1506,0.6675361,-0.6173196,39.78515,640000
|
| 50 |
+
1.0,1.0,0.009119523,0.9119524,1.0091195,2.9689758,-6.454413,-249.67735,-308.3753,1.2173822,-0.45205998,35.31079,645000
|
| 51 |
+
1.0,0.99999994,0.008274682,0.82746816,1.0082747,2.9171805,-17.015848,-265.28604,-308.02216,0.9155754,-0.52114546,39.079647,650000
|
| 52 |
+
1.0,0.99999994,0.007990601,0.79906,1.0079906,2.767384,-1.875886,-255.1339,-307.66687,2.4051063,-0.6302196,41.345627,655000
|
| 53 |
+
1.0,1.0,0.008048507,0.8048508,1.0080485,3.15551,-5.156154,-255.19066,-307.50827,0.44888836,-1.0424998,44.150978,660000
|
| 54 |
+
1.0,1.0000001,0.008950197,0.89501965,1.0089504,2.625269,-21.185123,-254.47803,-307.6118,0.6128526,-0.3598295,33.97355,665000
|
| 55 |
+
1.0,0.99999994,0.008051534,0.8051535,1.0080515,5.5787215,-1.9301211,-259.14606,-307.4623,0.86058766,-0.6840587,50.53833,670000
|
| 56 |
+
1.0,1.0,0.009255779,0.92557794,1.0092558,3.0602438,-3.500426,-251.29903,-308.64294,0.6307951,-0.64002144,42.863,675000
|
| 57 |
+
1.0,1.0,0.008747215,0.8747215,1.0087472,2.968475,-2.886275,-250.81023,-307.2983,0.48780566,-1.1428099,39.671673,680000
|
| 58 |
+
1.0,0.9999964,0.008679053,0.86790526,1.0086755,3.1438272,-1.8047241,-256.55005,-308.0631,1.5878187,-0.7237828,41.416885,685000
|
| 59 |
+
1.0,1.0,0.009471723,0.9471723,1.0094718,2.8201,-6.707945,-250.37077,-307.93817,0.88042355,-0.5424162,37.06327,690000
|
| 60 |
+
1.0,1.0,0.009392712,0.9392712,1.0093927,2.6455216,-3.4888673,-255.60283,-307.97797,0.50139034,-0.79106396,36.976532,695000
|
| 61 |
+
1.0,1.0,0.009307079,0.93070793,1.009307,2.7210693,-3.8907652,-249.12007,-306.4418,0.25776422,-0.6909638,33.668934,700000
|
| 62 |
+
1.0,1.0,0.008639046,0.86390465,1.0086391,3.0304112,-4.398509,-249.3042,-307.58887,0.60789335,-0.71860456,38.372658,705000
|
| 63 |
+
1.0,1.0,0.009788712,0.9788712,1.0097888,2.7660172,-2.4322379,-246.54887,-307.98456,0.60826105,-0.80303854,37.513832,710000
|
| 64 |
+
1.0,1.0,0.010442007,1.0442008,1.010442,3.7351906,-7.6642466,-243.91971,-308.98355,0.7382628,-0.7811479,46.781075,715000
|
| 65 |
+
1.0,1.0,0.0091466755,0.91466755,1.0091467,3.1320705,-1.2335199,-235.88048,-308.40427,1.1022093,-0.6438372,40.234848,720000
|
| 66 |
+
1.0,1.0,0.009574369,0.9574368,1.0095744,3.1697752,-6.932367,-252.7105,-307.91623,1.1003408,-1.1767387,48.15818,725000
|
| 67 |
+
1.0,1.0,0.009259114,0.9259114,1.0092591,8.474109,-4.373792,-245.846,-307.2827,2.8319578,-0.45792696,55.595184,730000
|
| 68 |
+
1.0,0.99999994,0.008862907,0.8862907,1.0088629,4.391243,-2.4060652,-245.01704,-308.52942,1.2658547,-1.4087075,73.59408,735000
|
| 69 |
+
1.0,1.0,0.009543539,0.9543539,1.0095435,3.099223,-5.298288,-254.021,-307.23965,1.317567,-0.7592999,42.755386,740000
|
| 70 |
+
1.0,1.0,0.009315068,0.93150675,1.009315,3.6008668,-1.9423596,-254.35155,-307.59903,1.4934357,-0.6010085,54.140484,745000
|
| 71 |
+
1.0,1.0,0.0095509235,0.95509243,1.0095509,3.1122046,-11.321481,-246.34146,-307.23193,0.99046785,-0.5857379,37.18862,750000
|
| 72 |
+
1.0,0.99999994,0.009886675,0.9886675,1.0098866,2.8299253,-6.0156755,-248.78413,-308.44064,1.0840632,-0.45442763,37.55433,755000
|
| 73 |
+
1.0,1.0,0.008714982,0.8714982,1.008715,2.7457807,-0.69346255,-245.99239,-308.09766,0.4916335,-1.1787713,38.498825,760000
|
| 74 |
+
1.0,1.0,0.008400511,0.8400511,1.0084006,2.2721257,-6.6372232,-251.65445,-308.59906,0.7530451,-0.30459473,30.822662,765000
|
| 75 |
+
1.0,1.0,0.009784812,0.97848123,1.0097848,2.860456,-1.4035528,-241.23145,-307.73242,0.32827288,-1.1131787,37.222916,770000
|
| 76 |
+
1.0,0.99999994,0.008529015,0.8529015,1.008529,2.6391308,-4.953211,-251.39746,-308.4528,0.63448036,-0.8762113,35.83683,775000
|
| 77 |
+
1.0,1.0,0.008909285,0.8909286,1.0089092,3.0746734,-6.574179,-249.98888,-307.47787,0.3867192,-0.5603934,40.131523,780000
|
| 78 |
+
1.0,1.0,0.009142568,0.91425675,1.0091425,5.1503253,-2.1533194,-245.84676,-307.37424,1.7731184,-2.9483483,79.52136,785000
|
| 79 |
+
1.0,1.0,0.009776278,0.9776279,1.0097762,3.047451,-5.841293,-241.13647,-307.537,0.492688,-0.60441256,37.255596,790000
|
| 80 |
+
1.0,1.0,0.009254726,0.9254726,1.0092547,2.5417485,-5.9839573,-246.2539,-307.48663,0.2843491,-0.4746151,31.542938,795000
|
| 81 |
+
1.0,0.99999994,0.008649866,0.86498666,1.0086498,2.619959,-3.7659504,-242.32475,-307.75513,0.5297734,-1.2077831,40.61086,800000
|
| 82 |
+
1.0,1.0,0.009507526,0.9507527,1.0095075,3.2308183,-5.3417463,-245.38219,-306.69476,0.65546644,-0.6191979,40.833096,805000
|
| 83 |
+
1.0,1.0,0.009562053,0.95620525,1.009562,3.258284,-11.516997,-247.59166,-308.45926,0.5813041,-0.5238812,40.414577,810000
|
| 84 |
+
1.0,1.0000001,0.009565238,0.9565238,1.0095654,2.841657,-6.4221787,-237.19254,-306.85892,0.6254442,-0.81315684,37.47847,815000
|
| 85 |
+
1.0,1.0,0.008763332,0.87633324,1.0087633,2.0802786,-3.5383482,-243.41264,-307.54022,0.9949417,-0.97801596,32.016743,820000
|
| 86 |
+
1.0,1.0,0.008473445,0.8473445,1.0084734,2.2332714,-4.4190598,-247.60205,-306.9306,0.764868,-1.3930085,33.308403,825000
|
| 87 |
+
1.0,1.0,0.009892008,0.98920083,1.009892,3.464914,-7.5283475,-242.56665,-306.69608,0.8076664,-0.58986396,51.80994,830000
|
| 88 |
+
1.0,0.99999994,0.009157394,0.9157394,1.0091573,3.0091398,-3.9246833,-239.52568,-307.21777,0.9317335,-0.54630107,43.19123,835000
|
| 89 |
+
1.0,1.0,0.010350676,1.0350677,1.0103507,2.991179,-5.1866746,-237.10657,-307.23233,0.7023873,-1.4605534,45.242634,840000
|
| 90 |
+
1.0,0.99999994,0.009961155,0.99611557,1.0099611,2.3743963,-5.752917,-233.60179,-307.7667,0.59666336,-1.2129953,38.484108,845000
|
| 91 |
+
1.0,1.0000001,0.009624566,0.96245664,1.0096247,3.2845333,-2.9909983,-237.74438,-307.26672,0.57658434,-0.6425176,37.305473,850000
|
| 92 |
+
1.0,1.0,0.009192642,0.9192642,1.0091926,2.1907663,-6.167241,-242.81163,-307.97598,0.47544798,-0.35868263,30.062199,855000
|
| 93 |
+
1.0,1.0,0.009896228,0.9896228,1.0098963,3.675367,-5.475681,-229.78154,-307.36053,0.59080786,-0.7050901,38.95228,860000
|
| 94 |
+
1.0,1.0,0.008546922,0.85469234,1.008547,2.3650327,-0.53156006,-237.03133,-306.3292,0.5865322,-0.5113578,32.527225,865000
|
| 95 |
+
1.0,1.0,0.009792127,0.97921276,1.0097921,3.7731118,-4.6430154,-240.75337,-307.1514,1.0479032,-1.5528116,52.485065,870000
|
| 96 |
+
1.0,0.9999999,0.00972306,0.97230595,1.009723,2.709153,0.4024132,-236.12169,-307.02734,0.40845686,-1.0713315,36.835606,875000
|
| 97 |
+
1.0,1.0,0.009305179,0.93051785,1.0093052,3.377398,-3.606733,-247.49486,-306.5257,1.554063,-0.5819482,50.971165,880000
|
| 98 |
+
1.0,0.99999994,0.0084706135,0.84706146,1.0084705,2.550502,-7.616336,-245.20618,-308.1611,0.73761606,-0.9317355,42.56286,885000
|
| 99 |
+
1.0,1.0,0.009894727,0.9894727,1.0098947,2.906594,1.252499,-234.6022,-307.79874,2.4188478,-0.5889175,42.283504,890000
|
| 100 |
+
1.0,0.9999999,0.009056546,0.90565455,1.0090564,2.7734036,-1.0601113,-234.41338,-307.77637,0.72177786,-0.9175116,36.23427,895000
|
| 101 |
+
1.0,1.0,0.009332472,0.93324727,1.0093324,3.4309938,-5.1093593,-243.06116,-306.9879,1.0355103,-1.0717793,58.04723,900000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3942ff5790e3d9b469454d4be2d28926c08832a121a2fb69587a0f96534cfec4
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86faa78454ded0176b35ccce14e48cc43b828a4241ca1166c24d2d8693cfd454
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f976ef8ff5b483e01cf4e9ef88a52019a556f85496954aac1b29416af6af0ba6
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28449c506e800ea8765df36a557d64fe32f6e813e2eaf95badf489e3a7134cd8
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:056a149ff6e2f6001cb1553579ed617ac60cfeab52536c66738377399d4c63e4
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6289932c680bf64d92b8038d04f9fd5727cfcfc780448ae87fef00ea41bf642
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c2ee14fd88de2d95aa9307bf5f3f90782e99ed56218ee9c716c55d02328bc42
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de165dbcd4a5b89f6775f7e33d21fa87f8f943905e2bea6b86fe56e87a7174f4
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:abfcc9486bc8ba3c0b3f7c7264b0f0451670cb34160b3121769ede86b7646709
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3de82658d3d4a35bfa2da65e04aa8757b15f7c138be67fa82adb1077446f5bc8
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_020846/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/jjmanmw9
|