Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/env.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_250000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_300000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_350000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_400000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_450000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_500000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.051427158192154154,0.00045752618364959167,-0.051414548116136154,0.0004493076697388483,29.688256334962873,50.10000000001527,0.0,25500.0,-1.0,-1001.64,1000.0,3.021239757537842,250000
|
| 3 |
+
0.0,0.0,-0.16617738047458086,-0.0006269337779439415,-0.1661991678214596,-0.0004966032953380475,33.53594438946779,50.10000000001527,0.0,77500.0,-1.0,-1000.0,1000.0,3.0867704248428343,300000
|
| 4 |
+
0.0,0.0,-0.12508423761347454,-0.0008583071432725175,-0.125121347549559,-0.0007144201096344116,34.37554935025586,50.10000000001527,0.0,129500.0,-1.0,-1000.0,1000.0,3.0898955392837526,350000
|
| 5 |
+
0.0,0.0,-0.17143286480954972,0.0001126044530427905,-0.17142073013235234,0.00031604067549339496,34.17095749860988,50.10000000001527,0.0,181500.0,-1.0,-1000.0,1000.0,3.0830334424972534,400000
|
| 6 |
+
0.0,0.0,-0.17354934890598245,-0.0009947555612753066,-0.17359846032872636,-0.0009344058931977289,34.19288497053175,50.10000000001527,0.0,233500.0,-1.0,-1000.0,1000.0,3.070554690361023,450000
|
| 7 |
+
0.0,0.0,-0.12724299273118245,-0.0002985849684956346,-0.12729047055970852,-0.0008821712142246624,32.74184089836062,50.10000000001527,0.0,285500.0,-1.02,-1019.58,1000.0,3.0756011152267457,500000
|
| 8 |
+
0.0,0.0,-0.12376693507216026,-0.001292126350215634,-0.12382820041982093,-0.0012763645540042456,35.09303559419827,49.25700000001496,0.02,336758.16,-1.0,-992.74,983.14,3.056854453086853,550000
|
| 9 |
+
0.0,0.0,-0.18281089697883585,-0.0021179955493421665,-0.18289239441729782,-0.0017210541851999186,31.62556653878321,50.10000000001527,0.0,388657.0,-1.0,-1000.0,1000.0,3.0830931758880613,600000
|
| 10 |
+
0.0,0.0,-0.12454053819300355,0.002536557222054421,-0.1245543449177281,-0.0013266996678082666,27.404010446288453,50.10000000001527,0.0,440657.0,-1.0,-1000.0,1000.0,3.055699849128723,650000
|
| 11 |
+
0.0,0.0,-0.15029365785256946,-0.0011891924177180786,-0.15029477905143598,-8.172417703297477e-06,31.653730327173918,50.10000000001527,0.0,492657.0,-1.0,-1012.8,1000.0,3.0779986238479613,700000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.051427158192154154,0.00045752618364959167,-0.051414548116136154,0.0004493076697388483,29.688256334962873,50.10000000001527,0.0,25500.0,-1.0,-1001.64,1000.0,3.021239757537842,250000
|
| 3 |
+
0.0,0.0,-0.16617738047458086,-0.0006269337779439415,-0.1661991678214596,-0.0004966032953380475,33.53594438946779,50.10000000001527,0.0,77500.0,-1.0,-1000.0,1000.0,3.0867704248428343,300000
|
| 4 |
+
0.0,0.0,-0.12508423761347454,-0.0008583071432725175,-0.125121347549559,-0.0007144201096344116,34.37554935025586,50.10000000001527,0.0,129500.0,-1.0,-1000.0,1000.0,3.0898955392837526,350000
|
| 5 |
+
0.0,0.0,-0.17143286480954972,0.0001126044530427905,-0.17142073013235234,0.00031604067549339496,34.17095749860988,50.10000000001527,0.0,181500.0,-1.0,-1000.0,1000.0,3.0830334424972534,400000
|
| 6 |
+
0.0,0.0,-0.17354934890598245,-0.0009947555612753066,-0.17359846032872636,-0.0009344058931977289,34.19288497053175,50.10000000001527,0.0,233500.0,-1.0,-1000.0,1000.0,3.070554690361023,450000
|
| 7 |
+
0.0,0.0,-0.12724299273118245,-0.0002985849684956346,-0.12729047055970852,-0.0008821712142246624,32.74184089836062,50.10000000001527,0.0,285500.0,-1.02,-1019.58,1000.0,3.0756011152267457,500000
|
| 8 |
+
0.0,0.0,-0.12376693507216026,-0.001292126350215634,-0.12382820041982093,-0.0012763645540042456,35.09303559419827,49.25700000001496,0.02,336758.16,-1.0,-992.74,983.14,3.056854453086853,550000
|
| 9 |
+
0.0,0.0,-0.18281089697883585,-0.0021179955493421665,-0.18289239441729782,-0.0017210541851999186,31.62556653878321,50.10000000001527,0.0,388657.0,-1.0,-1000.0,1000.0,3.0830931758880613,600000
|
| 10 |
+
0.0,0.0,-0.12454053819300355,0.002536557222054421,-0.1245543449177281,-0.0013266996678082666,27.404010446288453,50.10000000001527,0.0,440657.0,-1.0,-1000.0,1000.0,3.055699849128723,650000
|
| 11 |
+
0.0,0.0,-0.15029365785256946,-0.0011891924177180786,-0.15029477905143598,-8.172417703297477e-06,31.653730327173918,50.10000000001527,0.0,492657.0,-1.0,-1012.8,1000.0,3.0779986238479613,700000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.65579474,289.55646,0.0045382013,-0.008342665,-14.33832,0.20246127,-289.4914,289.75058,4.5027323,22.89533,-130.13101,-290.55835,-303.3519,27.398064,10.83729,-10.434435,345.09967,205000
|
| 3 |
+
0.664169,286.10022,0.005077404,0.007465872,-11.029589,0.2006762,-286.04425,286.30838,6.9924607,14.539914,-161.62901,-286.8273,-302.74905,21.532375,4.4317694,-2.587756,223.65167,210000
|
| 4 |
+
0.65014356,282.78494,0.0045922324,-0.010605943,-14.80954,0.1862624,-282.71695,282.96057,2.5621567,11.698562,-105.90492,-283.828,-303.37958,14.260718,1.5817201,-1.271885,125.26338,215000
|
| 5 |
+
0.6527405,289.38538,0.004253953,-0.002234918,-13.025374,0.20214786,-289.32996,289.5853,3.6697145,13.9999695,-181.95032,-290.4246,-302.90384,17.669683,4.170117,-3.9868605,300.32922,220000
|
| 6 |
+
0.6521496,284.91028,0.00476721,-0.012534021,-15.129215,0.22642553,-284.83813,285.12418,3.4707954,8.972132,-105.557434,-286.44348,-303.46155,12.442927,1.1243138,-1.2778258,131.27873,225000
|
| 7 |
+
0.6774745,285.11755,0.004578785,0.009270864,-10.475257,0.19891806,-285.06958,285.32574,1.981074,10.952258,1.4104205,-285.94345,-303.5594,12.933332,11.269644,-11.912134,251.17723,230000
|
| 8 |
+
0.6683064,289.61642,0.004434156,-0.002770709,-13.124856,0.20394577,-289.55826,289.8176,1.7354946,8.660205,-102.88532,-290.545,-303.5669,10.3956995,0.61288935,-1.0530986,108.83346,235000
|
| 9 |
+
0.67065483,284.8335,0.0048238807,0.0008245961,-12.32906,0.22196347,-284.774,285.05627,2.6832237,5.0731344,-101.586426,-285.46994,-303.2357,7.756358,0.6658835,-0.7510364,87.95654,240000
|
| 10 |
+
0.6799752,285.0667,0.0048001003,0.008968798,-10.631539,0.19436862,-285.01566,285.27005,2.816118,7.1798234,-100.67865,-286.2794,-304.8351,9.995941,1.9656345,-1.4686198,132.84561,245000
|
| 11 |
+
0.67427963,283.4964,0.004301518,0.0049724365,-11.3440275,0.21014085,-283.44757,283.71152,2.1927164,7.9797835,-100.65283,-284.90146,-304.98914,10.1725,2.4183683,-2.300204,180.79214,250000
|
| 12 |
+
0.6721445,284.27582,0.0043845912,0.0012139984,-12.223122,0.17335445,-284.2222,284.45038,2.8059757,5.6941295,-101.29469,-285.25357,-303.27097,8.500105,1.4088492,-1.27432,115.302444,255000
|
| 13 |
+
0.67491555,283.93546,0.004504392,0.0067886985,-10.992871,0.2145448,-283.88593,284.15677,2.3585558,7.2105174,-96.80996,-284.9026,-303.3535,9.569073,0.9426595,-1.155998,114.132065,260000
|
| 14 |
+
0.66698986,284.74426,0.004299285,0.0061543914,-11.068508,0.1986421,-284.69672,284.94907,1.7748127,5.5357604,-101.24925,-286.1546,-304.00345,7.310573,1.4175696,-1.6023366,122.57452,265000
|
| 15 |
+
0.6533178,278.56894,0.0041289357,-0.0036373977,-13.380953,0.18274489,-278.51367,278.74805,2.4954422,6.5480247,-101.46714,-279.1888,-303.23706,9.043467,0.73148173,-0.6174495,95.03786,270000
|
| 16 |
+
0.64304364,276.87506,0.0042328066,-0.014032329,-15.815136,0.21124901,-276.8081,277.07227,3.9503834,11.373797,-36.62857,-278.53122,-303.0312,15.324181,4.506175,-4.3216276,213.15605,275000
|
| 17 |
+
0.6379761,278.4782,0.0045466595,-0.013447519,-15.45767,0.20701672,-278.4079,278.67178,2.6393516,6.780114,-100.992195,-279.65366,-303.3584,9.419466,1.0633577,-1.249515,102.30609,280000
|
| 18 |
+
0.65316474,280.759,0.0043334966,-0.0012549326,-12.789589,0.19111185,-280.7036,280.94885,2.3957145,11.35825,-65.1554,-281.68576,-302.7161,13.753964,1.8307678,-2.2602496,149.82713,285000
|
| 19 |
+
0.6477759,281.45557,0.004254754,-0.00681195,-14.101021,0.18844083,-281.39557,281.6372,2.0734227,7.486287,-101.10373,-282.26382,-302.8448,9.55971,0.8929246,-0.9062083,95.9232,290000
|
| 20 |
+
0.6609227,281.58322,0.0045721047,-0.0025672698,-13.061507,0.19543135,-281.5235,281.7761,2.2105155,5.5261087,-100.58609,-282.38126,-305.15854,7.7366242,0.5588816,-0.9356603,89.81483,295000
|
| 21 |
+
0.64545804,278.20117,0.0043936493,-0.009358101,-14.629915,0.21016628,-278.1369,278.40198,1.7975715,12.169691,-100.557816,-279.4787,-303.0404,13.967262,8.1426935,-8.560642,248.25484,300000
|
| 22 |
+
0.6607737,280.79385,0.0044062543,0.0036858115,-11.663505,0.16577685,-280.74246,280.96332,1.9353437,4.8655596,-100.90819,-281.53513,-302.80743,6.8009033,1.7918084,-0.6960084,83.30025,305000
|
| 23 |
+
0.6544622,281.82892,0.004395671,-0.0033870458,-13.270541,0.19797936,-281.7706,282.0235,2.9935029,6.2299676,-100.836395,-282.62253,-303.2887,9.223471,0.5320097,-0.6040565,101.02286,310000
|
| 24 |
+
0.6381172,278.07736,0.0043686638,-0.009839351,-14.752256,0.16354173,-278.0129,278.23108,2.0093858,6.6985445,-100.503914,-279.08987,-302.57605,8.707931,5.494936,-4.4567947,126.85245,315000
|
| 25 |
+
0.6577967,274.09064,0.0042399317,0.0025847517,-11.890379,0.1796853,-274.04022,274.27292,2.1047876,5.0893145,-100.73793,-274.98294,-302.5347,7.1941023,0.6449779,-0.4764257,76.55284,320000
|
| 26 |
+
0.66436857,281.87537,0.004034549,0.01037106,-9.929438,0.19386712,-281.8353,282.07962,1.9395001,3.2399971,-100.84729,-282.44833,-304.00995,5.1794972,0.6936612,-0.7435257,71.778336,325000
|
| 27 |
+
0.6636998,278.71002,0.0045509567,0.0016485291,-12.137762,0.2083087,-278.6548,278.91998,7.529682,7.2026443,-100.52687,-279.97192,-303.00635,14.7323265,3.6707027,-3.4749079,165.5765,330000
|
| 28 |
+
0.66501874,279.61115,0.0041080033,0.0041535976,-11.488901,0.18378094,-279.5639,279.79907,2.6986125,5.8774967,-100.56667,-280.56522,-303.0589,8.576109,1.5032051,-2.4566588,117.83123,335000
|
| 29 |
+
0.6706224,275.70297,0.0041697472,0.008767486,-10.397358,0.17887864,-275.6596,275.8906,1.6757478,3.821811,-100.54099,-276.5132,-302.5341,5.4975586,2.421283,-2.5389712,98.985886,340000
|
| 30 |
+
0.659397,273.23907,0.0039182752,0.003236074,-11.674108,0.19179307,-273.19333,273.4341,1.9626449,7.847397,-99.36938,-274.18408,-302.68973,9.810041,1.7631744,-1.2399523,95.34065,345000
|
| 31 |
+
0.65508175,279.23907,0.0042924862,0.0028873258,-11.8273535,0.19144037,-279.1883,279.4334,3.4379883,5.818012,-100.22728,-280.01007,-302.5092,9.2560005,2.988078,-2.5548239,121.905304,350000
|
| 32 |
+
0.6548236,277.0666,0.0045097866,-0.0058576097,-13.798866,0.18319842,-277.0044,277.24393,1.931892,9.008718,-100.20274,-277.91348,-302.52832,10.94061,3.7504723,-8.367122,147.12552,355000
|
| 33 |
+
0.66067404,271.7577,0.0043546315,0.00449843,-11.466978,0.21777232,-271.70776,271.97995,1.6121672,6.218572,-100.57529,-272.72427,-303.734,7.8307395,0.63029814,-0.6169585,79.426254,360000
|
| 34 |
+
0.6555983,273.2543,0.0041333465,0.00034013577,-12.417709,0.17447266,-273.203,273.4291,2.5412605,5.6639547,-100.777145,-274.32745,-302.63925,8.205215,0.63894385,-0.619176,94.974144,365000
|
| 35 |
+
0.6583505,271.8911,0.004223158,0.009099644,-10.345299,0.18103914,-271.84744,272.08124,7.1231203,9.866492,-100.82562,-273.09555,-302.89642,16.989613,3.7278235,-4.3215685,167.51567,370000
|
| 36 |
+
0.6618046,273.3683,0.0040657558,0.0032436873,-11.702193,0.20579594,-273.32068,273.57733,2.831558,13.087527,-100.01856,-274.3715,-302.89264,15.9190855,1.0464661,-0.9985296,118.21257,375000
|
| 37 |
+
0.65117306,273.4319,0.003997706,-0.004797067,-13.699955,0.18629846,-273.37708,273.6134,2.2306166,7.071506,-100.13004,-274.01523,-303.80542,9.302122,0.70121604,-0.90795714,109.4255,380000
|
| 38 |
+
0.6613171,269.70813,0.004070695,0.0009861509,-12.257744,0.17668022,-269.6582,269.88577,1.806276,3.6972713,-100.53477,-270.14536,-302.60635,5.503547,0.66996014,-0.6041347,88.96436,385000
|
| 39 |
+
0.65938765,269.88068,0.0039478806,0.005034322,-11.224804,0.17084062,-269.83636,270.05655,1.2486538,5.321135,-100.58226,-270.5263,-302.40717,6.569789,3.0583432,-4.091283,98.4547,390000
|
| 40 |
+
0.65254736,276.94757,0.0042597745,-0.001242265,-12.791627,0.1885623,-276.8931,277.1349,1.7742087,4.6716995,-100.78352,-277.7967,-302.57523,6.445908,0.61743563,-0.81172174,80.42094,395000
|
| 41 |
+
0.66215193,269.5462,0.004328507,0.004238546,-11.520783,0.18212657,-269.49634,269.73257,2.1460347,6.7850266,-100.42453,-270.15903,-303.28168,8.931061,0.7978551,-0.8255046,93.33862,400000
|
| 42 |
+
0.6481337,268.39432,0.0043230494,-0.014586202,-15.874054,0.19444486,-268.32568,268.5742,2.9180174,6.9269943,-100.34379,-268.62708,-302.169,9.845012,1.0980976,-1.3097146,120.709625,405000
|
| 43 |
+
0.65660965,271.3036,0.004315145,0.0041817576,-11.530911,0.16509016,-271.2538,271.47287,1.9242424,4.2927475,-100.65872,-272.40454,-302.56982,6.21699,1.8943851,-1.6540843,79.30311,410000
|
| 44 |
+
0.6575792,268.651,0.0039830413,0.0038543472,-11.5323105,0.21153897,-268.60504,268.8664,1.4430364,3.5887601,-100.56429,-269.38733,-302.44873,5.0317965,0.43507627,-0.5396991,53.805267,415000
|
| 45 |
+
0.64881873,273.3325,0.004119657,-0.0032954554,-13.299934,0.16928574,-273.2777,273.49847,1.3671179,4.3310595,-100.52424,-274.0935,-302.6576,5.6981773,0.78958887,-0.6226814,67.15813,420000
|
| 46 |
+
0.6627836,274.9635,0.0039525027,0.005535048,-11.099609,0.20290804,-274.91962,275.17194,1.9892892,3.9088292,-100.31982,-275.8449,-302.8474,5.8981185,0.55778545,-0.5355591,65.61831,425000
|
| 47 |
+
0.6515824,275.39325,0.0038066406,-0.001994361,-13.023916,0.20070267,-275.34363,275.59198,4.899343,9.360319,-100.45593,-276.46378,-302.49985,14.259663,9.654808,-10.180573,361.35294,430000
|
| 48 |
+
0.6694878,271.9486,0.0040741633,0.006516798,-10.900457,0.19083354,-271.90424,272.14597,1.942921,7.238843,-35.707954,-272.65155,-302.31693,9.181764,4.3971195,-4.399325,155.64487,435000
|
| 49 |
+
0.6491924,274.44818,0.0039203535,-0.0066563487,-14.197895,0.21213028,-274.39252,274.65366,5.8499703,8.798113,-100.426674,-275.48154,-302.32068,14.648083,3.5931406,-2.822448,203.07309,440000
|
| 50 |
+
0.67182773,265.38574,0.0037673742,0.013186762,-8.999747,0.18194309,-265.35184,265.58087,1.6294832,3.9560525,-93.31305,-266.027,-302.91,5.585536,1.3575081,-1.3443812,77.37044,445000
|
| 51 |
+
0.68450546,275.33966,0.003950078,0.010315609,-9.888505,0.16921219,-275.3006,275.5192,1.8512688,3.5915444,-97.500046,-276.60968,-303.74768,5.442813,1.6638749,-1.465851,89.45836,450000
|
| 52 |
+
0.6605621,268.9157,0.004193223,0.00832291,-10.515152,0.16968295,-268.87164,269.09372,1.594735,3.964339,-68.08038,-269.99017,-303.20938,5.559074,0.5405185,-0.49669093,72.22586,455000
|
| 53 |
+
0.65967536,267.9367,0.0041472213,0.004704815,-11.36555,0.21220344,-267.8896,268.1536,1.8184124,4.814575,-43.40813,-268.45685,-302.79535,6.6329875,0.58890206,-0.67420155,80.400604,460000
|
| 54 |
+
0.65345544,269.50146,0.0040455605,-0.0002853987,-12.570546,0.16892779,-269.45062,269.6701,2.07731,4.6542354,-100.49036,-270.71118,-302.72165,6.7315454,0.7326379,-0.5868558,83.48969,465000
|
| 55 |
+
0.6613906,273.58212,0.0041812793,-0.0013706943,-12.827817,0.19034562,-273.52847,273.7711,2.383503,13.67435,-100.33886,-274.23093,-302.45322,16.057854,3.2778685,-3.756027,195.0068,470000
|
| 56 |
+
0.66012937,265.99466,0.0039001193,0.00253126,-11.850979,0.18734273,-265.94846,266.18454,1.7213799,10.950155,-49.094864,-267.36465,-303.26376,12.6715355,2.3214488,-2.8234951,98.849525,475000
|
| 57 |
+
0.66988456,265.97528,0.003916002,0.0033541627,-11.643473,0.18896598,-265.9297,266.1676,1.3890224,4.3349996,-100.21213,-266.73764,-302.32578,5.724022,0.8014107,-0.9624639,71.35576,480000
|
| 58 |
+
0.6448479,271.14966,0.0038117263,-0.008673014,-14.775351,0.15449926,-271.09332,271.2955,1.4305977,3.5433342,-100.35294,-271.92612,-302.50732,4.973932,0.5159749,-0.4070945,60.26667,485000
|
| 59 |
+
0.65566796,265.2486,0.004194531,0.0036791551,-11.622869,0.17263617,-265.19986,265.42493,1.4560636,3.971553,-100.31386,-266.05817,-302.31915,5.4276166,0.4220368,-0.3876178,56.528114,490000
|
| 60 |
+
0.6590246,272.08997,0.0037348724,-0.0017853569,-12.978024,0.18493119,-272.0415,272.2731,1.2230705,3.6346385,-99.45829,-272.8045,-302.26453,4.857709,0.85862505,-0.6247362,69.47423,495000
|
| 61 |
+
0.6598666,266.67838,0.0037820379,0.00053220976,-12.35928,0.17428595,-266.63165,266.85318,3.5787892,4.4970617,-99.58999,-267.3133,-302.2838,8.075851,7.268953,-4.5548363,191.61023,500000
|
| 62 |
+
0.6655656,266.11807,0.0036147207,0.009332429,-9.918216,0.19951257,-266.0822,266.32693,1.2105052,3.8364732,-100.38399,-266.68246,-302.77652,5.0469785,0.6067161,-0.68948054,60.91378,505000
|
| 63 |
+
0.65032464,264.32727,0.0036125614,-0.0069437046,-14.4221,0.20497528,-264.27518,264.5253,1.2378601,3.3283372,-100.37813,-265.04465,-302.22363,4.5661974,0.694142,-0.6641756,63.4105,510000
|
| 64 |
+
0.6626691,260.36795,0.0036996754,0.003733794,-11.490778,0.18402578,-260.32544,260.5557,1.972654,4.0200934,-100.047775,-261.148,-302.62076,5.9927473,0.42836398,-0.42083955,61.119545,515000
|
| 65 |
+
0.6611422,256.05853,0.0035783874,0.0071853315,-10.49202,0.16327862,-256.021,256.22897,1.3779975,3.9969957,-98.58329,-256.73773,-302.4239,5.3749933,0.48635066,-0.7718786,56.598248,520000
|
| 66 |
+
0.64997154,268.24844,0.0034682872,-0.0031411308,-13.405672,0.16358344,-268.20193,268.40887,2.634392,4.889274,-100.21744,-269.4151,-302.38235,7.5236664,11.834171,-8.455617,242.92685,525000
|
| 67 |
+
0.66268593,263.15146,0.0036837354,0.003794826,-11.469843,0.18140325,-263.10922,263.33664,1.2728685,3.6444664,-99.56988,-264.52032,-302.22714,4.917335,0.57021946,-0.5055126,64.87028,530000
|
| 68 |
+
0.67029524,261.11627,0.0038222556,0.007668001,-10.4938545,0.2035051,-261.07617,261.32742,1.748571,4.6442995,-100.34868,-261.9876,-302.5581,6.3928704,0.7295077,-0.5572396,74.029205,535000
|
| 69 |
+
0.6550598,269.67938,0.0036066936,0.002920357,-11.690295,0.17020413,-269.63727,269.8525,1.3458986,3.9939458,-100.35446,-270.56223,-302.24445,5.3398447,0.3943383,-0.61711097,62.328682,540000
|
| 70 |
+
0.6480975,270.0806,0.003891381,-0.007199899,-14.350217,0.20227571,-270.02478,270.27567,1.6247838,4.8976398,-100.260605,-270.763,-302.12042,6.5224237,1.0194336,-1.2691985,81.40845,545000
|
| 71 |
+
0.67252547,261.4847,0.0040117893,0.0047739856,-11.310011,0.15896796,-261.43936,261.64844,1.6600016,3.483772,-100.34266,-262.40424,-302.57083,5.1437736,0.3943763,-0.29599965,55.75776,550000
|
| 72 |
+
0.6544177,264.24475,0.00372352,-0.005500645,-13.97727,0.203001,-264.19275,264.44226,1.69422,4.2778206,-97.612404,-265.49045,-302.46118,5.9720407,0.44014946,-0.5851059,68.775085,555000
|
| 73 |
+
0.6564298,263.62054,0.0038304825,0.0029019911,-11.742395,0.16968808,-263.57556,263.79312,1.1797205,3.0408223,-99.4725,-264.18076,-302.3257,4.220543,0.36236644,-0.47168502,51.130386,560000
|
| 74 |
+
0.6735563,266.12592,0.0038133624,-4.9233724e-05,-12.512911,0.18944304,-266.0782,266.3153,1.6091931,3.4185631,-100.244804,-267.0755,-302.5903,5.027756,0.5921902,-0.49170777,66.08627,565000
|
| 75 |
+
0.6546372,257.14496,0.003701904,-0.002733816,-13.238489,0.17176086,-257.09598,257.31396,1.0766732,3.367859,-100.09601,-257.95163,-302.62973,4.444532,0.7430787,-0.5413269,52.30329,570000
|
| 76 |
+
0.6564057,267.43176,0.0037128998,-0.006192781,-14.16791,0.19004652,-267.37915,267.6156,1.8500038,4.087278,-98.51134,-268.1512,-302.4549,5.9372816,1.4603418,-1.5467713,80.06695,575000
|
| 77 |
+
0.6530026,264.14365,0.0034178686,0.000452684,-12.367554,0.16194779,-264.10138,264.30606,1.2009678,3.148072,-99.98587,-264.64014,-302.265,4.34904,0.3223728,-0.4186517,53.86177,580000
|
| 78 |
+
0.65662736,264.18237,0.0034177464,0.002019398,-11.909143,0.16348654,-264.14166,264.34787,1.1906942,5.313781,-49.103474,-265.08774,-302.0591,6.504475,1.5205104,-1.4223309,73.35552,585000
|
| 79 |
+
0.6789743,258.22156,0.0037346461,0.010580762,-9.666863,0.16885938,-258.1855,258.401,1.4909447,4.1353145,-88.764755,-259.29294,-302.42694,5.6262593,0.48218688,-0.57141054,70.82895,590000
|
| 80 |
+
0.6705664,262.53107,0.0034614257,0.009105316,-9.86949,0.17975229,-262.49695,262.7199,1.4828422,3.6392457,-100.24905,-263.09897,-302.23584,5.122088,0.6842683,-0.4537009,64.50248,595000
|
| 81 |
+
0.6603621,260.622,0.003508171,0.0016708524,-12.0237255,0.17153375,-260.57983,260.79523,1.4442412,3.8219018,-98.79514,-261.4917,-302.27725,5.266143,0.48181164,-0.4054966,65.6174,600000
|
| 82 |
+
0.67132765,262.66064,0.0033689898,0.0061487304,-10.674904,0.18329018,-262.6247,262.85007,3.2014585,4.5694656,-100.04072,-263.4492,-302.48337,7.770924,1.324372,-1.4578564,107.06532,605000
|
| 83 |
+
0.6653919,262.6031,0.0035789625,-0.0036615713,-13.523082,0.18236533,-262.5547,262.7818,1.1173273,3.5915368,-100.20243,-263.84653,-302.40967,4.708864,0.60160255,-0.46928644,64.097595,610000
|
| 84 |
+
0.66199714,254.89487,0.0033183307,-0.001960876,-13.090922,0.16296205,-254.85144,255.05586,1.0904696,3.2705324,-100.246925,-255.62149,-302.2002,4.361002,0.38537014,-0.39957142,53.271942,615000
|
| 85 |
+
0.6559547,262.6046,0.003705523,-0.0063100993,-14.20289,0.16691852,-262.552,262.76523,1.8062708,3.631411,-85.69373,-263.44858,-302.32944,5.437682,0.4142108,-0.63232756,70.499084,620000
|
| 86 |
+
0.6403051,264.3777,0.0034219944,-0.0083333375,-14.935228,0.16446479,-264.32654,264.5338,1.1462058,3.5420232,-99.9432,-265.0379,-303.31894,4.688229,0.3629696,-0.40044463,56.512154,625000
|
| 87 |
+
0.6443225,260.54712,0.0035005982,-0.007714546,-14.703779,0.15493336,-260.49564,260.69434,1.670228,5.2060943,-100.29377,-261.4131,-302.36035,6.8763223,1.4769678,-1.288478,73.24065,630000
|
| 88 |
+
0.66473377,257.4653,0.0037386338,0.0022005604,-11.9114,0.1682497,-257.42075,257.63574,1.2459538,3.6653938,-99.32434,-258.33188,-302.20557,4.9113474,0.4515524,-0.5315856,56.42484,635000
|
| 89 |
+
0.677383,256.56873,0.0037059255,0.0035325638,-11.54678,0.1764624,-256.5259,256.74872,1.6392424,3.7074697,-99.51852,-257.1257,-301.96457,5.346712,0.5999432,-0.80386084,66.908966,640000
|
| 90 |
+
0.6782604,252.14796,0.0035620867,0.007740334,-10.327023,0.16146716,-252.11118,252.31717,1.8375944,3.243838,-100.0679,-252.89061,-301.9646,5.0814323,0.43213046,-0.30662838,53.359886,645000
|
| 91 |
+
0.67856544,257.66272,0.0035322132,0.0030221224,-11.644411,0.18539195,-257.62158,257.85114,0.9761144,4.164628,-100.14021,-258.48032,-302.21658,5.1407423,1.1239525,-0.8592754,64.41332,650000
|
| 92 |
+
0.6648457,259.90747,0.0035434363,0.004225754,-11.307442,0.20611218,-259.8674,260.1178,1.1711562,2.6447399,-100.097694,-260.67493,-302.09143,3.815896,0.41563764,-0.6061593,53.348408,655000
|
| 93 |
+
0.6742601,250.36487,0.0036402664,0.005581764,-10.9666605,0.18257019,-250.32494,250.55302,1.354206,3.7047753,-99.96856,-250.99815,-302.13144,5.0589814,0.59254,-0.5798214,58.587303,660000
|
| 94 |
+
0.66257215,255.16382,0.0035106966,0.00041399445,-12.382076,0.17049968,-255.12035,255.33473,1.442717,3.702147,-100.274635,-255.68999,-302.24182,5.144864,0.5315721,-0.5407169,68.906334,665000
|
| 95 |
+
0.65686077,258.32504,0.00363072,-0.0027788698,-13.265377,0.17819683,-258.27692,258.50046,1.5093999,3.1340368,-100.17191,-259.20184,-302.45807,4.6434364,0.40682003,-0.28348437,49.605568,670000
|
| 96 |
+
0.672638,254.11456,0.0035910006,0.0019255477,-11.963785,0.17801751,-254.0716,254.29451,1.3351728,3.5346467,-100.0951,-254.63147,-302.10077,4.8698196,0.3055289,-0.52399623,50.124268,675000
|
| 97 |
+
0.66197205,262.73126,0.003599603,0.002389201,-11.83626,0.18171662,-262.68866,262.91534,1.559502,5.046367,-34.448433,-263.72058,-302.1835,6.6058693,1.0847968,-1.1173602,74.17804,680000
|
| 98 |
+
0.66086715,261.79553,0.0035769118,-0.001522194,-12.925561,0.16917346,-261.74927,261.96317,1.8537235,4.3863206,-100.240295,-262.8641,-301.8177,6.240044,1.0694969,-0.74358463,81.77374,685000
|
| 99 |
+
0.65530926,254.77545,0.0035827789,-0.0038495664,-13.574464,0.16993,-254.72684,254.94154,1.3848752,4.918664,-100.07644,-255.61133,-302.1856,6.3035393,0.46325743,-0.5640386,68.97348,690000
|
| 100 |
+
0.66802746,254.09021,0.0034564147,-0.00011691625,-12.533826,0.19177204,-254.04688,254.28186,1.3432864,3.3823736,-98.675545,-255.1447,-302.10403,4.72566,0.6081267,-0.60491025,57.878395,695000
|
| 101 |
+
0.6498374,260.83356,0.0033863212,-0.005395251,-14.093248,0.19051215,-260.78583,261.01868,1.1976585,3.299151,-100.27798,-261.94684,-302.12622,4.4968095,0.488734,-0.51911247,51.194126,700000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.65579474,289.55646,0.0045382013,-0.008342665,-14.33832,0.20246127,-289.4914,289.75058,4.5027323,22.89533,-130.13101,-290.55835,-303.3519,27.398064,10.83729,-10.434435,345.09967,205000
|
| 3 |
+
0.664169,286.10022,0.005077404,0.007465872,-11.029589,0.2006762,-286.04425,286.30838,6.9924607,14.539914,-161.62901,-286.8273,-302.74905,21.532375,4.4317694,-2.587756,223.65167,210000
|
| 4 |
+
0.65014356,282.78494,0.0045922324,-0.010605943,-14.80954,0.1862624,-282.71695,282.96057,2.5621567,11.698562,-105.90492,-283.828,-303.37958,14.260718,1.5817201,-1.271885,125.26338,215000
|
| 5 |
+
0.6527405,289.38538,0.004253953,-0.002234918,-13.025374,0.20214786,-289.32996,289.5853,3.6697145,13.9999695,-181.95032,-290.4246,-302.90384,17.669683,4.170117,-3.9868605,300.32922,220000
|
| 6 |
+
0.6521496,284.91028,0.00476721,-0.012534021,-15.129215,0.22642553,-284.83813,285.12418,3.4707954,8.972132,-105.557434,-286.44348,-303.46155,12.442927,1.1243138,-1.2778258,131.27873,225000
|
| 7 |
+
0.6774745,285.11755,0.004578785,0.009270864,-10.475257,0.19891806,-285.06958,285.32574,1.981074,10.952258,1.4104205,-285.94345,-303.5594,12.933332,11.269644,-11.912134,251.17723,230000
|
| 8 |
+
0.6683064,289.61642,0.004434156,-0.002770709,-13.124856,0.20394577,-289.55826,289.8176,1.7354946,8.660205,-102.88532,-290.545,-303.5669,10.3956995,0.61288935,-1.0530986,108.83346,235000
|
| 9 |
+
0.67065483,284.8335,0.0048238807,0.0008245961,-12.32906,0.22196347,-284.774,285.05627,2.6832237,5.0731344,-101.586426,-285.46994,-303.2357,7.756358,0.6658835,-0.7510364,87.95654,240000
|
| 10 |
+
0.6799752,285.0667,0.0048001003,0.008968798,-10.631539,0.19436862,-285.01566,285.27005,2.816118,7.1798234,-100.67865,-286.2794,-304.8351,9.995941,1.9656345,-1.4686198,132.84561,245000
|
| 11 |
+
0.67427963,283.4964,0.004301518,0.0049724365,-11.3440275,0.21014085,-283.44757,283.71152,2.1927164,7.9797835,-100.65283,-284.90146,-304.98914,10.1725,2.4183683,-2.300204,180.79214,250000
|
| 12 |
+
0.6721445,284.27582,0.0043845912,0.0012139984,-12.223122,0.17335445,-284.2222,284.45038,2.8059757,5.6941295,-101.29469,-285.25357,-303.27097,8.500105,1.4088492,-1.27432,115.302444,255000
|
| 13 |
+
0.67491555,283.93546,0.004504392,0.0067886985,-10.992871,0.2145448,-283.88593,284.15677,2.3585558,7.2105174,-96.80996,-284.9026,-303.3535,9.569073,0.9426595,-1.155998,114.132065,260000
|
| 14 |
+
0.66698986,284.74426,0.004299285,0.0061543914,-11.068508,0.1986421,-284.69672,284.94907,1.7748127,5.5357604,-101.24925,-286.1546,-304.00345,7.310573,1.4175696,-1.6023366,122.57452,265000
|
| 15 |
+
0.6533178,278.56894,0.0041289357,-0.0036373977,-13.380953,0.18274489,-278.51367,278.74805,2.4954422,6.5480247,-101.46714,-279.1888,-303.23706,9.043467,0.73148173,-0.6174495,95.03786,270000
|
| 16 |
+
0.64304364,276.87506,0.0042328066,-0.014032329,-15.815136,0.21124901,-276.8081,277.07227,3.9503834,11.373797,-36.62857,-278.53122,-303.0312,15.324181,4.506175,-4.3216276,213.15605,275000
|
| 17 |
+
0.6379761,278.4782,0.0045466595,-0.013447519,-15.45767,0.20701672,-278.4079,278.67178,2.6393516,6.780114,-100.992195,-279.65366,-303.3584,9.419466,1.0633577,-1.249515,102.30609,280000
|
| 18 |
+
0.65316474,280.759,0.0043334966,-0.0012549326,-12.789589,0.19111185,-280.7036,280.94885,2.3957145,11.35825,-65.1554,-281.68576,-302.7161,13.753964,1.8307678,-2.2602496,149.82713,285000
|
| 19 |
+
0.6477759,281.45557,0.004254754,-0.00681195,-14.101021,0.18844083,-281.39557,281.6372,2.0734227,7.486287,-101.10373,-282.26382,-302.8448,9.55971,0.8929246,-0.9062083,95.9232,290000
|
| 20 |
+
0.6609227,281.58322,0.0045721047,-0.0025672698,-13.061507,0.19543135,-281.5235,281.7761,2.2105155,5.5261087,-100.58609,-282.38126,-305.15854,7.7366242,0.5588816,-0.9356603,89.81483,295000
|
| 21 |
+
0.64545804,278.20117,0.0043936493,-0.009358101,-14.629915,0.21016628,-278.1369,278.40198,1.7975715,12.169691,-100.557816,-279.4787,-303.0404,13.967262,8.1426935,-8.560642,248.25484,300000
|
| 22 |
+
0.6607737,280.79385,0.0044062543,0.0036858115,-11.663505,0.16577685,-280.74246,280.96332,1.9353437,4.8655596,-100.90819,-281.53513,-302.80743,6.8009033,1.7918084,-0.6960084,83.30025,305000
|
| 23 |
+
0.6544622,281.82892,0.004395671,-0.0033870458,-13.270541,0.19797936,-281.7706,282.0235,2.9935029,6.2299676,-100.836395,-282.62253,-303.2887,9.223471,0.5320097,-0.6040565,101.02286,310000
|
| 24 |
+
0.6381172,278.07736,0.0043686638,-0.009839351,-14.752256,0.16354173,-278.0129,278.23108,2.0093858,6.6985445,-100.503914,-279.08987,-302.57605,8.707931,5.494936,-4.4567947,126.85245,315000
|
| 25 |
+
0.6577967,274.09064,0.0042399317,0.0025847517,-11.890379,0.1796853,-274.04022,274.27292,2.1047876,5.0893145,-100.73793,-274.98294,-302.5347,7.1941023,0.6449779,-0.4764257,76.55284,320000
|
| 26 |
+
0.66436857,281.87537,0.004034549,0.01037106,-9.929438,0.19386712,-281.8353,282.07962,1.9395001,3.2399971,-100.84729,-282.44833,-304.00995,5.1794972,0.6936612,-0.7435257,71.778336,325000
|
| 27 |
+
0.6636998,278.71002,0.0045509567,0.0016485291,-12.137762,0.2083087,-278.6548,278.91998,7.529682,7.2026443,-100.52687,-279.97192,-303.00635,14.7323265,3.6707027,-3.4749079,165.5765,330000
|
| 28 |
+
0.66501874,279.61115,0.0041080033,0.0041535976,-11.488901,0.18378094,-279.5639,279.79907,2.6986125,5.8774967,-100.56667,-280.56522,-303.0589,8.576109,1.5032051,-2.4566588,117.83123,335000
|
| 29 |
+
0.6706224,275.70297,0.0041697472,0.008767486,-10.397358,0.17887864,-275.6596,275.8906,1.6757478,3.821811,-100.54099,-276.5132,-302.5341,5.4975586,2.421283,-2.5389712,98.985886,340000
|
| 30 |
+
0.659397,273.23907,0.0039182752,0.003236074,-11.674108,0.19179307,-273.19333,273.4341,1.9626449,7.847397,-99.36938,-274.18408,-302.68973,9.810041,1.7631744,-1.2399523,95.34065,345000
|
| 31 |
+
0.65508175,279.23907,0.0042924862,0.0028873258,-11.8273535,0.19144037,-279.1883,279.4334,3.4379883,5.818012,-100.22728,-280.01007,-302.5092,9.2560005,2.988078,-2.5548239,121.905304,350000
|
| 32 |
+
0.6548236,277.0666,0.0045097866,-0.0058576097,-13.798866,0.18319842,-277.0044,277.24393,1.931892,9.008718,-100.20274,-277.91348,-302.52832,10.94061,3.7504723,-8.367122,147.12552,355000
|
| 33 |
+
0.66067404,271.7577,0.0043546315,0.00449843,-11.466978,0.21777232,-271.70776,271.97995,1.6121672,6.218572,-100.57529,-272.72427,-303.734,7.8307395,0.63029814,-0.6169585,79.426254,360000
|
| 34 |
+
0.6555983,273.2543,0.0041333465,0.00034013577,-12.417709,0.17447266,-273.203,273.4291,2.5412605,5.6639547,-100.777145,-274.32745,-302.63925,8.205215,0.63894385,-0.619176,94.974144,365000
|
| 35 |
+
0.6583505,271.8911,0.004223158,0.009099644,-10.345299,0.18103914,-271.84744,272.08124,7.1231203,9.866492,-100.82562,-273.09555,-302.89642,16.989613,3.7278235,-4.3215685,167.51567,370000
|
| 36 |
+
0.6618046,273.3683,0.0040657558,0.0032436873,-11.702193,0.20579594,-273.32068,273.57733,2.831558,13.087527,-100.01856,-274.3715,-302.89264,15.9190855,1.0464661,-0.9985296,118.21257,375000
|
| 37 |
+
0.65117306,273.4319,0.003997706,-0.004797067,-13.699955,0.18629846,-273.37708,273.6134,2.2306166,7.071506,-100.13004,-274.01523,-303.80542,9.302122,0.70121604,-0.90795714,109.4255,380000
|
| 38 |
+
0.6613171,269.70813,0.004070695,0.0009861509,-12.257744,0.17668022,-269.6582,269.88577,1.806276,3.6972713,-100.53477,-270.14536,-302.60635,5.503547,0.66996014,-0.6041347,88.96436,385000
|
| 39 |
+
0.65938765,269.88068,0.0039478806,0.005034322,-11.224804,0.17084062,-269.83636,270.05655,1.2486538,5.321135,-100.58226,-270.5263,-302.40717,6.569789,3.0583432,-4.091283,98.4547,390000
|
| 40 |
+
0.65254736,276.94757,0.0042597745,-0.001242265,-12.791627,0.1885623,-276.8931,277.1349,1.7742087,4.6716995,-100.78352,-277.7967,-302.57523,6.445908,0.61743563,-0.81172174,80.42094,395000
|
| 41 |
+
0.66215193,269.5462,0.004328507,0.004238546,-11.520783,0.18212657,-269.49634,269.73257,2.1460347,6.7850266,-100.42453,-270.15903,-303.28168,8.931061,0.7978551,-0.8255046,93.33862,400000
|
| 42 |
+
0.6481337,268.39432,0.0043230494,-0.014586202,-15.874054,0.19444486,-268.32568,268.5742,2.9180174,6.9269943,-100.34379,-268.62708,-302.169,9.845012,1.0980976,-1.3097146,120.709625,405000
|
| 43 |
+
0.65660965,271.3036,0.004315145,0.0041817576,-11.530911,0.16509016,-271.2538,271.47287,1.9242424,4.2927475,-100.65872,-272.40454,-302.56982,6.21699,1.8943851,-1.6540843,79.30311,410000
|
| 44 |
+
0.6575792,268.651,0.0039830413,0.0038543472,-11.5323105,0.21153897,-268.60504,268.8664,1.4430364,3.5887601,-100.56429,-269.38733,-302.44873,5.0317965,0.43507627,-0.5396991,53.805267,415000
|
| 45 |
+
0.64881873,273.3325,0.004119657,-0.0032954554,-13.299934,0.16928574,-273.2777,273.49847,1.3671179,4.3310595,-100.52424,-274.0935,-302.6576,5.6981773,0.78958887,-0.6226814,67.15813,420000
|
| 46 |
+
0.6627836,274.9635,0.0039525027,0.005535048,-11.099609,0.20290804,-274.91962,275.17194,1.9892892,3.9088292,-100.31982,-275.8449,-302.8474,5.8981185,0.55778545,-0.5355591,65.61831,425000
|
| 47 |
+
0.6515824,275.39325,0.0038066406,-0.001994361,-13.023916,0.20070267,-275.34363,275.59198,4.899343,9.360319,-100.45593,-276.46378,-302.49985,14.259663,9.654808,-10.180573,361.35294,430000
|
| 48 |
+
0.6694878,271.9486,0.0040741633,0.006516798,-10.900457,0.19083354,-271.90424,272.14597,1.942921,7.238843,-35.707954,-272.65155,-302.31693,9.181764,4.3971195,-4.399325,155.64487,435000
|
| 49 |
+
0.6491924,274.44818,0.0039203535,-0.0066563487,-14.197895,0.21213028,-274.39252,274.65366,5.8499703,8.798113,-100.426674,-275.48154,-302.32068,14.648083,3.5931406,-2.822448,203.07309,440000
|
| 50 |
+
0.67182773,265.38574,0.0037673742,0.013186762,-8.999747,0.18194309,-265.35184,265.58087,1.6294832,3.9560525,-93.31305,-266.027,-302.91,5.585536,1.3575081,-1.3443812,77.37044,445000
|
| 51 |
+
0.68450546,275.33966,0.003950078,0.010315609,-9.888505,0.16921219,-275.3006,275.5192,1.8512688,3.5915444,-97.500046,-276.60968,-303.74768,5.442813,1.6638749,-1.465851,89.45836,450000
|
| 52 |
+
0.6605621,268.9157,0.004193223,0.00832291,-10.515152,0.16968295,-268.87164,269.09372,1.594735,3.964339,-68.08038,-269.99017,-303.20938,5.559074,0.5405185,-0.49669093,72.22586,455000
|
| 53 |
+
0.65967536,267.9367,0.0041472213,0.004704815,-11.36555,0.21220344,-267.8896,268.1536,1.8184124,4.814575,-43.40813,-268.45685,-302.79535,6.6329875,0.58890206,-0.67420155,80.400604,460000
|
| 54 |
+
0.65345544,269.50146,0.0040455605,-0.0002853987,-12.570546,0.16892779,-269.45062,269.6701,2.07731,4.6542354,-100.49036,-270.71118,-302.72165,6.7315454,0.7326379,-0.5868558,83.48969,465000
|
| 55 |
+
0.6613906,273.58212,0.0041812793,-0.0013706943,-12.827817,0.19034562,-273.52847,273.7711,2.383503,13.67435,-100.33886,-274.23093,-302.45322,16.057854,3.2778685,-3.756027,195.0068,470000
|
| 56 |
+
0.66012937,265.99466,0.0039001193,0.00253126,-11.850979,0.18734273,-265.94846,266.18454,1.7213799,10.950155,-49.094864,-267.36465,-303.26376,12.6715355,2.3214488,-2.8234951,98.849525,475000
|
| 57 |
+
0.66988456,265.97528,0.003916002,0.0033541627,-11.643473,0.18896598,-265.9297,266.1676,1.3890224,4.3349996,-100.21213,-266.73764,-302.32578,5.724022,0.8014107,-0.9624639,71.35576,480000
|
| 58 |
+
0.6448479,271.14966,0.0038117263,-0.008673014,-14.775351,0.15449926,-271.09332,271.2955,1.4305977,3.5433342,-100.35294,-271.92612,-302.50732,4.973932,0.5159749,-0.4070945,60.26667,485000
|
| 59 |
+
0.65566796,265.2486,0.004194531,0.0036791551,-11.622869,0.17263617,-265.19986,265.42493,1.4560636,3.971553,-100.31386,-266.05817,-302.31915,5.4276166,0.4220368,-0.3876178,56.528114,490000
|
| 60 |
+
0.6590246,272.08997,0.0037348724,-0.0017853569,-12.978024,0.18493119,-272.0415,272.2731,1.2230705,3.6346385,-99.45829,-272.8045,-302.26453,4.857709,0.85862505,-0.6247362,69.47423,495000
|
| 61 |
+
0.6598666,266.67838,0.0037820379,0.00053220976,-12.35928,0.17428595,-266.63165,266.85318,3.5787892,4.4970617,-99.58999,-267.3133,-302.2838,8.075851,7.268953,-4.5548363,191.61023,500000
|
| 62 |
+
0.6655656,266.11807,0.0036147207,0.009332429,-9.918216,0.19951257,-266.0822,266.32693,1.2105052,3.8364732,-100.38399,-266.68246,-302.77652,5.0469785,0.6067161,-0.68948054,60.91378,505000
|
| 63 |
+
0.65032464,264.32727,0.0036125614,-0.0069437046,-14.4221,0.20497528,-264.27518,264.5253,1.2378601,3.3283372,-100.37813,-265.04465,-302.22363,4.5661974,0.694142,-0.6641756,63.4105,510000
|
| 64 |
+
0.6626691,260.36795,0.0036996754,0.003733794,-11.490778,0.18402578,-260.32544,260.5557,1.972654,4.0200934,-100.047775,-261.148,-302.62076,5.9927473,0.42836398,-0.42083955,61.119545,515000
|
| 65 |
+
0.6611422,256.05853,0.0035783874,0.0071853315,-10.49202,0.16327862,-256.021,256.22897,1.3779975,3.9969957,-98.58329,-256.73773,-302.4239,5.3749933,0.48635066,-0.7718786,56.598248,520000
|
| 66 |
+
0.64997154,268.24844,0.0034682872,-0.0031411308,-13.405672,0.16358344,-268.20193,268.40887,2.634392,4.889274,-100.21744,-269.4151,-302.38235,7.5236664,11.834171,-8.455617,242.92685,525000
|
| 67 |
+
0.66268593,263.15146,0.0036837354,0.003794826,-11.469843,0.18140325,-263.10922,263.33664,1.2728685,3.6444664,-99.56988,-264.52032,-302.22714,4.917335,0.57021946,-0.5055126,64.87028,530000
|
| 68 |
+
0.67029524,261.11627,0.0038222556,0.007668001,-10.4938545,0.2035051,-261.07617,261.32742,1.748571,4.6442995,-100.34868,-261.9876,-302.5581,6.3928704,0.7295077,-0.5572396,74.029205,535000
|
| 69 |
+
0.6550598,269.67938,0.0036066936,0.002920357,-11.690295,0.17020413,-269.63727,269.8525,1.3458986,3.9939458,-100.35446,-270.56223,-302.24445,5.3398447,0.3943383,-0.61711097,62.328682,540000
|
| 70 |
+
0.6480975,270.0806,0.003891381,-0.007199899,-14.350217,0.20227571,-270.02478,270.27567,1.6247838,4.8976398,-100.260605,-270.763,-302.12042,6.5224237,1.0194336,-1.2691985,81.40845,545000
|
| 71 |
+
0.67252547,261.4847,0.0040117893,0.0047739856,-11.310011,0.15896796,-261.43936,261.64844,1.6600016,3.483772,-100.34266,-262.40424,-302.57083,5.1437736,0.3943763,-0.29599965,55.75776,550000
|
| 72 |
+
0.6544177,264.24475,0.00372352,-0.005500645,-13.97727,0.203001,-264.19275,264.44226,1.69422,4.2778206,-97.612404,-265.49045,-302.46118,5.9720407,0.44014946,-0.5851059,68.775085,555000
|
| 73 |
+
0.6564298,263.62054,0.0038304825,0.0029019911,-11.742395,0.16968808,-263.57556,263.79312,1.1797205,3.0408223,-99.4725,-264.18076,-302.3257,4.220543,0.36236644,-0.47168502,51.130386,560000
|
| 74 |
+
0.6735563,266.12592,0.0038133624,-4.9233724e-05,-12.512911,0.18944304,-266.0782,266.3153,1.6091931,3.4185631,-100.244804,-267.0755,-302.5903,5.027756,0.5921902,-0.49170777,66.08627,565000
|
| 75 |
+
0.6546372,257.14496,0.003701904,-0.002733816,-13.238489,0.17176086,-257.09598,257.31396,1.0766732,3.367859,-100.09601,-257.95163,-302.62973,4.444532,0.7430787,-0.5413269,52.30329,570000
|
| 76 |
+
0.6564057,267.43176,0.0037128998,-0.006192781,-14.16791,0.19004652,-267.37915,267.6156,1.8500038,4.087278,-98.51134,-268.1512,-302.4549,5.9372816,1.4603418,-1.5467713,80.06695,575000
|
| 77 |
+
0.6530026,264.14365,0.0034178686,0.000452684,-12.367554,0.16194779,-264.10138,264.30606,1.2009678,3.148072,-99.98587,-264.64014,-302.265,4.34904,0.3223728,-0.4186517,53.86177,580000
|
| 78 |
+
0.65662736,264.18237,0.0034177464,0.002019398,-11.909143,0.16348654,-264.14166,264.34787,1.1906942,5.313781,-49.103474,-265.08774,-302.0591,6.504475,1.5205104,-1.4223309,73.35552,585000
|
| 79 |
+
0.6789743,258.22156,0.0037346461,0.010580762,-9.666863,0.16885938,-258.1855,258.401,1.4909447,4.1353145,-88.764755,-259.29294,-302.42694,5.6262593,0.48218688,-0.57141054,70.82895,590000
|
| 80 |
+
0.6705664,262.53107,0.0034614257,0.009105316,-9.86949,0.17975229,-262.49695,262.7199,1.4828422,3.6392457,-100.24905,-263.09897,-302.23584,5.122088,0.6842683,-0.4537009,64.50248,595000
|
| 81 |
+
0.6603621,260.622,0.003508171,0.0016708524,-12.0237255,0.17153375,-260.57983,260.79523,1.4442412,3.8219018,-98.79514,-261.4917,-302.27725,5.266143,0.48181164,-0.4054966,65.6174,600000
|
| 82 |
+
0.67132765,262.66064,0.0033689898,0.0061487304,-10.674904,0.18329018,-262.6247,262.85007,3.2014585,4.5694656,-100.04072,-263.4492,-302.48337,7.770924,1.324372,-1.4578564,107.06532,605000
|
| 83 |
+
0.6653919,262.6031,0.0035789625,-0.0036615713,-13.523082,0.18236533,-262.5547,262.7818,1.1173273,3.5915368,-100.20243,-263.84653,-302.40967,4.708864,0.60160255,-0.46928644,64.097595,610000
|
| 84 |
+
0.66199714,254.89487,0.0033183307,-0.001960876,-13.090922,0.16296205,-254.85144,255.05586,1.0904696,3.2705324,-100.246925,-255.62149,-302.2002,4.361002,0.38537014,-0.39957142,53.271942,615000
|
| 85 |
+
0.6559547,262.6046,0.003705523,-0.0063100993,-14.20289,0.16691852,-262.552,262.76523,1.8062708,3.631411,-85.69373,-263.44858,-302.32944,5.437682,0.4142108,-0.63232756,70.499084,620000
|
| 86 |
+
0.6403051,264.3777,0.0034219944,-0.0083333375,-14.935228,0.16446479,-264.32654,264.5338,1.1462058,3.5420232,-99.9432,-265.0379,-303.31894,4.688229,0.3629696,-0.40044463,56.512154,625000
|
| 87 |
+
0.6443225,260.54712,0.0035005982,-0.007714546,-14.703779,0.15493336,-260.49564,260.69434,1.670228,5.2060943,-100.29377,-261.4131,-302.36035,6.8763223,1.4769678,-1.288478,73.24065,630000
|
| 88 |
+
0.66473377,257.4653,0.0037386338,0.0022005604,-11.9114,0.1682497,-257.42075,257.63574,1.2459538,3.6653938,-99.32434,-258.33188,-302.20557,4.9113474,0.4515524,-0.5315856,56.42484,635000
|
| 89 |
+
0.677383,256.56873,0.0037059255,0.0035325638,-11.54678,0.1764624,-256.5259,256.74872,1.6392424,3.7074697,-99.51852,-257.1257,-301.96457,5.346712,0.5999432,-0.80386084,66.908966,640000
|
| 90 |
+
0.6782604,252.14796,0.0035620867,0.007740334,-10.327023,0.16146716,-252.11118,252.31717,1.8375944,3.243838,-100.0679,-252.89061,-301.9646,5.0814323,0.43213046,-0.30662838,53.359886,645000
|
| 91 |
+
0.67856544,257.66272,0.0035322132,0.0030221224,-11.644411,0.18539195,-257.62158,257.85114,0.9761144,4.164628,-100.14021,-258.48032,-302.21658,5.1407423,1.1239525,-0.8592754,64.41332,650000
|
| 92 |
+
0.6648457,259.90747,0.0035434363,0.004225754,-11.307442,0.20611218,-259.8674,260.1178,1.1711562,2.6447399,-100.097694,-260.67493,-302.09143,3.815896,0.41563764,-0.6061593,53.348408,655000
|
| 93 |
+
0.6742601,250.36487,0.0036402664,0.005581764,-10.9666605,0.18257019,-250.32494,250.55302,1.354206,3.7047753,-99.96856,-250.99815,-302.13144,5.0589814,0.59254,-0.5798214,58.587303,660000
|
| 94 |
+
0.66257215,255.16382,0.0035106966,0.00041399445,-12.382076,0.17049968,-255.12035,255.33473,1.442717,3.702147,-100.274635,-255.68999,-302.24182,5.144864,0.5315721,-0.5407169,68.906334,665000
|
| 95 |
+
0.65686077,258.32504,0.00363072,-0.0027788698,-13.265377,0.17819683,-258.27692,258.50046,1.5093999,3.1340368,-100.17191,-259.20184,-302.45807,4.6434364,0.40682003,-0.28348437,49.605568,670000
|
| 96 |
+
0.672638,254.11456,0.0035910006,0.0019255477,-11.963785,0.17801751,-254.0716,254.29451,1.3351728,3.5346467,-100.0951,-254.63147,-302.10077,4.8698196,0.3055289,-0.52399623,50.124268,675000
|
| 97 |
+
0.66197205,262.73126,0.003599603,0.002389201,-11.83626,0.18171662,-262.68866,262.91534,1.559502,5.046367,-34.448433,-263.72058,-302.1835,6.6058693,1.0847968,-1.1173602,74.17804,680000
|
| 98 |
+
0.66086715,261.79553,0.0035769118,-0.001522194,-12.925561,0.16917346,-261.74927,261.96317,1.8537235,4.3863206,-100.240295,-262.8641,-301.8177,6.240044,1.0694969,-0.74358463,81.77374,685000
|
| 99 |
+
0.65530926,254.77545,0.0035827789,-0.0038495664,-13.574464,0.16993,-254.72684,254.94154,1.3848752,4.918664,-100.07644,-255.61133,-302.1856,6.3035393,0.46325743,-0.5640386,68.97348,690000
|
| 100 |
+
0.66802746,254.09021,0.0034564147,-0.00011691625,-12.533826,0.19177204,-254.04688,254.28186,1.3432864,3.3823736,-98.675545,-255.1447,-302.10403,4.72566,0.6081267,-0.60491025,57.878395,695000
|
| 101 |
+
0.6498374,260.83356,0.0033863212,-0.005395251,-14.093248,0.19051215,-260.78583,261.01868,1.1976585,3.299151,-100.27798,-261.94684,-302.12622,4.4968095,0.488734,-0.51911247,51.194126,700000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c2aec45c7c301b9a2bdf11ec559cfebf48cedf287c9ae6b12b8597e5f2ad8f1
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a40e6c8a4bb0b7427f7968ab547b67d9feaab5a9cd29fb6e4c757d097dc1b594
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d78e415a6f7c66aabd8a30422a3882e10fd45bfbe68d0f15176d922289d369e6
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0cb8511b82e41d73af38f1893b3c6980ee5713ec37df10dc0644b9f24997ac0
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c6daf1172c4b765a9a5af5781731879401220e16f41c94498c87c6570c0f926
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f337ee94a50c06ce22b18941d7efc93fb288f4a35739136e3a7b341ae0debea
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fba7bc5c55473fbfd124efb9061bc2e53077a925b56245a9c951c0bf536d6d23
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9dd4e46b2ef9be1f558e50ab56801450247f6a7cfd6e5c1419bed6f310be260
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:611ccc2e54424212c9d8a237be821c7f60c35fb64c66ffd32cafd4db988b0d21
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df6aa289cf437d3bd2af6a739028e3281e588cbe841664140f1d6a4131c3ab68
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_175117/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/h8ns4yxp
|