Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/env.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.04223142458894218,0.002500016042863143,-0.042089526665175965,0.0023628626618691336,29.87823914677283,50.10000000001527,0.0,25500.0,-1.0,-1001.06,1000.0,3.239729790687561,550000
|
| 3 |
+
0.0,0.0,-0.02522695395100609,0.003220996565529655,-0.025067098001616148,0.003240421114854276,33.65246930699094,49.264000000014946,0.02,77048.56,-0.98,-983.26,983.28,3.1660610961914064,600000
|
| 4 |
+
0.0,0.0,-0.03936071479753159,-0.00018814818365287978,-0.03936553849021311,-0.00014065258935062788,35.56853231469027,50.10000000001527,0.0,128664.0,-1.0,-1000.0,1000.0,3.261902241706848,650000
|
| 5 |
+
0.0,0.0,-0.015566920148364756,0.0010189720537616095,-0.015516501247176122,0.001024963182845281,35.5032315216506,48.27800000001466,0.04,179562.48,-0.96,-963.52,963.56,3.1778956031799317,700000
|
| 6 |
+
0.0,0.0,-0.04614836714741864,-0.0011911388459023636,-0.04617677781345347,-0.0005409144082556284,34.304646735546086,50.10000000001527,0.0,230842.0,-1.0,-1000.0,1000.0,3.23541645526886,750000
|
| 7 |
+
0.0,0.0,-0.04347839063243155,-0.0002057771523071996,-0.043484641564038466,-0.0001596018013440784,35.5411006896409,50.10000000001527,0.0,282842.0,-1.0,-1000.0,1000.0,3.302938446998596,800000
|
| 8 |
+
0.0,0.0,-0.036326811190816835,-0.0028346786052763696,-0.0364665503016561,-0.0021898923648368367,34.41113390117904,50.10000000001527,0.0,334842.0,-1.0,-1000.0,1000.0,3.261806273460388,850000
|
| 9 |
+
0.0,0.0,-0.05403774543819705,-0.000258907891743083,-0.05405080629622026,-0.0002386881045386834,35.52695011287609,50.10000000001527,0.0,386842.0,-1.0,-1000.0,1000.0,3.2821730518341066,900000
|
| 10 |
+
0.0,0.0,-0.036534576027061394,0.0001405185798246079,-0.03652740181977289,0.0001516398861080911,35.56374126880635,50.10000000001527,0.0,438842.0,-1.0,-1000.0,1000.0,3.269608874320984,950000
|
| 11 |
+
0.0,0.0,-0.05183702177254829,0.0002772522384652211,-0.05181999452645014,0.000336069876742391,35.504469201573876,50.10000000001527,0.0,490842.0,-1.0,-1000.0,1000.0,3.304591245651245,1000000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.04223142458894218,0.002500016042863143,-0.042089526665175965,0.0023628626618691336,29.87823914677283,50.10000000001527,0.0,25500.0,-1.0,-1001.06,1000.0,3.239729790687561,550000
|
| 3 |
+
0.0,0.0,-0.02522695395100609,0.003220996565529655,-0.025067098001616148,0.003240421114854276,33.65246930699094,49.264000000014946,0.02,77048.56,-0.98,-983.26,983.28,3.1660610961914064,600000
|
| 4 |
+
0.0,0.0,-0.03936071479753159,-0.00018814818365287978,-0.03936553849021311,-0.00014065258935062788,35.56853231469027,50.10000000001527,0.0,128664.0,-1.0,-1000.0,1000.0,3.261902241706848,650000
|
| 5 |
+
0.0,0.0,-0.015566920148364756,0.0010189720537616095,-0.015516501247176122,0.001024963182845281,35.5032315216506,48.27800000001466,0.04,179562.48,-0.96,-963.52,963.56,3.1778956031799317,700000
|
| 6 |
+
0.0,0.0,-0.04614836714741864,-0.0011911388459023636,-0.04617677781345347,-0.0005409144082556284,34.304646735546086,50.10000000001527,0.0,230842.0,-1.0,-1000.0,1000.0,3.23541645526886,750000
|
| 7 |
+
0.0,0.0,-0.04347839063243155,-0.0002057771523071996,-0.043484641564038466,-0.0001596018013440784,35.5411006896409,50.10000000001527,0.0,282842.0,-1.0,-1000.0,1000.0,3.302938446998596,800000
|
| 8 |
+
0.0,0.0,-0.036326811190816835,-0.0028346786052763696,-0.0364665503016561,-0.0021898923648368367,34.41113390117904,50.10000000001527,0.0,334842.0,-1.0,-1000.0,1000.0,3.261806273460388,850000
|
| 9 |
+
0.0,0.0,-0.05403774543819705,-0.000258907891743083,-0.05405080629622026,-0.0002386881045386834,35.52695011287609,50.10000000001527,0.0,386842.0,-1.0,-1000.0,1000.0,3.2821730518341066,900000
|
| 10 |
+
0.0,0.0,-0.036534576027061394,0.0001405185798246079,-0.03652740181977289,0.0001516398861080911,35.56374126880635,50.10000000001527,0.0,438842.0,-1.0,-1000.0,1000.0,3.269608874320984,950000
|
| 11 |
+
0.0,0.0,-0.05183702177254829,0.0002772522384652211,-0.05181999452645014,0.000336069876742391,35.504469201573876,50.10000000001527,0.0,490842.0,-1.0,-1000.0,1000.0,3.304591245651245,1000000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.6579108,285.24158,0.004269041,-0.0044148173,-13.534147,0.19352192,-285.18384,285.43066,2.305907,12.363885,-108.428825,-286.3291,-302.3941,14.669792,7.704104,-7.999422,182.68709,505000
|
| 3 |
+
0.6482419,282.412,0.004252499,-0.0033554956,-13.289064,0.22285533,-282.35547,282.6315,2.0103023,4.8546524,-151.6265,-283.33618,-302.42822,6.864955,0.45896095,-0.61040497,79.892494,510000
|
| 4 |
+
0.64253396,279.51172,0.0043037036,-0.008590809,-14.496143,0.17736652,-279.44934,279.68048,2.02234,5.998417,-106.318825,-280.22144,-302.31702,8.020757,0.49095348,-0.53607917,73.442764,515000
|
| 5 |
+
0.64946324,284.69528,0.004213521,0.0009482005,-12.274962,0.1941945,-284.6436,284.8904,1.8179009,5.859243,-171.06764,-285.94678,-302.42395,7.677144,3.664655,-4.2297335,152.50937,520000
|
| 6 |
+
0.64851874,281.47028,0.0044555226,-0.008389951,-14.383045,0.17736971,-281.40616,281.63925,1.9743651,5.113734,-108.02618,-282.90817,-302.70517,7.088099,3.39288,-3.4057093,105.194916,525000
|
| 7 |
+
0.6590448,282.108,0.00446858,-0.001012157,-12.726505,0.19991712,-282.05115,282.30692,1.6459783,3.6566017,2.3949852,-282.91623,-302.5097,5.30258,0.5514908,-0.47224048,65.14531,530000
|
| 8 |
+
0.65717834,286.16235,0.0043604425,0.0013730011,-12.185123,0.21230601,-286.10922,286.37604,1.394222,3.4966638,-103.44467,-287.03378,-302.46027,4.890886,0.9867109,-1.0123389,63.62149,535000
|
| 9 |
+
0.6753093,281.73306,0.0043556946,0.0050711897,-11.335733,0.16924639,-281.6837,281.90738,1.602425,3.1229558,-102.35301,-282.48456,-302.2549,4.725381,0.54118687,-0.73532814,59.220146,540000
|
| 10 |
+
0.6566088,282.4691,0.004283153,0.004200968,-11.519188,0.19946557,-282.41977,282.67276,2.0064652,4.2895455,-99.30843,-283.34286,-302.69785,6.296011,2.7466438,-6.653881,118.63893,545000
|
| 11 |
+
0.6702547,281.30988,0.0041895197,0.0022060487,-11.973436,0.16854598,-281.2597,281.48062,1.3484406,4.3984976,-101.71804,-282.29572,-302.50003,5.746938,2.3096564,-2.81008,75.08936,550000
|
| 12 |
+
0.64996624,280.8162,0.004023349,-0.0010815866,-12.768827,0.18744063,-280.76483,281.00256,1.5161011,3.5669897,-99.24022,-281.81894,-302.62723,5.083091,0.46459895,-0.4238368,60.63732,555000
|
| 13 |
+
0.65406835,280.85065,0.0039708326,0.0023749424,-11.901903,0.18117136,-280.80334,281.0342,1.4838288,5.591621,-100.93049,-281.95358,-302.42758,7.07545,1.3338618,-1.5406343,98.0056,560000
|
| 14 |
+
0.65903074,282.04303,0.004168576,0.006525239,-10.93466,0.19970699,-281.99744,282.24927,1.3485047,3.6588066,-100.89266,-283.06784,-302.64685,5.0073113,0.92941684,-0.74450964,70.571,565000
|
| 15 |
+
0.654156,274.54523,0.0041874424,-0.0002570508,-12.561386,0.18130913,-274.4926,274.7263,1.5361179,4.8811355,-99.92146,-275.63208,-302.58997,6.4172535,0.7437991,-0.6460404,77.166306,570000
|
| 16 |
+
0.64024365,273.93253,0.0042919195,-0.011758467,-15.2396755,0.20564896,-273.86713,274.12643,1.7860802,6.1350827,-36.66558,-275.2302,-302.2682,7.921163,1.3881371,-1.3338459,102.117744,575000
|
| 17 |
+
0.64399517,275.4572,0.0041780183,-0.011934684,-15.356542,0.17917162,-275.39307,275.62445,1.858714,4.8050704,-100.26678,-276.7459,-302.52158,6.6637845,0.5069331,-0.36317953,65.779564,580000
|
| 18 |
+
0.65519935,277.5551,0.0040830686,-0.0042236196,-13.534423,0.1903638,-277.49982,277.74127,1.788393,7.41225,-77.43577,-278.45407,-302.32092,9.200644,2.1290636,-2.1656468,109.63863,585000
|
| 19 |
+
0.6499478,278.60513,0.004347316,0.0011670527,-12.231546,0.1813238,-278.55197,278.78763,1.6923878,6.2120194,-100.57816,-279.3454,-301.93286,7.9044075,0.8948976,-0.9816704,82.05042,590000
|
| 20 |
+
0.65493405,278.4978,0.0041355644,0.0010866221,-12.237249,0.18184271,-278.4472,278.68076,1.6918949,4.151825,-100.42406,-279.56207,-302.1095,5.84372,0.606123,-0.51206505,70.0126,595000
|
| 21 |
+
0.6440921,274.9148,0.00402248,-0.0038213897,-13.450008,0.17499566,-274.8607,275.08597,1.6653713,6.347351,-100.36592,-276.24213,-302.30768,8.012722,0.6634669,-0.6572055,72.54601,600000
|
| 22 |
+
0.66541106,278.55142,0.0043007513,0.004124706,-11.540934,0.19401859,-278.50177,278.74957,1.5629041,3.5239532,-100.53205,-279.70248,-302.72397,5.0868573,0.5023196,-0.45712885,61.717377,605000
|
| 23 |
+
0.6496609,279.09595,0.0040393746,-0.0033373756,-13.326211,0.19936857,-279.04208,279.292,1.7947426,3.5359643,-100.252174,-279.905,-302.14877,5.3307066,0.44802743,-0.5795466,63.165096,610000
|
| 24 |
+
0.6410962,274.25998,0.0041908026,-0.008252457,-14.469183,0.16964206,-274.19934,274.4214,1.3980329,4.406976,-100.09972,-275.67587,-302.62558,5.805009,0.42812753,-0.6291275,69.598785,615000
|
| 25 |
+
0.6475113,272.6054,0.004014321,0.0062023946,-10.954933,0.17531602,-272.5614,272.78693,1.3857636,4.045783,-100.034996,-273.4021,-302.50497,5.4315467,0.7223223,-0.55456954,62.701817,620000
|
| 26 |
+
0.66686493,279.5427,0.0039657517,0.0105235595,-9.84639,0.16944607,-279.50363,279.72266,1.1528013,8.209586,-99.976036,-280.12973,-302.0818,9.362388,1.235816,-1.6528295,95.44603,625000
|
| 27 |
+
0.6613433,276.98932,0.0039608967,0.0036786452,-11.5712595,0.167822,-276.9435,277.16083,1.1697361,3.9659538,-100.1421,-278.42715,-302.49448,5.1356897,0.7194244,-0.5588134,73.59481,630000
|
| 28 |
+
0.6553294,277.48907,0.003933549,0.0042172167,-11.427885,0.16597621,-277.44415,277.65927,1.6424217,3.937697,-100.25317,-278.04715,-302.23584,5.5801187,0.3884722,-0.48473638,74.911766,635000
|
| 29 |
+
0.6547197,273.35077,0.0039235977,0.0020039955,-11.989245,0.17922178,-273.3037,273.532,1.1532909,3.061859,-100.2702,-274.09482,-302.18552,4.21515,0.4519494,-0.25431377,46.820393,640000
|
| 30 |
+
0.65763044,270.4004,0.004035836,0.002765831,-11.814682,0.16117021,-270.35272,270.56433,1.7856337,4.3431754,-100.27941,-271.561,-302.4321,6.128809,0.5661363,-0.6200773,74.07515,645000
|
| 31 |
+
0.6578578,277.07782,0.003989164,0.0021242423,-11.967497,0.2093355,-277.03006,277.2893,1.0554068,3.3147073,-100.13067,-277.73465,-302.0236,4.3701143,0.30701816,-0.6334218,47.134026,650000
|
| 32 |
+
0.66149,274.747,0.0039170403,7.861903e-05,-12.479929,0.20226413,-274.69815,274.94937,1.0429538,3.5783842,-100.26443,-275.49976,-302.35846,4.621338,0.40889263,-0.37137836,52.390213,655000
|
| 33 |
+
0.6586339,270.12643,0.0040302975,0.0048105274,-11.306409,0.19770864,-270.08084,270.32898,1.4270971,4.00599,-100.1032,-271.09323,-302.28915,5.4330873,0.47264162,-0.54923874,59.601425,660000
|
| 34 |
+
0.6564718,271.09753,0.004053427,0.001999905,-12.006614,0.17686921,-271.04883,271.27643,1.3831472,3.8952348,-100.39118,-272.2464,-302.0752,5.2783823,0.59391475,-0.44214538,68.038025,665000
|
| 35 |
+
0.65270203,270.46118,0.0038130644,0.004112851,-11.421379,0.18208158,-270.41763,270.64737,5.9893494,8.596335,-100.16749,-271.5046,-302.1702,14.585685,2.040939,-3.9936056,130.16058,670000
|
| 36 |
+
0.65804404,271.1789,0.003937441,0.0026719524,-11.821399,0.20705265,-271.1324,271.38864,1.1196574,4.146377,-100.10693,-272.11633,-302.35623,5.2660346,0.6394224,-0.5033328,62.62883,675000
|
| 37 |
+
0.6515773,271.64444,0.003840263,-0.0014543562,-12.878713,0.18823653,-271.59497,271.8312,2.1273289,4.5044503,-100.30377,-272.41626,-302.073,6.631779,0.39479148,-0.5832519,70.361786,680000
|
| 38 |
+
0.65639526,267.5936,0.0035606774,0.0010649168,-12.200923,0.17778195,-267.55017,267.77246,1.4803528,2.729139,-100.28829,-268.24026,-302.39996,4.2094917,0.45577335,-0.32739058,50.48861,685000
|
| 39 |
+
0.6585547,267.57278,0.003848362,0.00213829,-11.944364,0.16491027,-267.5268,267.73984,1.1999657,3.9507809,-100.23173,-268.33737,-302.17996,5.1507463,0.8598517,-0.94193274,67.2074,690000
|
| 40 |
+
0.64795196,274.61438,0.0039766077,-0.0043735798,-13.599827,0.21267137,-274.5603,274.8227,1.448272,3.2389607,-100.028015,-275.47946,-302.151,4.687233,0.504261,-0.5026045,54.90171,695000
|
| 41 |
+
0.65903914,267.42685,0.003929865,3.9494436e-05,-12.48995,0.19844292,-267.37775,267.62534,1.4019492,6.6904254,-100.047264,-268.0916,-302.0159,8.092375,1.1006799,-1.133639,88.083954,700000
|
| 42 |
+
0.654465,266.766,0.0039654626,-0.0044943304,-13.6333685,0.2007213,-266.7119,266.96222,2.453056,4.870449,-100.27568,-267.1039,-301.96866,7.3235054,0.6881039,-0.8729202,93.83666,705000
|
| 43 |
+
0.6598286,269.7295,0.0039366,0.009884002,-9.989203,0.1643028,-269.6902,269.9037,1.2517636,3.616803,-100.33865,-270.6122,-302.15054,4.8685665,0.35371718,-0.4636666,58.86762,710000
|
| 44 |
+
0.65873635,266.86548,0.0039079622,-8.9956746e-05,-12.523019,0.17943174,-266.81653,267.04483,1.2043087,2.9442682,-91.77467,-267.58054,-302.08554,4.1485767,0.49964902,-0.47979164,54.32775,715000
|
| 45 |
+
0.6491007,271.56396,0.0037551192,-0.0029110468,-13.275221,0.1852826,-271.51413,271.74634,1.0828753,3.629132,-100.25554,-272.5719,-302.08646,4.7120075,0.48159328,-0.44247323,54.44368,720000
|
| 46 |
+
0.64970535,273.51233,0.003922672,-0.005965606,-14.020802,0.15443659,-273.45734,273.66083,1.1719073,3.3286805,-100.27914,-274.41037,-302.28577,4.500588,0.4507487,-0.42968816,47.86422,725000
|
| 47 |
+
0.65824324,272.8471,0.0039757695,0.00033541536,-12.415635,0.18737072,-272.79773,273.03482,1.3791993,5.950578,-100.22128,-274.27057,-302.16833,7.3297777,2.2802033,-2.0377588,79.12106,730000
|
| 48 |
+
0.66684127,269.41754,0.0037930442,0.008523244,-10.252928,0.18753831,-269.37866,269.6136,1.3561953,4.563749,-39.105396,-270.27875,-301.86578,5.9199443,0.54330045,-0.61932176,66.64336,735000
|
| 49 |
+
0.6549791,272.51184,0.0037475347,-0.0039762766,-13.561038,0.15051734,-272.46106,272.6584,2.6842532,3.9534855,-100.29303,-273.83545,-301.96072,6.6377387,0.65364367,-0.50323796,75.37738,740000
|
| 50 |
+
0.660583,264.27094,0.0038873174,0.005876345,-10.988329,0.15288179,-264.2282,264.42972,1.1613934,3.7703264,-100.06768,-264.5982,-302.01605,4.93172,0.79439616,-1.1263962,81.93108,745000
|
| 51 |
+
0.67569375,273.83072,0.003647474,0.0073077525,-10.49649,0.15170161,-273.79242,273.98972,1.1124833,2.901037,-100.27383,-275.1587,-302.17755,4.0135202,0.800637,-0.6174868,72.36986,750000
|
| 52 |
+
0.659771,267.953,0.0035435888,0.006766527,-10.5904875,0.17106886,-267.91547,268.13086,1.0859827,3.827282,-100.34251,-268.78073,-302.244,4.9132648,0.50307035,-0.5714288,47.62855,755000
|
| 53 |
+
0.65912855,266.71906,0.0036389667,0.004088271,-11.37653,0.20112103,-266.67764,266.92426,1.0303773,4.0326047,-100.32261,-267.38547,-302.83835,5.062982,0.5884076,-0.6155299,61.199135,760000
|
| 54 |
+
0.6533072,267.51697,0.0037740231,-0.003154106,-13.335741,0.17709541,-267.4666,267.69092,1.2856374,4.262731,-99.89339,-269.07477,-302.09225,5.5483685,0.7513955,-0.4752431,75.81791,765000
|
| 55 |
+
0.6505034,272.10205,0.0038065733,-0.0031955692,-13.339487,0.18426293,-272.0513,272.2831,1.6317999,3.0589836,-100.169044,-272.6441,-302.14038,4.6907835,1.9642518,-1.8907006,97.60035,770000
|
| 56 |
+
0.6669611,264.73584,0.0038625028,0.0042426544,-11.401579,0.1799136,-264.6918,264.91998,2.136467,4.1961007,-51.583878,-266.09775,-301.93106,6.3325677,0.58273274,-0.56520087,67.05593,775000
|
| 57 |
+
0.6706135,264.33484,0.0038459369,0.00063872035,-12.333923,0.17666805,-264.28738,264.51215,0.89271766,3.1907961,-100.28022,-265.40146,-302.11288,4.0835137,0.62755805,-0.44962803,54.27177,780000
|
| 58 |
+
0.6393167,270.19983,0.0036216215,-0.009497967,-15.122573,0.18963808,-270.14508,270.37997,1.5215266,3.1575873,-100.359474,-270.8645,-302.08258,4.679114,0.41344947,-0.4369626,56.093754,785000
|
| 59 |
+
0.6583575,263.63232,0.0038283148,-0.0021768918,-13.068629,0.1867085,-263.58228,263.81686,1.341794,3.2047203,-100.23556,-264.60916,-302.22928,4.5465145,0.6111065,-0.58238685,58.104137,790000
|
| 60 |
+
0.660354,270.9447,0.0034488959,0.0027820657,-11.693346,0.17695838,-270.90436,271.12445,1.0112712,3.002655,-100.21121,-271.57755,-302.12866,4.0139265,0.32436568,-0.39716777,49.948387,795000
|
| 61 |
+
0.6612035,265.60034,0.0035471169,0.006082298,-10.785284,0.17400928,-265.56207,265.78043,0.854949,3.72716,-100.35894,-266.7373,-302.2896,4.582109,4.4497485,-2.0588434,91.694855,800000
|
| 62 |
+
0.66160077,264.6712,0.003556632,0.0058699506,-10.849576,0.19140334,-264.63263,264.86847,0.988584,2.7916417,-100.35386,-265.2942,-302.07452,3.7802258,0.47160432,-0.32477254,41.041553,805000
|
| 63 |
+
0.65140325,262.6825,0.0035989904,-0.004620515,-13.783836,0.17776537,-262.63287,262.85565,1.1168289,2.9251237,-100.39459,-263.50278,-302.17273,4.0419526,0.45007935,-0.26391026,49.118736,810000
|
| 64 |
+
0.65736234,258.56592,0.0036489125,-6.691102e-05,-12.518337,0.18602231,-258.52026,258.7519,1.65688,3.500407,-99.35056,-259.3193,-302.01044,5.157287,0.4767809,-0.31385258,53.574795,815000
|
| 65 |
+
0.6609553,254.82785,0.0035622923,0.009012514,-9.970024,0.16699883,-254.79233,255.00386,1.3061771,2.9790673,-100.2149,-255.57378,-302.33063,4.2852445,0.40408978,-0.43442953,46.331448,820000
|
| 66 |
+
0.65997165,266.86395,0.003466293,-0.0030131852,-13.369282,0.17107767,-266.8176,267.032,1.2300591,3.1246192,-100.216736,-268.05548,-302.19327,4.354678,0.63331866,-0.44845146,53.569023,825000
|
| 67 |
+
0.6597874,262.56848,0.0033510067,0.0004083937,-12.378128,0.17262757,-262.527,262.74152,1.1972287,2.9701624,-100.11888,-263.67044,-301.90247,4.167391,1.3787316,-1.3200547,57.63839,830000
|
| 68 |
+
0.661816,260.10144,0.0034279132,0.0014635001,-12.073064,0.18463403,-260.06006,260.28754,0.9610017,3.604702,-100.26887,-260.74136,-302.25555,4.565704,0.4801946,-0.47190732,49.2775,835000
|
| 69 |
+
0.6729698,268.84448,0.0034654387,0.005585796,-10.888142,0.1918374,-268.80673,269.0419,1.0130769,3.2839723,-100.1103,-269.29523,-301.7728,4.297049,0.46723855,-0.79178226,67.18686,840000
|
| 70 |
+
0.6475446,268.9315,0.0035538126,-0.005582338,-14.070803,0.18204898,-268.8815,269.10794,1.1875839,2.9777095,-100.19597,-269.89746,-302.02164,4.1652937,0.36196595,-0.31968978,48.15271,845000
|
| 71 |
+
0.66225183,261.26642,0.003524,0.003473552,-11.514316,0.15395162,-261.22583,261.42386,1.3212742,6.821426,-100.32072,-262.14127,-302.14597,8.1427,1.1449107,-1.2660453,87.37157,850000
|
| 72 |
+
0.6458808,262.50894,0.0035564436,-0.00748794,-14.605457,0.1718918,-262.457,262.67337,1.3812838,4.410611,-100.29953,-263.7125,-302.12747,5.791895,0.45800027,-0.3847227,58.874794,855000
|
| 73 |
+
0.6533093,262.20276,0.003306043,0.00094456755,-12.214291,0.16670758,-262.16238,262.37042,1.373183,2.6442707,-100.34472,-262.90295,-301.75812,4.0174537,0.59678143,-0.6023824,45.552795,860000
|
| 74 |
+
0.67128074,265.81143,0.0035794713,0.006958329,-10.556046,0.17598487,-265.77365,265.9944,0.92725104,2.9992085,-100.22694,-266.72894,-302.0214,3.9264596,0.5033796,-0.48129946,53.767544,865000
|
| 75 |
+
0.6639645,256.6471,0.0034052937,-0.00041215844,-12.621035,0.13910717,-256.60413,256.78577,1.0672913,2.268841,-100.242516,-257.22958,-301.9998,3.3361323,0.33892122,-0.37365082,46.651367,870000
|
| 76 |
+
0.64887756,265.70367,0.0034828065,-0.007252368,-14.5823345,0.14883053,-265.6529,265.84525,1.3585048,3.2215207,-100.32057,-266.65012,-302.41916,4.5800257,1.4365287,-1.015739,65.32008,875000
|
| 77 |
+
0.6491017,262.06558,0.00333764,0.001290693,-12.113292,0.1597955,-262.02515,262.22665,1.2567949,3.1631486,-60.158665,-262.60587,-302.05194,4.419944,0.41426903,-0.45999384,57.531513,880000
|
| 78 |
+
0.64904034,262.63193,0.0036440473,-0.011081178,-15.540898,0.14113033,-262.57532,262.762,1.2622297,3.8852978,-57.618084,-263.7565,-301.86826,5.1475277,2.0148263,-2.0418425,72.76189,885000
|
| 79 |
+
0.66686904,257.7063,0.003370074,0.0040569217,-11.296192,0.18583782,-257.66827,257.8962,1.4001695,2.931129,-100.22185,-258.3873,-302.1135,4.3312984,0.8963166,-0.87369686,64.19837,890000
|
| 80 |
+
0.66846687,261.21484,0.003716214,-0.0041712783,-13.622454,0.15039398,-261.16425,261.36105,1.42408,3.8545258,-58.864037,-261.8497,-302.00986,5.278606,0.5176733,-0.8860972,60.892822,895000
|
| 81 |
+
0.6616928,260.28625,0.0033758853,0.0017230834,-11.989591,0.18185063,-260.2458,260.46982,1.0287497,5.0489364,-100.2207,-260.7898,-301.86118,6.0776863,3.8054667,-3.364719,102.93163,900000
|
| 82 |
+
0.6607762,261.81195,0.0033868994,0.0045329384,-11.161626,0.19677435,-261.77414,262.01328,1.3420513,2.680408,-100.22532,-262.45126,-301.9041,4.022459,0.4306695,-0.49891794,51.281128,905000
|
| 83 |
+
0.6591948,261.89047,0.0032551696,-0.002847218,-13.374676,0.16035116,-261.84692,262.04797,1.0049092,3.9302957,-100.32098,-263.2369,-302.17883,4.935205,0.44956487,-0.48775324,53.508183,910000
|
| 84 |
+
0.6646911,254.03027,0.0032549894,0.0015933082,-12.010503,0.18312363,-253.99118,254.21498,0.94391555,2.6857595,-100.24098,-254.69376,-302.22104,3.6296751,0.38873577,-0.5574588,46.66717,915000
|
| 85 |
+
0.6550456,261.82407,0.0034827136,-0.0018453855,-13.02987,0.14818305,-261.7787,261.97043,1.5327252,2.7634144,-100.26288,-262.33023,-302.13095,4.2961397,0.3025517,-0.2753719,47.400536,920000
|
| 86 |
+
0.64301986,263.792,0.0032643822,-0.004605982,-13.910981,0.1737886,-263.74658,263.96118,1.119194,3.8596017,-100.06816,-264.1212,-302.46982,4.978796,0.43353498,-0.635875,69.33059,925000
|
| 87 |
+
0.6405682,259.21338,0.0033984305,-0.006373574,-14.375446,0.1684061,-259.1645,259.3754,1.2560793,4.198245,-100.2315,-260.05942,-301.99396,5.4543242,0.35991946,-0.4241051,60.18328,930000
|
| 88 |
+
0.659425,257.3658,0.0030532745,0.0057108547,-10.629597,0.18215698,-257.33334,257.55368,1.8099288,2.849876,-100.13437,-258.04395,-301.86725,4.659805,0.4479385,-0.45597848,52.865494,935000
|
| 89 |
+
0.668947,255.81494,0.0033168374,-0.00049985875,-12.650703,0.19116437,-255.77298,256.0056,1.8097489,3.2686841,-100.2608,-256.47565,-301.8953,5.078433,0.52237636,-0.5262101,58.495743,940000
|
| 90 |
+
0.67086303,250.86426,0.003449901,0.005241545,-10.980668,0.14667575,-250.82637,251.01619,1.8482136,3.2666566,-45.504993,-251.88394,-301.8986,5.11487,0.5782371,-0.37540194,59.916058,945000
|
| 91 |
+
0.6692862,256.6159,0.003446016,0.008727638,-9.967325,0.1828635,-256.58154,256.8075,0.77006304,4.6359344,-100.29463,-257.49756,-301.81592,5.4059973,0.79986614,-1.3263894,48.205376,950000
|
| 92 |
+
0.6632227,259.28906,0.0034777797,0.003302885,-11.550289,0.17131753,-259.24893,259.46368,1.2018646,2.635976,-100.29667,-260.0095,-301.98438,3.8378406,0.3772642,-0.4393739,45.591316,955000
|
| 93 |
+
0.6635672,249.6278,0.0032623268,0.0074428893,-10.2185335,0.16292073,-249.59448,249.79817,1.1667366,2.8812551,-100.169495,-250.52197,-301.71265,4.0479918,0.4839263,-0.28421694,47.26676,960000
|
| 94 |
+
0.6578454,253.80338,0.0032295156,-2.3013059e-05,-12.507126,0.18230997,-253.76299,253.98566,1.3159975,2.949149,-100.25543,-254.31084,-301.89313,4.2651463,0.37375084,-0.3230095,49.35797,965000
|
| 95 |
+
0.65563077,257.8425,0.0033530528,-0.0032277917,-13.462643,0.1692284,-257.79733,258.00848,1.2426844,2.6231441,-99.64882,-258.79224,-301.9296,3.8658285,0.36780477,-0.42535925,43.829018,970000
|
| 96 |
+
0.66448766,253.32779,0.0031828461,0.0019235563,-11.895649,0.15422365,-253.28992,253.48393,1.1299638,2.8972435,-100.2213,-253.76973,-301.96,4.0272074,0.4436818,-0.3324184,44.530373,975000
|
| 97 |
+
0.67096025,262.0478,0.0032576555,0.0052718343,-10.881709,0.16283634,-262.0124,262.2159,1.097958,4.4795427,-100.242096,-263.06177,-301.80212,5.577501,0.81732154,-1.0260156,63.47316,980000
|
| 98 |
+
0.65371263,261.46448,0.0034228938,-0.0033714545,-13.484972,0.16992252,-261.4183,261.63104,0.9755501,3.0850713,-100.239426,-262.37802,-301.9889,4.0606213,0.3768756,-0.37279937,44.370087,985000
|
| 99 |
+
0.6475131,254.62534,0.003390074,-0.0015821914,-12.966713,0.16861197,-254.58138,254.79236,1.3092974,4.2092037,-100.25667,-255.42705,-301.78094,5.5185013,1.4193403,-1.5999489,59.263725,990000
|
| 100 |
+
0.66602886,253.32042,0.0031676088,-0.00065718964,-12.707472,0.1731353,-253.28018,253.4929,1.0007268,2.7954175,-100.11356,-253.89241,-301.8325,3.7961445,0.41382098,-0.39672512,50.639988,995000
|
| 101 |
+
0.64553696,260.55115,0.0031723627,-0.008678066,-15.235521,0.14429584,-260.5028,260.68677,1.1913785,3.8330712,-99.25356,-261.5567,-301.85995,5.02445,0.7915227,-0.64243615,53.116688,1000000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.6579108,285.24158,0.004269041,-0.0044148173,-13.534147,0.19352192,-285.18384,285.43066,2.305907,12.363885,-108.428825,-286.3291,-302.3941,14.669792,7.704104,-7.999422,182.68709,505000
|
| 3 |
+
0.6482419,282.412,0.004252499,-0.0033554956,-13.289064,0.22285533,-282.35547,282.6315,2.0103023,4.8546524,-151.6265,-283.33618,-302.42822,6.864955,0.45896095,-0.61040497,79.892494,510000
|
| 4 |
+
0.64253396,279.51172,0.0043037036,-0.008590809,-14.496143,0.17736652,-279.44934,279.68048,2.02234,5.998417,-106.318825,-280.22144,-302.31702,8.020757,0.49095348,-0.53607917,73.442764,515000
|
| 5 |
+
0.64946324,284.69528,0.004213521,0.0009482005,-12.274962,0.1941945,-284.6436,284.8904,1.8179009,5.859243,-171.06764,-285.94678,-302.42395,7.677144,3.664655,-4.2297335,152.50937,520000
|
| 6 |
+
0.64851874,281.47028,0.0044555226,-0.008389951,-14.383045,0.17736971,-281.40616,281.63925,1.9743651,5.113734,-108.02618,-282.90817,-302.70517,7.088099,3.39288,-3.4057093,105.194916,525000
|
| 7 |
+
0.6590448,282.108,0.00446858,-0.001012157,-12.726505,0.19991712,-282.05115,282.30692,1.6459783,3.6566017,2.3949852,-282.91623,-302.5097,5.30258,0.5514908,-0.47224048,65.14531,530000
|
| 8 |
+
0.65717834,286.16235,0.0043604425,0.0013730011,-12.185123,0.21230601,-286.10922,286.37604,1.394222,3.4966638,-103.44467,-287.03378,-302.46027,4.890886,0.9867109,-1.0123389,63.62149,535000
|
| 9 |
+
0.6753093,281.73306,0.0043556946,0.0050711897,-11.335733,0.16924639,-281.6837,281.90738,1.602425,3.1229558,-102.35301,-282.48456,-302.2549,4.725381,0.54118687,-0.73532814,59.220146,540000
|
| 10 |
+
0.6566088,282.4691,0.004283153,0.004200968,-11.519188,0.19946557,-282.41977,282.67276,2.0064652,4.2895455,-99.30843,-283.34286,-302.69785,6.296011,2.7466438,-6.653881,118.63893,545000
|
| 11 |
+
0.6702547,281.30988,0.0041895197,0.0022060487,-11.973436,0.16854598,-281.2597,281.48062,1.3484406,4.3984976,-101.71804,-282.29572,-302.50003,5.746938,2.3096564,-2.81008,75.08936,550000
|
| 12 |
+
0.64996624,280.8162,0.004023349,-0.0010815866,-12.768827,0.18744063,-280.76483,281.00256,1.5161011,3.5669897,-99.24022,-281.81894,-302.62723,5.083091,0.46459895,-0.4238368,60.63732,555000
|
| 13 |
+
0.65406835,280.85065,0.0039708326,0.0023749424,-11.901903,0.18117136,-280.80334,281.0342,1.4838288,5.591621,-100.93049,-281.95358,-302.42758,7.07545,1.3338618,-1.5406343,98.0056,560000
|
| 14 |
+
0.65903074,282.04303,0.004168576,0.006525239,-10.93466,0.19970699,-281.99744,282.24927,1.3485047,3.6588066,-100.89266,-283.06784,-302.64685,5.0073113,0.92941684,-0.74450964,70.571,565000
|
| 15 |
+
0.654156,274.54523,0.0041874424,-0.0002570508,-12.561386,0.18130913,-274.4926,274.7263,1.5361179,4.8811355,-99.92146,-275.63208,-302.58997,6.4172535,0.7437991,-0.6460404,77.166306,570000
|
| 16 |
+
0.64024365,273.93253,0.0042919195,-0.011758467,-15.2396755,0.20564896,-273.86713,274.12643,1.7860802,6.1350827,-36.66558,-275.2302,-302.2682,7.921163,1.3881371,-1.3338459,102.117744,575000
|
| 17 |
+
0.64399517,275.4572,0.0041780183,-0.011934684,-15.356542,0.17917162,-275.39307,275.62445,1.858714,4.8050704,-100.26678,-276.7459,-302.52158,6.6637845,0.5069331,-0.36317953,65.779564,580000
|
| 18 |
+
0.65519935,277.5551,0.0040830686,-0.0042236196,-13.534423,0.1903638,-277.49982,277.74127,1.788393,7.41225,-77.43577,-278.45407,-302.32092,9.200644,2.1290636,-2.1656468,109.63863,585000
|
| 19 |
+
0.6499478,278.60513,0.004347316,0.0011670527,-12.231546,0.1813238,-278.55197,278.78763,1.6923878,6.2120194,-100.57816,-279.3454,-301.93286,7.9044075,0.8948976,-0.9816704,82.05042,590000
|
| 20 |
+
0.65493405,278.4978,0.0041355644,0.0010866221,-12.237249,0.18184271,-278.4472,278.68076,1.6918949,4.151825,-100.42406,-279.56207,-302.1095,5.84372,0.606123,-0.51206505,70.0126,595000
|
| 21 |
+
0.6440921,274.9148,0.00402248,-0.0038213897,-13.450008,0.17499566,-274.8607,275.08597,1.6653713,6.347351,-100.36592,-276.24213,-302.30768,8.012722,0.6634669,-0.6572055,72.54601,600000
|
| 22 |
+
0.66541106,278.55142,0.0043007513,0.004124706,-11.540934,0.19401859,-278.50177,278.74957,1.5629041,3.5239532,-100.53205,-279.70248,-302.72397,5.0868573,0.5023196,-0.45712885,61.717377,605000
|
| 23 |
+
0.6496609,279.09595,0.0040393746,-0.0033373756,-13.326211,0.19936857,-279.04208,279.292,1.7947426,3.5359643,-100.252174,-279.905,-302.14877,5.3307066,0.44802743,-0.5795466,63.165096,610000
|
| 24 |
+
0.6410962,274.25998,0.0041908026,-0.008252457,-14.469183,0.16964206,-274.19934,274.4214,1.3980329,4.406976,-100.09972,-275.67587,-302.62558,5.805009,0.42812753,-0.6291275,69.598785,615000
|
| 25 |
+
0.6475113,272.6054,0.004014321,0.0062023946,-10.954933,0.17531602,-272.5614,272.78693,1.3857636,4.045783,-100.034996,-273.4021,-302.50497,5.4315467,0.7223223,-0.55456954,62.701817,620000
|
| 26 |
+
0.66686493,279.5427,0.0039657517,0.0105235595,-9.84639,0.16944607,-279.50363,279.72266,1.1528013,8.209586,-99.976036,-280.12973,-302.0818,9.362388,1.235816,-1.6528295,95.44603,625000
|
| 27 |
+
0.6613433,276.98932,0.0039608967,0.0036786452,-11.5712595,0.167822,-276.9435,277.16083,1.1697361,3.9659538,-100.1421,-278.42715,-302.49448,5.1356897,0.7194244,-0.5588134,73.59481,630000
|
| 28 |
+
0.6553294,277.48907,0.003933549,0.0042172167,-11.427885,0.16597621,-277.44415,277.65927,1.6424217,3.937697,-100.25317,-278.04715,-302.23584,5.5801187,0.3884722,-0.48473638,74.911766,635000
|
| 29 |
+
0.6547197,273.35077,0.0039235977,0.0020039955,-11.989245,0.17922178,-273.3037,273.532,1.1532909,3.061859,-100.2702,-274.09482,-302.18552,4.21515,0.4519494,-0.25431377,46.820393,640000
|
| 30 |
+
0.65763044,270.4004,0.004035836,0.002765831,-11.814682,0.16117021,-270.35272,270.56433,1.7856337,4.3431754,-100.27941,-271.561,-302.4321,6.128809,0.5661363,-0.6200773,74.07515,645000
|
| 31 |
+
0.6578578,277.07782,0.003989164,0.0021242423,-11.967497,0.2093355,-277.03006,277.2893,1.0554068,3.3147073,-100.13067,-277.73465,-302.0236,4.3701143,0.30701816,-0.6334218,47.134026,650000
|
| 32 |
+
0.66149,274.747,0.0039170403,7.861903e-05,-12.479929,0.20226413,-274.69815,274.94937,1.0429538,3.5783842,-100.26443,-275.49976,-302.35846,4.621338,0.40889263,-0.37137836,52.390213,655000
|
| 33 |
+
0.6586339,270.12643,0.0040302975,0.0048105274,-11.306409,0.19770864,-270.08084,270.32898,1.4270971,4.00599,-100.1032,-271.09323,-302.28915,5.4330873,0.47264162,-0.54923874,59.601425,660000
|
| 34 |
+
0.6564718,271.09753,0.004053427,0.001999905,-12.006614,0.17686921,-271.04883,271.27643,1.3831472,3.8952348,-100.39118,-272.2464,-302.0752,5.2783823,0.59391475,-0.44214538,68.038025,665000
|
| 35 |
+
0.65270203,270.46118,0.0038130644,0.004112851,-11.421379,0.18208158,-270.41763,270.64737,5.9893494,8.596335,-100.16749,-271.5046,-302.1702,14.585685,2.040939,-3.9936056,130.16058,670000
|
| 36 |
+
0.65804404,271.1789,0.003937441,0.0026719524,-11.821399,0.20705265,-271.1324,271.38864,1.1196574,4.146377,-100.10693,-272.11633,-302.35623,5.2660346,0.6394224,-0.5033328,62.62883,675000
|
| 37 |
+
0.6515773,271.64444,0.003840263,-0.0014543562,-12.878713,0.18823653,-271.59497,271.8312,2.1273289,4.5044503,-100.30377,-272.41626,-302.073,6.631779,0.39479148,-0.5832519,70.361786,680000
|
| 38 |
+
0.65639526,267.5936,0.0035606774,0.0010649168,-12.200923,0.17778195,-267.55017,267.77246,1.4803528,2.729139,-100.28829,-268.24026,-302.39996,4.2094917,0.45577335,-0.32739058,50.48861,685000
|
| 39 |
+
0.6585547,267.57278,0.003848362,0.00213829,-11.944364,0.16491027,-267.5268,267.73984,1.1999657,3.9507809,-100.23173,-268.33737,-302.17996,5.1507463,0.8598517,-0.94193274,67.2074,690000
|
| 40 |
+
0.64795196,274.61438,0.0039766077,-0.0043735798,-13.599827,0.21267137,-274.5603,274.8227,1.448272,3.2389607,-100.028015,-275.47946,-302.151,4.687233,0.504261,-0.5026045,54.90171,695000
|
| 41 |
+
0.65903914,267.42685,0.003929865,3.9494436e-05,-12.48995,0.19844292,-267.37775,267.62534,1.4019492,6.6904254,-100.047264,-268.0916,-302.0159,8.092375,1.1006799,-1.133639,88.083954,700000
|
| 42 |
+
0.654465,266.766,0.0039654626,-0.0044943304,-13.6333685,0.2007213,-266.7119,266.96222,2.453056,4.870449,-100.27568,-267.1039,-301.96866,7.3235054,0.6881039,-0.8729202,93.83666,705000
|
| 43 |
+
0.6598286,269.7295,0.0039366,0.009884002,-9.989203,0.1643028,-269.6902,269.9037,1.2517636,3.616803,-100.33865,-270.6122,-302.15054,4.8685665,0.35371718,-0.4636666,58.86762,710000
|
| 44 |
+
0.65873635,266.86548,0.0039079622,-8.9956746e-05,-12.523019,0.17943174,-266.81653,267.04483,1.2043087,2.9442682,-91.77467,-267.58054,-302.08554,4.1485767,0.49964902,-0.47979164,54.32775,715000
|
| 45 |
+
0.6491007,271.56396,0.0037551192,-0.0029110468,-13.275221,0.1852826,-271.51413,271.74634,1.0828753,3.629132,-100.25554,-272.5719,-302.08646,4.7120075,0.48159328,-0.44247323,54.44368,720000
|
| 46 |
+
0.64970535,273.51233,0.003922672,-0.005965606,-14.020802,0.15443659,-273.45734,273.66083,1.1719073,3.3286805,-100.27914,-274.41037,-302.28577,4.500588,0.4507487,-0.42968816,47.86422,725000
|
| 47 |
+
0.65824324,272.8471,0.0039757695,0.00033541536,-12.415635,0.18737072,-272.79773,273.03482,1.3791993,5.950578,-100.22128,-274.27057,-302.16833,7.3297777,2.2802033,-2.0377588,79.12106,730000
|
| 48 |
+
0.66684127,269.41754,0.0037930442,0.008523244,-10.252928,0.18753831,-269.37866,269.6136,1.3561953,4.563749,-39.105396,-270.27875,-301.86578,5.9199443,0.54330045,-0.61932176,66.64336,735000
|
| 49 |
+
0.6549791,272.51184,0.0037475347,-0.0039762766,-13.561038,0.15051734,-272.46106,272.6584,2.6842532,3.9534855,-100.29303,-273.83545,-301.96072,6.6377387,0.65364367,-0.50323796,75.37738,740000
|
| 50 |
+
0.660583,264.27094,0.0038873174,0.005876345,-10.988329,0.15288179,-264.2282,264.42972,1.1613934,3.7703264,-100.06768,-264.5982,-302.01605,4.93172,0.79439616,-1.1263962,81.93108,745000
|
| 51 |
+
0.67569375,273.83072,0.003647474,0.0073077525,-10.49649,0.15170161,-273.79242,273.98972,1.1124833,2.901037,-100.27383,-275.1587,-302.17755,4.0135202,0.800637,-0.6174868,72.36986,750000
|
| 52 |
+
0.659771,267.953,0.0035435888,0.006766527,-10.5904875,0.17106886,-267.91547,268.13086,1.0859827,3.827282,-100.34251,-268.78073,-302.244,4.9132648,0.50307035,-0.5714288,47.62855,755000
|
| 53 |
+
0.65912855,266.71906,0.0036389667,0.004088271,-11.37653,0.20112103,-266.67764,266.92426,1.0303773,4.0326047,-100.32261,-267.38547,-302.83835,5.062982,0.5884076,-0.6155299,61.199135,760000
|
| 54 |
+
0.6533072,267.51697,0.0037740231,-0.003154106,-13.335741,0.17709541,-267.4666,267.69092,1.2856374,4.262731,-99.89339,-269.07477,-302.09225,5.5483685,0.7513955,-0.4752431,75.81791,765000
|
| 55 |
+
0.6505034,272.10205,0.0038065733,-0.0031955692,-13.339487,0.18426293,-272.0513,272.2831,1.6317999,3.0589836,-100.169044,-272.6441,-302.14038,4.6907835,1.9642518,-1.8907006,97.60035,770000
|
| 56 |
+
0.6669611,264.73584,0.0038625028,0.0042426544,-11.401579,0.1799136,-264.6918,264.91998,2.136467,4.1961007,-51.583878,-266.09775,-301.93106,6.3325677,0.58273274,-0.56520087,67.05593,775000
|
| 57 |
+
0.6706135,264.33484,0.0038459369,0.00063872035,-12.333923,0.17666805,-264.28738,264.51215,0.89271766,3.1907961,-100.28022,-265.40146,-302.11288,4.0835137,0.62755805,-0.44962803,54.27177,780000
|
| 58 |
+
0.6393167,270.19983,0.0036216215,-0.009497967,-15.122573,0.18963808,-270.14508,270.37997,1.5215266,3.1575873,-100.359474,-270.8645,-302.08258,4.679114,0.41344947,-0.4369626,56.093754,785000
|
| 59 |
+
0.6583575,263.63232,0.0038283148,-0.0021768918,-13.068629,0.1867085,-263.58228,263.81686,1.341794,3.2047203,-100.23556,-264.60916,-302.22928,4.5465145,0.6111065,-0.58238685,58.104137,790000
|
| 60 |
+
0.660354,270.9447,0.0034488959,0.0027820657,-11.693346,0.17695838,-270.90436,271.12445,1.0112712,3.002655,-100.21121,-271.57755,-302.12866,4.0139265,0.32436568,-0.39716777,49.948387,795000
|
| 61 |
+
0.6612035,265.60034,0.0035471169,0.006082298,-10.785284,0.17400928,-265.56207,265.78043,0.854949,3.72716,-100.35894,-266.7373,-302.2896,4.582109,4.4497485,-2.0588434,91.694855,800000
|
| 62 |
+
0.66160077,264.6712,0.003556632,0.0058699506,-10.849576,0.19140334,-264.63263,264.86847,0.988584,2.7916417,-100.35386,-265.2942,-302.07452,3.7802258,0.47160432,-0.32477254,41.041553,805000
|
| 63 |
+
0.65140325,262.6825,0.0035989904,-0.004620515,-13.783836,0.17776537,-262.63287,262.85565,1.1168289,2.9251237,-100.39459,-263.50278,-302.17273,4.0419526,0.45007935,-0.26391026,49.118736,810000
|
| 64 |
+
0.65736234,258.56592,0.0036489125,-6.691102e-05,-12.518337,0.18602231,-258.52026,258.7519,1.65688,3.500407,-99.35056,-259.3193,-302.01044,5.157287,0.4767809,-0.31385258,53.574795,815000
|
| 65 |
+
0.6609553,254.82785,0.0035622923,0.009012514,-9.970024,0.16699883,-254.79233,255.00386,1.3061771,2.9790673,-100.2149,-255.57378,-302.33063,4.2852445,0.40408978,-0.43442953,46.331448,820000
|
| 66 |
+
0.65997165,266.86395,0.003466293,-0.0030131852,-13.369282,0.17107767,-266.8176,267.032,1.2300591,3.1246192,-100.216736,-268.05548,-302.19327,4.354678,0.63331866,-0.44845146,53.569023,825000
|
| 67 |
+
0.6597874,262.56848,0.0033510067,0.0004083937,-12.378128,0.17262757,-262.527,262.74152,1.1972287,2.9701624,-100.11888,-263.67044,-301.90247,4.167391,1.3787316,-1.3200547,57.63839,830000
|
| 68 |
+
0.661816,260.10144,0.0034279132,0.0014635001,-12.073064,0.18463403,-260.06006,260.28754,0.9610017,3.604702,-100.26887,-260.74136,-302.25555,4.565704,0.4801946,-0.47190732,49.2775,835000
|
| 69 |
+
0.6729698,268.84448,0.0034654387,0.005585796,-10.888142,0.1918374,-268.80673,269.0419,1.0130769,3.2839723,-100.1103,-269.29523,-301.7728,4.297049,0.46723855,-0.79178226,67.18686,840000
|
| 70 |
+
0.6475446,268.9315,0.0035538126,-0.005582338,-14.070803,0.18204898,-268.8815,269.10794,1.1875839,2.9777095,-100.19597,-269.89746,-302.02164,4.1652937,0.36196595,-0.31968978,48.15271,845000
|
| 71 |
+
0.66225183,261.26642,0.003524,0.003473552,-11.514316,0.15395162,-261.22583,261.42386,1.3212742,6.821426,-100.32072,-262.14127,-302.14597,8.1427,1.1449107,-1.2660453,87.37157,850000
|
| 72 |
+
0.6458808,262.50894,0.0035564436,-0.00748794,-14.605457,0.1718918,-262.457,262.67337,1.3812838,4.410611,-100.29953,-263.7125,-302.12747,5.791895,0.45800027,-0.3847227,58.874794,855000
|
| 73 |
+
0.6533093,262.20276,0.003306043,0.00094456755,-12.214291,0.16670758,-262.16238,262.37042,1.373183,2.6442707,-100.34472,-262.90295,-301.75812,4.0174537,0.59678143,-0.6023824,45.552795,860000
|
| 74 |
+
0.67128074,265.81143,0.0035794713,0.006958329,-10.556046,0.17598487,-265.77365,265.9944,0.92725104,2.9992085,-100.22694,-266.72894,-302.0214,3.9264596,0.5033796,-0.48129946,53.767544,865000
|
| 75 |
+
0.6639645,256.6471,0.0034052937,-0.00041215844,-12.621035,0.13910717,-256.60413,256.78577,1.0672913,2.268841,-100.242516,-257.22958,-301.9998,3.3361323,0.33892122,-0.37365082,46.651367,870000
|
| 76 |
+
0.64887756,265.70367,0.0034828065,-0.007252368,-14.5823345,0.14883053,-265.6529,265.84525,1.3585048,3.2215207,-100.32057,-266.65012,-302.41916,4.5800257,1.4365287,-1.015739,65.32008,875000
|
| 77 |
+
0.6491017,262.06558,0.00333764,0.001290693,-12.113292,0.1597955,-262.02515,262.22665,1.2567949,3.1631486,-60.158665,-262.60587,-302.05194,4.419944,0.41426903,-0.45999384,57.531513,880000
|
| 78 |
+
0.64904034,262.63193,0.0036440473,-0.011081178,-15.540898,0.14113033,-262.57532,262.762,1.2622297,3.8852978,-57.618084,-263.7565,-301.86826,5.1475277,2.0148263,-2.0418425,72.76189,885000
|
| 79 |
+
0.66686904,257.7063,0.003370074,0.0040569217,-11.296192,0.18583782,-257.66827,257.8962,1.4001695,2.931129,-100.22185,-258.3873,-302.1135,4.3312984,0.8963166,-0.87369686,64.19837,890000
|
| 80 |
+
0.66846687,261.21484,0.003716214,-0.0041712783,-13.622454,0.15039398,-261.16425,261.36105,1.42408,3.8545258,-58.864037,-261.8497,-302.00986,5.278606,0.5176733,-0.8860972,60.892822,895000
|
| 81 |
+
0.6616928,260.28625,0.0033758853,0.0017230834,-11.989591,0.18185063,-260.2458,260.46982,1.0287497,5.0489364,-100.2207,-260.7898,-301.86118,6.0776863,3.8054667,-3.364719,102.93163,900000
|
| 82 |
+
0.6607762,261.81195,0.0033868994,0.0045329384,-11.161626,0.19677435,-261.77414,262.01328,1.3420513,2.680408,-100.22532,-262.45126,-301.9041,4.022459,0.4306695,-0.49891794,51.281128,905000
|
| 83 |
+
0.6591948,261.89047,0.0032551696,-0.002847218,-13.374676,0.16035116,-261.84692,262.04797,1.0049092,3.9302957,-100.32098,-263.2369,-302.17883,4.935205,0.44956487,-0.48775324,53.508183,910000
|
| 84 |
+
0.6646911,254.03027,0.0032549894,0.0015933082,-12.010503,0.18312363,-253.99118,254.21498,0.94391555,2.6857595,-100.24098,-254.69376,-302.22104,3.6296751,0.38873577,-0.5574588,46.66717,915000
|
| 85 |
+
0.6550456,261.82407,0.0034827136,-0.0018453855,-13.02987,0.14818305,-261.7787,261.97043,1.5327252,2.7634144,-100.26288,-262.33023,-302.13095,4.2961397,0.3025517,-0.2753719,47.400536,920000
|
| 86 |
+
0.64301986,263.792,0.0032643822,-0.004605982,-13.910981,0.1737886,-263.74658,263.96118,1.119194,3.8596017,-100.06816,-264.1212,-302.46982,4.978796,0.43353498,-0.635875,69.33059,925000
|
| 87 |
+
0.6405682,259.21338,0.0033984305,-0.006373574,-14.375446,0.1684061,-259.1645,259.3754,1.2560793,4.198245,-100.2315,-260.05942,-301.99396,5.4543242,0.35991946,-0.4241051,60.18328,930000
|
| 88 |
+
0.659425,257.3658,0.0030532745,0.0057108547,-10.629597,0.18215698,-257.33334,257.55368,1.8099288,2.849876,-100.13437,-258.04395,-301.86725,4.659805,0.4479385,-0.45597848,52.865494,935000
|
| 89 |
+
0.668947,255.81494,0.0033168374,-0.00049985875,-12.650703,0.19116437,-255.77298,256.0056,1.8097489,3.2686841,-100.2608,-256.47565,-301.8953,5.078433,0.52237636,-0.5262101,58.495743,940000
|
| 90 |
+
0.67086303,250.86426,0.003449901,0.005241545,-10.980668,0.14667575,-250.82637,251.01619,1.8482136,3.2666566,-45.504993,-251.88394,-301.8986,5.11487,0.5782371,-0.37540194,59.916058,945000
|
| 91 |
+
0.6692862,256.6159,0.003446016,0.008727638,-9.967325,0.1828635,-256.58154,256.8075,0.77006304,4.6359344,-100.29463,-257.49756,-301.81592,5.4059973,0.79986614,-1.3263894,48.205376,950000
|
| 92 |
+
0.6632227,259.28906,0.0034777797,0.003302885,-11.550289,0.17131753,-259.24893,259.46368,1.2018646,2.635976,-100.29667,-260.0095,-301.98438,3.8378406,0.3772642,-0.4393739,45.591316,955000
|
| 93 |
+
0.6635672,249.6278,0.0032623268,0.0074428893,-10.2185335,0.16292073,-249.59448,249.79817,1.1667366,2.8812551,-100.169495,-250.52197,-301.71265,4.0479918,0.4839263,-0.28421694,47.26676,960000
|
| 94 |
+
0.6578454,253.80338,0.0032295156,-2.3013059e-05,-12.507126,0.18230997,-253.76299,253.98566,1.3159975,2.949149,-100.25543,-254.31084,-301.89313,4.2651463,0.37375084,-0.3230095,49.35797,965000
|
| 95 |
+
0.65563077,257.8425,0.0033530528,-0.0032277917,-13.462643,0.1692284,-257.79733,258.00848,1.2426844,2.6231441,-99.64882,-258.79224,-301.9296,3.8658285,0.36780477,-0.42535925,43.829018,970000
|
| 96 |
+
0.66448766,253.32779,0.0031828461,0.0019235563,-11.895649,0.15422365,-253.28992,253.48393,1.1299638,2.8972435,-100.2213,-253.76973,-301.96,4.0272074,0.4436818,-0.3324184,44.530373,975000
|
| 97 |
+
0.67096025,262.0478,0.0032576555,0.0052718343,-10.881709,0.16283634,-262.0124,262.2159,1.097958,4.4795427,-100.242096,-263.06177,-301.80212,5.577501,0.81732154,-1.0260156,63.47316,980000
|
| 98 |
+
0.65371263,261.46448,0.0034228938,-0.0033714545,-13.484972,0.16992252,-261.4183,261.63104,0.9755501,3.0850713,-100.239426,-262.37802,-301.9889,4.0606213,0.3768756,-0.37279937,44.370087,985000
|
| 99 |
+
0.6475131,254.62534,0.003390074,-0.0015821914,-12.966713,0.16861197,-254.58138,254.79236,1.3092974,4.2092037,-100.25667,-255.42705,-301.78094,5.5185013,1.4193403,-1.5999489,59.263725,990000
|
| 100 |
+
0.66602886,253.32042,0.0031676088,-0.00065718964,-12.707472,0.1731353,-253.28018,253.4929,1.0007268,2.7954175,-100.11356,-253.89241,-301.8325,3.7961445,0.41382098,-0.39672512,50.639988,995000
|
| 101 |
+
0.64553696,260.55115,0.0031723627,-0.008678066,-15.235521,0.14429584,-260.5028,260.68677,1.1913785,3.8330712,-99.25356,-261.5567,-301.85995,5.02445,0.7915227,-0.64243615,53.116688,1000000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c02ec91cf4e960c6e7612b68c1af61f2a1f944f4ce3ee96731e4e134db14391
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e17e0bf45f07965c7a9653c21f84fff9a3fe161609ddada0a65e44a10e58c02f
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ea4ed04d3b3135c5536341791d2ac44345a7ac647db175d620356fe00f040cb
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a57f99183897806da596de00ee4bb672b3b6224023435bfa287ed8ff16e37d4f
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5594ee2bd89bb5348e70d83c0286593b9269b3241d76510e02cfc8e61bc53e0f
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09afb8a5d58516d1af28d2d4f3695da2c247f2f1972ad11fefbdcbc3cd80f64b
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f5639e836bba3f36e9aa9ccb2f8f028ff6e656d44de9e57e22b8f4f2ae5bf95
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a5f03b0bae4f138830964374ae8fc9cd7f88993eb784294c4a90b6e78a10306
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f529bf143c286332c6b273cf3ab33d1d0d2a0489824ca8e7553d54d36625cc1c
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e887770d98d1f9ec5fbed62c9b199956f14e8517dba7374a550909a620bbec0f
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_074652/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/3o5fxwg8
|