Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.04118899412200606,0.0126889824613511,-0.040163276135288264,0.00815200025987197,23.07244607375266,18.6649999999984,0.5,9382.5,-0.7,-573.68,371.3,1.099103274345398,550000
|
| 3 |
+
0.0,0.0,-0.030008135939328204,-0.008992048154185616,-0.02940379557595182,0.006081800025782102,32.23302840129734,10.930999999999829,0.92,25122.68,-0.12,-313.44,216.62,0.6794412136077881,600000
|
| 4 |
+
0.0,0.0,-0.030655312772033726,-0.007770752275463481,-0.030719980852969155,-0.007077243136107773,31.013317776921337,9.820999999999652,0.92,35472.82,-0.1,-301.34,194.42,0.6020046949386597,650000
|
| 5 |
+
0.0,0.0,-0.022277000024816255,-0.010152697204534019,-0.021712389077348477,0.005571788114446964,32.022539921324395,8.249999999999448,0.92,45696.9,-0.12,-245.14,163.0,0.5121483945846558,700000
|
| 6 |
+
0.0,0.0,-0.030366678413727886,0.016975351690244347,-0.029337681349004552,0.0002898189709438615,33.81626139018056,6.886999999999804,1.0,53091.9,0.0,-202.86,135.74,0.4372579526901245,750000
|
| 7 |
+
0.0,0.0,-0.03705550732976782,0.010969012663494064,-0.036090268912330296,0.01965238535633766,33.41510835207034,6.304999999999662,0.98,59755.5,-0.04,-187.04,124.1,0.39975503921508787,800000
|
| 8 |
+
0.0,0.0,-0.02582120554042293,0.022628906769459077,-0.02347838504052851,0.015197291693341358,34.2225851725096,5.65499999999968,1.0,66064.06,0.0,-158.24,111.1,0.3536501884460449,850000
|
| 9 |
+
0.0,0.0,-0.02988204309452312,0.03504399075637713,-0.02658861099854311,0.028378065098748604,34.36298558388296,5.2039999999997475,0.98,71693.1,-0.04,-155.92,102.08,0.32357211589813234,900000
|
| 10 |
+
0.0,0.0,-0.01815278196485292,0.0364075582516158,-0.014275734256644189,0.034594579158593625,34.737793711264416,4.984999999999847,1.0,76745.16,0.0,-141.96,97.7,0.3137067842483521,950000
|
| 11 |
+
0.0,0.0,-0.04011082043855026,0.04676692625521386,-0.035306355804275026,0.03810357218451373,35.78219430991396,4.55499999999974,0.98,81322.82,-0.04,-138.2,89.1,0.2878027534484863,1000000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.04118899412200606,0.0126889824613511,-0.040163276135288264,0.00815200025987197,23.07244607375266,18.6649999999984,0.5,9382.5,-0.7,-573.68,371.3,1.099103274345398,550000
|
| 3 |
+
0.0,0.0,-0.030008135939328204,-0.008992048154185616,-0.02940379557595182,0.006081800025782102,32.23302840129734,10.930999999999829,0.92,25122.68,-0.12,-313.44,216.62,0.6794412136077881,600000
|
| 4 |
+
0.0,0.0,-0.030655312772033726,-0.007770752275463481,-0.030719980852969155,-0.007077243136107773,31.013317776921337,9.820999999999652,0.92,35472.82,-0.1,-301.34,194.42,0.6020046949386597,650000
|
| 5 |
+
0.0,0.0,-0.022277000024816255,-0.010152697204534019,-0.021712389077348477,0.005571788114446964,32.022539921324395,8.249999999999448,0.92,45696.9,-0.12,-245.14,163.0,0.5121483945846558,700000
|
| 6 |
+
0.0,0.0,-0.030366678413727886,0.016975351690244347,-0.029337681349004552,0.0002898189709438615,33.81626139018056,6.886999999999804,1.0,53091.9,0.0,-202.86,135.74,0.4372579526901245,750000
|
| 7 |
+
0.0,0.0,-0.03705550732976782,0.010969012663494064,-0.036090268912330296,0.01965238535633766,33.41510835207034,6.304999999999662,0.98,59755.5,-0.04,-187.04,124.1,0.39975503921508787,800000
|
| 8 |
+
0.0,0.0,-0.02582120554042293,0.022628906769459077,-0.02347838504052851,0.015197291693341358,34.2225851725096,5.65499999999968,1.0,66064.06,0.0,-158.24,111.1,0.3536501884460449,850000
|
| 9 |
+
0.0,0.0,-0.02988204309452312,0.03504399075637713,-0.02658861099854311,0.028378065098748604,34.36298558388296,5.2039999999997475,0.98,71693.1,-0.04,-155.92,102.08,0.32357211589813234,900000
|
| 10 |
+
0.0,0.0,-0.01815278196485292,0.0364075582516158,-0.014275734256644189,0.034594579158593625,34.737793711264416,4.984999999999847,1.0,76745.16,0.0,-141.96,97.7,0.3137067842483521,950000
|
| 11 |
+
0.0,0.0,-0.04011082043855026,0.04676692625521386,-0.035306355804275026,0.03810357218451373,35.78219430991396,4.55499999999974,0.98,81322.82,-0.04,-138.2,89.1,0.2878027534484863,1000000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.64115906,151.47078,0.007386628,-0.007391362,-13.500641,0.20737827,-151.37106,151.67078,1.2843298,5.668552,-64.38984,-154.08745,-193.75743,6.952882,3.0530581,-3.6793885,86.52069,505000
|
| 3 |
+
0.6339626,146.44354,0.007594293,-0.0062137167,-13.318209,0.22775419,-146.3424,146.66508,1.2882642,6.92341,-38.577126,-149.4335,-193.88535,8.211674,7.7369285,-8.084668,108.05992,510000
|
| 4 |
+
0.64343643,147.0672,0.007893995,-0.004922801,-13.123613,0.17129043,-146.96361,147.23357,2.2667286,6.117712,-43.359303,-150.11943,-194.26614,8.38444,1.3815638,-1.457663,77.939766,515000
|
| 5 |
+
0.6348855,146.98833,0.008041692,-0.023220178,-15.387474,0.17793922,-146.8646,147.14304,2.9864728,7.5639853,-43.83824,-150.3148,-199.34526,10.550458,2.8655946,-2.9862332,120.974106,520000
|
| 6 |
+
0.641117,146.32503,0.008095764,-0.006708396,-13.32863,0.17509739,-146.21713,146.49341,1.5349731,4.640433,-67.05228,-148.67873,-200.2801,6.175406,1.5605819,-1.620509,62.746082,525000
|
| 7 |
+
0.6456789,147.08755,0.008358137,-0.004993316,-13.09742,0.18527916,-146.97809,147.26784,1.679381,8.674501,-71.71513,-149.09476,-197.54333,10.353883,4.290274,-3.790325,113.91197,530000
|
| 8 |
+
0.6446261,146.25348,0.008449667,0.0065145316,-11.729019,0.20550552,-146.15439,146.4655,2.3890655,5.971564,-10.356891,-148.33012,-196.67082,8.360629,4.2360697,-3.3920007,105.041275,535000
|
| 9 |
+
0.6427683,144.7363,0.008248501,-0.006417451,-13.278014,0.16864687,-144.62677,144.89851,1.9592234,6.3229156,-50.283974,-148.15141,-197.61981,8.282139,1.3531208,-1.3228661,80.83486,540000
|
| 10 |
+
0.64484876,144.43185,0.00811409,0.008168026,-11.493353,0.19654348,-144.3386,144.63657,1.5880466,4.8051257,-10.0128565,-146.67809,-195.76237,6.3931723,2.4507732,-2.0494816,79.54104,545000
|
| 11 |
+
0.64234865,145.92404,0.008243834,-0.005037926,-13.1111145,0.16126022,-145.81598,146.08026,3.330298,6.152203,-48.617844,-148.6548,-194.54846,9.482501,4.1068172,-2.9974964,95.90861,550000
|
| 12 |
+
0.6460353,142.74915,0.008634192,-0.0015792222,-12.682903,0.19269416,-142.63965,142.94026,3.7884634,5.769195,-28.90694,-145.98547,-196.93689,9.557658,1.2918088,-1.4878584,105.38553,555000
|
| 13 |
+
0.63429195,141.4096,0.008779337,-0.017772846,-14.524395,0.19187321,-141.28209,141.58371,2.6731832,7.648492,-39.34383,-145.10806,-200.81065,10.321675,3.0612304,-2.7132392,113.05782,560000
|
| 14 |
+
0.64231414,144.02728,0.008691635,-0.009078971,-13.544564,0.18215942,-143.90956,144.20036,2.4178088,6.113767,-43.525066,-146.55074,-200.34581,8.531576,2.5636225,-1.5186279,73.669205,565000
|
| 15 |
+
0.6447574,137.66486,0.008583827,-0.010066728,-13.672755,0.17831327,-137.54749,137.8331,2.2618847,7.22179,-11.628499,-140.43489,-200.0928,9.483675,4.0483956,-3.139135,98.654854,570000
|
| 16 |
+
0.6436528,142.67892,0.008827754,-0.0027889137,-12.815926,0.20173123,-142.56578,142.87787,2.8914192,9.007509,-46.497932,-145.27505,-201.5458,11.898929,5.2609453,-6.910512,106.26834,575000
|
| 17 |
+
0.63899916,143.19916,0.008837893,-7.2737707e-06,-12.500823,0.167225,-143.08868,143.36638,2.818138,8.25191,-35.912388,-145.79196,-199.15706,11.070048,0.92026836,-1.0327636,90.19783,580000
|
| 18 |
+
0.6419296,141.8727,0.00857744,-0.0018275453,-12.713064,0.1797099,-141.76364,142.05057,4.276029,6.369999,-8.433832,-144.4842,-200.77174,10.6460285,1.3477923,-0.8554929,102.399475,585000
|
| 19 |
+
0.6439789,139.64272,0.008863692,-0.003754011,-12.923527,0.1724695,-139.52817,139.81143,5.967512,7.6569138,-33.82739,-142.17711,-196.76157,13.624426,3.7755635,-3.310035,151.81973,590000
|
| 20 |
+
0.64494663,139.93678,0.0088800555,0.014401949,-10.878169,0.16089192,-139.84018,140.11208,2.336083,9.818218,-28.585882,-141.99962,-199.2035,12.154301,5.741296,-5.3604817,130.14995,595000
|
| 21 |
+
0.6363981,134.50568,0.009158833,-0.0043596467,-12.976005,0.18827137,-134.38684,134.68959,3.2637613,6.6005855,-21.93687,-137.59024,-202.10756,9.8643465,1.7697905,-2.1444068,94.52597,600000
|
| 22 |
+
0.6441658,136.3682,0.009171406,0.014429367,-10.926701,0.1753734,-136.26797,136.558,4.008087,10.110026,-11.957599,-139.82542,-198.54527,14.1181135,2.4859831,-2.7199538,136.63719,605000
|
| 23 |
+
0.6403731,134.95474,0.0094042905,-0.010239988,-13.588863,0.1806503,-134.82697,135.12515,4.0667987,8.847638,-29.173996,-138.15694,-197.57422,12.914436,6.6367683,-6.1972256,187.21164,610000
|
| 24 |
+
0.63297796,133.50348,0.009349223,-0.005505736,-13.088898,0.15617536,-133.3811,133.65414,3.6416008,11.429552,1.4101886,-137.55368,-193.80833,15.071153,5.625752,-8.299414,181.17354,615000
|
| 25 |
+
0.6486115,134.75137,0.009205787,0.008244417,-11.604431,0.167775,-134.64453,134.92738,5.048521,11.450105,-12.254368,-137.25763,-200.97305,16.498627,5.9612594,-5.5254593,171.50844,620000
|
| 26 |
+
0.6395136,138.87225,0.009168005,-0.017408801,-14.398865,0.16372126,-138.74023,139.01857,5.343843,9.951118,-30.373798,-142.23051,-196.19778,15.294962,2.2793245,-2.1188529,112.97597,625000
|
| 27 |
+
0.64853805,135.02846,0.009318856,0.0052619944,-11.935339,0.15332152,-134.91724,135.18704,3.3581185,13.325172,-10.540414,-138.83316,-194.98886,16.68329,5.1118946,-5.8192654,187.32108,630000
|
| 28 |
+
0.63602746,134.45956,0.009252541,-0.014728404,-14.091823,0.16132674,-134.32918,134.60617,3.2329087,14.2916975,1.3294272,-138.13802,-195.75775,17.524607,6.2808785,-5.081433,169.0971,635000
|
| 29 |
+
0.6428751,131.48181,0.009370093,-0.0052017807,-13.055147,0.1730569,-131.35947,131.64966,2.6979663,6.615207,-21.667759,-134.86255,-196.23466,9.313173,2.7118027,-2.8213317,92.15067,640000
|
| 30 |
+
0.6517114,135.40875,0.0091324225,0.0116454465,-11.224824,0.16311523,-135.30624,135.58351,2.3112652,8.3381,-26.615433,-138.07397,-196.4741,10.649365,6.9738665,-5.201306,147.86319,645000
|
| 31 |
+
0.65049344,134.02136,0.0091923075,0.0104005635,-11.368558,0.18699738,-133.91687,134.21877,2.8191113,7.9507446,-9.304501,-135.49846,-200.76456,10.7698555,0.87516975,-1.2975373,114.70554,650000
|
| 32 |
+
0.6449049,134.02374,0.009412576,-0.0023583146,-12.750549,0.20122546,-133.90372,134.22261,2.7104175,8.811869,-31.305737,-136.88062,-194.90517,11.522286,1.8450334,-1.5847001,119.120995,655000
|
| 33 |
+
0.65416074,134.90305,0.0095208995,0.016173443,-10.80127,0.17845346,-134.8002,135.09767,5.4858713,9.056722,-19.039583,-137.9423,-200.76524,14.542593,6.9566927,-7.0370903,222.50443,660000
|
| 34 |
+
0.6370696,134.69511,0.009200754,-0.013553513,-13.973087,0.17757602,-134.56654,134.85915,3.1671886,8.536143,-1.1609197,-137.52252,-201.96115,11.703332,3.1009386,-4.456216,126.51463,665000
|
| 35 |
+
0.6458094,131.64905,0.009263303,0.02425207,-9.88192,0.16919476,-131.55753,131.84248,5.374736,10.336391,-6.822313,-133.95976,-196.71642,15.711127,3.2583513,-9.397792,237.86166,670000
|
| 36 |
+
0.64216083,136.21114,0.009453657,0.0045897355,-12.014502,0.1942154,-136.09755,136.40994,3.5501525,10.264066,-13.428291,-138.71599,-201.27003,13.8142185,3.697692,-3.2114873,198.98575,675000
|
| 37 |
+
0.6503367,132.29012,0.009311131,0.012868933,-11.117898,0.1597037,-132.1866,132.46268,2.4531476,10.356818,2.8817103,-135.01674,-195.26976,12.809966,3.4607196,-3.246385,141.92047,680000
|
| 38 |
+
0.63346547,133.63782,0.009470378,-0.024828682,-15.12172,0.17196274,-133.4946,133.78496,4.0854845,8.524919,-6.8006654,-137.17593,-193.92587,12.610403,0.8233037,-0.98874557,105.81446,685000
|
| 39 |
+
0.6446504,130.78423,0.009343038,0.01324394,-11.08248,0.15642238,-130.6807,130.95389,3.8897934,9.663524,-8.585822,-133.85399,-202.56334,13.553317,5.49211,-6.5613713,193.58682,690000
|
| 40 |
+
0.63896537,129.99953,0.009502844,-0.009468913,-13.496429,0.19615252,-129.87128,130.1862,3.0962682,11.695128,-1.6998159,-132.74297,-194.4358,14.791397,5.7970085,-5.167028,144.89662,695000
|
| 41 |
+
0.63686043,132.90869,0.009477263,-0.0092943655,-13.480701,0.1886166,-132.78091,133.08801,6.014976,10.530792,-22.538824,-136.23236,-200.37578,16.545769,1.5310786,-2.0966198,154.85837,700000
|
| 42 |
+
0.6399312,130.80818,0.009664157,-0.00656904,-13.179732,0.17355326,-130.68082,130.97516,8.812982,14.992879,-4.0062456,-133.8695,-196.51001,23.80586,5.280988,-5.4753504,254.1319,705000
|
| 43 |
+
0.63378364,130.42291,0.0097146435,-0.0045918724,-12.972675,0.16108356,-130.29689,130.5794,3.10216,9.329264,-19.811361,-133.40953,-198.83632,12.431423,4.1620636,-1.753137,130.59998,710000
|
| 44 |
+
0.6494521,130.47012,0.009513267,0.003691751,-12.111937,0.17453521,-130.35489,130.64835,2.8536537,9.036019,-6.046004,-132.59647,-201.63753,11.889673,2.8878353,-2.7299511,121.02315,715000
|
| 45 |
+
0.63751924,128.94087,0.009495959,0.0004991515,-12.447435,0.1709806,-128.82266,129.11235,2.7440877,10.132121,-15.233045,-132.01883,-203.34052,12.876209,2.5892663,-3.4068785,113.636925,720000
|
| 46 |
+
0.63608587,125.13534,0.009639305,0.0042457213,-12.059541,0.15226942,-125.01909,125.29185,3.0672326,12.592521,-5.66239,-128.0989,-192.41238,15.659754,1.830749,-1.8175281,123.68656,725000
|
| 47 |
+
0.6481874,130.2086,0.009423355,0.014987386,-10.909549,0.20120822,-130.1058,130.42479,4.10511,9.548141,-9.315554,-133.3861,-200.31711,13.653251,2.308039,-1.867134,122.67647,730000
|
| 48 |
+
0.6401909,128.1512,0.009587195,-0.011452361,-13.694548,0.18353856,-128.01991,128.32327,3.3128114,9.980926,-8.273938,-131.01846,-191.5406,13.293737,3.3038483,-3.7900805,127.10757,735000
|
| 49 |
+
0.6543422,125.632645,0.009379869,0.0068577304,-11.768888,0.14226973,-125.52225,125.78178,3.4949837,8.317082,0.7344019,-128.73317,-199.19594,11.812066,1.7023914,-0.9026097,101.38617,740000
|
| 50 |
+
0.6469857,126.99939,0.009337007,-0.001142042,-12.6223135,0.1494716,-126.88154,127.14772,3.6622016,10.625549,-4.6786838,-129.92085,-205.61522,14.287751,4.3080053,-4.838219,130.03244,745000
|
| 51 |
+
0.6416046,121.11925,0.009281994,0.00056796195,-12.43881,0.14800216,-121.003784,121.267815,5.2783923,13.970772,-1.1186365,-124.62206,-202.39465,19.249165,2.722152,-2.7329423,212.81836,750000
|
| 52 |
+
0.65340817,129.89816,0.009302744,0.0060321237,-11.851576,0.16234894,-129.78792,130.06654,3.723863,8.804921,2.0030198,-132.88872,-199.9468,12.528784,3.870852,-3.5189717,138.11124,755000
|
| 53 |
+
0.6475883,126.73375,0.009519633,-0.0040962594,-12.930296,0.1884712,-126.610664,126.91812,3.348128,10.320706,2.3890426,-129.83727,-188.40704,13.668835,1.7519842,-1.881941,125.45193,760000
|
| 54 |
+
0.64391804,125.1855,0.009422811,0.0040838923,-12.066595,0.1768919,-125.0718,125.36648,2.9711025,10.100297,-3.8676596,-128.21713,-193.67088,13.0714,1.8664325,-2.7640946,113.72586,765000
|
| 55 |
+
0.6420822,128.57314,0.009316932,-0.0032667231,-12.850622,0.17318459,-128.45341,128.74306,7.376024,9.565112,-11.459131,-131.29901,-198.26384,16.941135,6.531716,-6.013642,298.45206,770000
|
| 56 |
+
0.6406972,123.877045,0.009575874,-0.0067146528,-13.201205,0.17665374,-123.750626,124.04698,3.1382947,10.020911,-14.770311,-126.85561,-197.53236,13.159206,1.0711468,-0.781445,116.921425,775000
|
| 57 |
+
0.63243484,123.741714,0.00928333,-0.016671404,-14.295843,0.17305627,-123.60901,123.8981,3.9745483,12.430615,-4.8354936,-127.31313,-197.9491,16.405163,4.884416,-4.679324,147.10388,780000
|
| 58 |
+
0.6465733,122.78073,0.009317638,-0.0038751813,-12.915897,0.1692524,-122.660385,122.946106,3.0946367,6.60384,-3.4745245,-124.74153,-201.23607,9.698477,0.88683355,-0.6646373,91.36621,785000
|
| 59 |
+
0.63916713,120.31384,0.009533852,-0.0021078605,-12.721092,0.17329103,-120.192566,120.48503,5.24846,10.563865,-8.61488,-123.15566,-198.66965,15.812325,1.2715528,-1.1284006,123.277534,790000
|
| 60 |
+
0.64890516,121.77678,0.0092748795,0.011753432,-11.232767,0.15371849,-121.67259,121.94225,4.095108,11.039172,1.0874373,-124.26125,-195.86133,15.13428,2.8280551,-5.6451206,176.46153,795000
|
| 61 |
+
0.637367,124.09254,0.009339243,-0.0036530495,-12.89115,0.15591718,-123.972145,124.2448,4.2530627,8.901825,-8.814355,-127.239746,-196.4571,13.154888,2.2850523,-2.037319,121.42115,800000
|
| 62 |
+
0.6443135,123.790504,0.009473296,-0.0021175279,-12.723526,0.15993667,-123.669975,123.94832,3.3667035,13.746569,-3.625892,-127.050316,-196.08029,17.113272,1.3697973,-1.3131655,154.15573,805000
|
| 63 |
+
0.65009594,119.774254,0.009438396,0.0044958796,-12.023661,0.16341773,-119.66077,119.94216,4.326635,12.567731,-5.9381337,-123.12648,-198.67242,16.894365,3.9336452,-3.8251333,202.73671,810000
|
| 64 |
+
0.6424965,121.031784,0.009450858,0.004897308,-11.981813,0.17728186,-120.91855,121.21397,2.5704005,11.462024,-6.761825,-123.30725,-190.32983,14.032424,1.9068158,-2.0599833,149.21323,815000
|
| 65 |
+
0.63710713,120.56851,0.009610647,0.0016643866,-12.326818,0.1593282,-120.45005,120.7295,3.6971073,23.16978,-5.9290733,-124.06866,-203.9021,26.866888,4.5873737,-5.077392,261.38492,820000
|
| 66 |
+
0.6462773,122.87613,0.009500107,-0.0008346895,-12.587861,0.15695092,-122.75654,123.03225,2.67559,11.320803,-3.6617436,-125.7409,-200.66006,13.996393,2.1536672,-3.091761,136.16693,825000
|
| 67 |
+
0.6393799,115.25131,0.009541907,0.010506294,-11.3989315,0.1729065,-115.14255,115.43472,3.154124,11.03641,-7.131429,-117.55519,-197.11263,14.190535,1.5667274,-1.6702949,115.54337,830000
|
| 68 |
+
0.6440687,117.645775,0.009408264,0.009135575,-11.528984,0.17701219,-117.53731,117.83192,3.2160847,9.205414,-4.3175673,-120.474815,-196.9428,12.421498,5.246868,-5.2474213,150.49692,835000
|
| 69 |
+
0.6495659,122.84931,0.009444281,0.010233113,-11.416475,0.18673888,-122.74149,123.04628,3.3032746,10.260089,-7.213843,-125.866165,-192.41402,13.563364,2.3875465,-1.7395334,129.38898,840000
|
| 70 |
+
0.63684666,122.48055,0.009685291,-0.018351672,-14.394798,0.15852027,-122.34113,122.62073,2.598279,14.521106,-4.0492835,-125.513405,-197.03293,17.119385,6.9928565,-6.6658516,179.26176,845000
|
| 71 |
+
0.6416665,115.96068,0.009498726,0.0178901,-10.616579,0.15444508,-115.85983,116.13301,3.6024914,8.620467,-1.6335251,-118.515236,-200.45207,12.222959,4.012233,-4.9722614,156.00189,850000
|
| 72 |
+
0.64871114,120.02832,0.009413901,0.0088048475,-11.564697,0.14782083,-119.91945,120.184944,8.662666,10.341872,-4.0812445,-122.81695,-197.22516,19.00454,3.161993,-3.0323794,185.94951,855000
|
| 73 |
+
0.63883734,117.57738,0.00943554,-0.0003626818,-12.538438,0.15350541,-117.459076,117.730515,5.0954847,14.271598,-1.9055194,-120.51843,-194.0712,19.367083,2.5982742,-2.7737124,201.2472,860000
|
| 74 |
+
0.63888824,118.8931,0.009444101,-0.011681465,-13.736906,0.16070572,-118.76337,119.04212,2.605388,10.990046,-0.29166335,-121.41976,-199.57327,13.595433,2.945791,-2.4275472,147.84744,865000
|
| 75 |
+
0.64641494,119.32585,0.009415575,-0.006529015,-13.193427,0.14087653,-119.20163,119.4602,5.7958508,15.635269,-4.724848,-122.34292,-198.32414,21.43112,9.879428,-10.589703,228.91516,870000
|
| 76 |
+
0.6491601,112.93011,0.0097892815,0.0008001889,-12.418259,0.144052,-112.80854,113.07496,2.9193199,10.488506,1.3696377,-116.29241,-194.88577,13.407826,3.2304866,-3.0692139,177.84384,875000
|
| 77 |
+
0.64649564,114.27639,0.009640454,0.020963311,-10.325485,0.15488006,-114.17685,114.45223,3.904085,9.3024435,0.57135075,-117.50402,-195.83545,13.206529,1.9796354,-1.5406276,141.93921,880000
|
| 78 |
+
0.6455101,119.22926,0.009321593,-0.0049662488,-13.032768,0.12464798,-119.10778,119.348946,3.356363,10.258151,-2.5418446,-122.430786,-201.86865,13.614514,1.5661674,-1.6245717,114.233734,885000
|
| 79 |
+
0.6371798,122.80914,0.009370343,-0.010477714,-13.618178,0.17730519,-122.68154,122.975975,3.7526207,10.953334,-4.2014294,-125.22351,-203.13278,14.705955,1.7949674,-1.1990622,130.48651,890000
|
| 80 |
+
0.6414218,117.12268,0.009573294,-0.008928356,-13.4326315,0.1325323,-116.994095,117.246284,7.0479097,12.575999,-2.6929233,-120.310135,-195.81969,19.623909,3.558292,-2.649505,222.62866,895000
|
| 81 |
+
0.6408136,114.70831,0.00928511,-0.012335922,-13.82857,0.16886692,-114.57991,114.864845,5.479026,12.507359,-2.3703885,-117.82826,-197.88046,17.986385,7.713042,-7.81921,183.21956,900000
|
| 82 |
+
0.64120543,117.89312,0.0095293205,0.013899967,-11.0413475,0.16801552,-117.787895,118.075035,4.820117,11.63515,-3.3836436,-120.715675,-199.40741,16.455267,1.5992495,-1.3222691,151.39867,905000
|
| 83 |
+
0.64592564,121.51994,0.0095179,-0.0022765058,-12.7391815,0.14761661,-121.3987,121.66528,4.91865,11.571672,7.243404,-124.25183,-201.00058,16.490322,4.934762,-4.90159,198.85747,910000
|
| 84 |
+
0.65647995,114.81821,0.009766697,0.0012573489,-12.371262,0.16875248,-114.69738,114.98822,3.4133675,9.5693865,-1.3751962,-117.55005,-194.19745,12.982754,2.2836144,-2.0160208,141.97025,915000
|
| 85 |
+
0.64578134,117.678055,0.009541201,-0.0044967784,-12.971301,0.16405153,-117.5543,117.837616,4.569065,10.270363,-2.868859,-120.38928,-198.004,14.839428,3.2167072,-3.0077124,139.04904,920000
|
| 86 |
+
0.64717245,113.64228,0.009463928,-0.006794382,-13.217924,0.14366406,-113.51718,113.779144,5.0050693,17.51408,0.06483639,-117.33633,-201.9487,22.51915,4.8363285,-3.9367647,210.68793,925000
|
| 87 |
+
0.6556228,114.401245,0.009435162,0.014645135,-10.947813,0.14739919,-114.29796,114.56329,3.0109458,8.561332,-4.094603,-116.87925,-203.1488,11.572277,1.0943211,-1.3321385,116.714325,930000
|
| 88 |
+
0.6595001,116.578,0.009641636,0.023274528,-10.08604,0.16877814,-116.48076,116.77006,4.1667366,12.217608,-6.0564957,-118.79618,-202.37694,16.384346,3.2843807,-2.8842525,158.62328,935000
|
| 89 |
+
0.64175683,112.41008,0.009440913,-0.010032266,-13.562637,0.19525327,-112.28204,112.5953,5.6239963,10.909836,-1.0641075,-115.5169,-201.6677,16.533833,6.1284795,-3.6818862,215.45636,940000
|
| 90 |
+
0.6470103,115.78818,0.009609278,0.0029855426,-12.189306,0.15507972,-115.67105,115.94624,3.5520966,9.21227,5.078501,-119.22228,-196.35178,12.764366,1.2940526,-1.2713069,129.78502,945000
|
| 91 |
+
0.64584637,112.18138,0.009572002,0.0009818876,-12.397421,0.1757039,-112.06271,112.35807,5.085865,11.219294,-6.930212,-115.69,-197.56198,16.305159,2.827618,-3.0576813,185.97943,950000
|
| 92 |
+
0.6429365,114.632645,0.009526118,-0.008232023,-13.364153,0.1510723,-114.50533,114.77548,4.273542,10.166087,-2.4667594,-117.468765,-194.1475,14.439629,2.3866143,-2.7430317,146.55641,955000
|
| 93 |
+
0.6426695,113.780045,0.009461978,-0.0075667873,-13.299705,0.15507652,-113.6542,113.92755,4.492087,13.244295,-3.0991054,-116.22095,-200.17648,17.736382,5.164081,-5.032467,204.30852,960000
|
| 94 |
+
0.6469474,111.39033,0.009804824,0.009335442,-11.547873,0.16244766,-111.2771,111.56211,4.219217,9.205934,-2.2469501,-114.551895,-202.24544,13.42515,1.0681547,-1.4270226,112.53923,965000
|
| 95 |
+
0.64476967,109.80739,0.009678287,0.01631963,-10.813789,0.17435864,-109.70273,109.99807,3.6924608,13.060326,-6.93413,-112.35186,-197.67938,16.752787,2.3390026,-2.3840513,153.21286,970000
|
| 96 |
+
0.6487332,111.198425,0.009741454,0.0055994764,-11.925191,0.14091155,-111.08226,111.34494,7.4732056,21.624422,0.9021272,-114.31066,-203.17764,29.097628,6.4860435,-8.222426,282.0349,975000
|
| 97 |
+
0.63769406,114.44853,0.0095910765,-0.019059092,-14.487169,0.14898652,-114.30957,114.57846,5.2746615,11.539787,1.5297862,-118.058205,-188.22485,16.81445,3.8123424,-4.3512263,195.09262,980000
|
| 98 |
+
0.64049834,113.83164,0.009647656,0.00052204897,-12.4458885,0.14947167,-113.71157,113.981636,4.67142,12.702911,-5.5749316,-115.94297,-193.79695,17.374332,2.9837499,-2.6974895,167.11714,985000
|
| 99 |
+
0.6462904,112.9897,0.009707484,0.002975839,-12.193449,0.14664578,-112.87133,113.13932,4.781112,11.211001,-3.204215,-115.05391,-200.40112,15.992113,2.8311548,-2.9297924,214.21262,990000
|
| 100 |
+
0.63646966,106.66548,0.009640096,-0.01213801,-13.759117,0.1621923,-106.53285,106.81554,14.406348,16.549025,-0.38510764,-110.42413,-205.37886,30.955372,3.7113402,-5.122575,263.7284,995000
|
| 101 |
+
0.63828653,107.92594,0.009692868,-0.0032843177,-12.838839,0.13152093,-107.80149,108.054184,7.8299,9.276622,-5.193653,-111.06506,-201.32422,17.106522,2.6275022,-1.9431015,157.3268,1000000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.64115906,151.47078,0.007386628,-0.007391362,-13.500641,0.20737827,-151.37106,151.67078,1.2843298,5.668552,-64.38984,-154.08745,-193.75743,6.952882,3.0530581,-3.6793885,86.52069,505000
|
| 3 |
+
0.6339626,146.44354,0.007594293,-0.0062137167,-13.318209,0.22775419,-146.3424,146.66508,1.2882642,6.92341,-38.577126,-149.4335,-193.88535,8.211674,7.7369285,-8.084668,108.05992,510000
|
| 4 |
+
0.64343643,147.0672,0.007893995,-0.004922801,-13.123613,0.17129043,-146.96361,147.23357,2.2667286,6.117712,-43.359303,-150.11943,-194.26614,8.38444,1.3815638,-1.457663,77.939766,515000
|
| 5 |
+
0.6348855,146.98833,0.008041692,-0.023220178,-15.387474,0.17793922,-146.8646,147.14304,2.9864728,7.5639853,-43.83824,-150.3148,-199.34526,10.550458,2.8655946,-2.9862332,120.974106,520000
|
| 6 |
+
0.641117,146.32503,0.008095764,-0.006708396,-13.32863,0.17509739,-146.21713,146.49341,1.5349731,4.640433,-67.05228,-148.67873,-200.2801,6.175406,1.5605819,-1.620509,62.746082,525000
|
| 7 |
+
0.6456789,147.08755,0.008358137,-0.004993316,-13.09742,0.18527916,-146.97809,147.26784,1.679381,8.674501,-71.71513,-149.09476,-197.54333,10.353883,4.290274,-3.790325,113.91197,530000
|
| 8 |
+
0.6446261,146.25348,0.008449667,0.0065145316,-11.729019,0.20550552,-146.15439,146.4655,2.3890655,5.971564,-10.356891,-148.33012,-196.67082,8.360629,4.2360697,-3.3920007,105.041275,535000
|
| 9 |
+
0.6427683,144.7363,0.008248501,-0.006417451,-13.278014,0.16864687,-144.62677,144.89851,1.9592234,6.3229156,-50.283974,-148.15141,-197.61981,8.282139,1.3531208,-1.3228661,80.83486,540000
|
| 10 |
+
0.64484876,144.43185,0.00811409,0.008168026,-11.493353,0.19654348,-144.3386,144.63657,1.5880466,4.8051257,-10.0128565,-146.67809,-195.76237,6.3931723,2.4507732,-2.0494816,79.54104,545000
|
| 11 |
+
0.64234865,145.92404,0.008243834,-0.005037926,-13.1111145,0.16126022,-145.81598,146.08026,3.330298,6.152203,-48.617844,-148.6548,-194.54846,9.482501,4.1068172,-2.9974964,95.90861,550000
|
| 12 |
+
0.6460353,142.74915,0.008634192,-0.0015792222,-12.682903,0.19269416,-142.63965,142.94026,3.7884634,5.769195,-28.90694,-145.98547,-196.93689,9.557658,1.2918088,-1.4878584,105.38553,555000
|
| 13 |
+
0.63429195,141.4096,0.008779337,-0.017772846,-14.524395,0.19187321,-141.28209,141.58371,2.6731832,7.648492,-39.34383,-145.10806,-200.81065,10.321675,3.0612304,-2.7132392,113.05782,560000
|
| 14 |
+
0.64231414,144.02728,0.008691635,-0.009078971,-13.544564,0.18215942,-143.90956,144.20036,2.4178088,6.113767,-43.525066,-146.55074,-200.34581,8.531576,2.5636225,-1.5186279,73.669205,565000
|
| 15 |
+
0.6447574,137.66486,0.008583827,-0.010066728,-13.672755,0.17831327,-137.54749,137.8331,2.2618847,7.22179,-11.628499,-140.43489,-200.0928,9.483675,4.0483956,-3.139135,98.654854,570000
|
| 16 |
+
0.6436528,142.67892,0.008827754,-0.0027889137,-12.815926,0.20173123,-142.56578,142.87787,2.8914192,9.007509,-46.497932,-145.27505,-201.5458,11.898929,5.2609453,-6.910512,106.26834,575000
|
| 17 |
+
0.63899916,143.19916,0.008837893,-7.2737707e-06,-12.500823,0.167225,-143.08868,143.36638,2.818138,8.25191,-35.912388,-145.79196,-199.15706,11.070048,0.92026836,-1.0327636,90.19783,580000
|
| 18 |
+
0.6419296,141.8727,0.00857744,-0.0018275453,-12.713064,0.1797099,-141.76364,142.05057,4.276029,6.369999,-8.433832,-144.4842,-200.77174,10.6460285,1.3477923,-0.8554929,102.399475,585000
|
| 19 |
+
0.6439789,139.64272,0.008863692,-0.003754011,-12.923527,0.1724695,-139.52817,139.81143,5.967512,7.6569138,-33.82739,-142.17711,-196.76157,13.624426,3.7755635,-3.310035,151.81973,590000
|
| 20 |
+
0.64494663,139.93678,0.0088800555,0.014401949,-10.878169,0.16089192,-139.84018,140.11208,2.336083,9.818218,-28.585882,-141.99962,-199.2035,12.154301,5.741296,-5.3604817,130.14995,595000
|
| 21 |
+
0.6363981,134.50568,0.009158833,-0.0043596467,-12.976005,0.18827137,-134.38684,134.68959,3.2637613,6.6005855,-21.93687,-137.59024,-202.10756,9.8643465,1.7697905,-2.1444068,94.52597,600000
|
| 22 |
+
0.6441658,136.3682,0.009171406,0.014429367,-10.926701,0.1753734,-136.26797,136.558,4.008087,10.110026,-11.957599,-139.82542,-198.54527,14.1181135,2.4859831,-2.7199538,136.63719,605000
|
| 23 |
+
0.6403731,134.95474,0.0094042905,-0.010239988,-13.588863,0.1806503,-134.82697,135.12515,4.0667987,8.847638,-29.173996,-138.15694,-197.57422,12.914436,6.6367683,-6.1972256,187.21164,610000
|
| 24 |
+
0.63297796,133.50348,0.009349223,-0.005505736,-13.088898,0.15617536,-133.3811,133.65414,3.6416008,11.429552,1.4101886,-137.55368,-193.80833,15.071153,5.625752,-8.299414,181.17354,615000
|
| 25 |
+
0.6486115,134.75137,0.009205787,0.008244417,-11.604431,0.167775,-134.64453,134.92738,5.048521,11.450105,-12.254368,-137.25763,-200.97305,16.498627,5.9612594,-5.5254593,171.50844,620000
|
| 26 |
+
0.6395136,138.87225,0.009168005,-0.017408801,-14.398865,0.16372126,-138.74023,139.01857,5.343843,9.951118,-30.373798,-142.23051,-196.19778,15.294962,2.2793245,-2.1188529,112.97597,625000
|
| 27 |
+
0.64853805,135.02846,0.009318856,0.0052619944,-11.935339,0.15332152,-134.91724,135.18704,3.3581185,13.325172,-10.540414,-138.83316,-194.98886,16.68329,5.1118946,-5.8192654,187.32108,630000
|
| 28 |
+
0.63602746,134.45956,0.009252541,-0.014728404,-14.091823,0.16132674,-134.32918,134.60617,3.2329087,14.2916975,1.3294272,-138.13802,-195.75775,17.524607,6.2808785,-5.081433,169.0971,635000
|
| 29 |
+
0.6428751,131.48181,0.009370093,-0.0052017807,-13.055147,0.1730569,-131.35947,131.64966,2.6979663,6.615207,-21.667759,-134.86255,-196.23466,9.313173,2.7118027,-2.8213317,92.15067,640000
|
| 30 |
+
0.6517114,135.40875,0.0091324225,0.0116454465,-11.224824,0.16311523,-135.30624,135.58351,2.3112652,8.3381,-26.615433,-138.07397,-196.4741,10.649365,6.9738665,-5.201306,147.86319,645000
|
| 31 |
+
0.65049344,134.02136,0.0091923075,0.0104005635,-11.368558,0.18699738,-133.91687,134.21877,2.8191113,7.9507446,-9.304501,-135.49846,-200.76456,10.7698555,0.87516975,-1.2975373,114.70554,650000
|
| 32 |
+
0.6449049,134.02374,0.009412576,-0.0023583146,-12.750549,0.20122546,-133.90372,134.22261,2.7104175,8.811869,-31.305737,-136.88062,-194.90517,11.522286,1.8450334,-1.5847001,119.120995,655000
|
| 33 |
+
0.65416074,134.90305,0.0095208995,0.016173443,-10.80127,0.17845346,-134.8002,135.09767,5.4858713,9.056722,-19.039583,-137.9423,-200.76524,14.542593,6.9566927,-7.0370903,222.50443,660000
|
| 34 |
+
0.6370696,134.69511,0.009200754,-0.013553513,-13.973087,0.17757602,-134.56654,134.85915,3.1671886,8.536143,-1.1609197,-137.52252,-201.96115,11.703332,3.1009386,-4.456216,126.51463,665000
|
| 35 |
+
0.6458094,131.64905,0.009263303,0.02425207,-9.88192,0.16919476,-131.55753,131.84248,5.374736,10.336391,-6.822313,-133.95976,-196.71642,15.711127,3.2583513,-9.397792,237.86166,670000
|
| 36 |
+
0.64216083,136.21114,0.009453657,0.0045897355,-12.014502,0.1942154,-136.09755,136.40994,3.5501525,10.264066,-13.428291,-138.71599,-201.27003,13.8142185,3.697692,-3.2114873,198.98575,675000
|
| 37 |
+
0.6503367,132.29012,0.009311131,0.012868933,-11.117898,0.1597037,-132.1866,132.46268,2.4531476,10.356818,2.8817103,-135.01674,-195.26976,12.809966,3.4607196,-3.246385,141.92047,680000
|
| 38 |
+
0.63346547,133.63782,0.009470378,-0.024828682,-15.12172,0.17196274,-133.4946,133.78496,4.0854845,8.524919,-6.8006654,-137.17593,-193.92587,12.610403,0.8233037,-0.98874557,105.81446,685000
|
| 39 |
+
0.6446504,130.78423,0.009343038,0.01324394,-11.08248,0.15642238,-130.6807,130.95389,3.8897934,9.663524,-8.585822,-133.85399,-202.56334,13.553317,5.49211,-6.5613713,193.58682,690000
|
| 40 |
+
0.63896537,129.99953,0.009502844,-0.009468913,-13.496429,0.19615252,-129.87128,130.1862,3.0962682,11.695128,-1.6998159,-132.74297,-194.4358,14.791397,5.7970085,-5.167028,144.89662,695000
|
| 41 |
+
0.63686043,132.90869,0.009477263,-0.0092943655,-13.480701,0.1886166,-132.78091,133.08801,6.014976,10.530792,-22.538824,-136.23236,-200.37578,16.545769,1.5310786,-2.0966198,154.85837,700000
|
| 42 |
+
0.6399312,130.80818,0.009664157,-0.00656904,-13.179732,0.17355326,-130.68082,130.97516,8.812982,14.992879,-4.0062456,-133.8695,-196.51001,23.80586,5.280988,-5.4753504,254.1319,705000
|
| 43 |
+
0.63378364,130.42291,0.0097146435,-0.0045918724,-12.972675,0.16108356,-130.29689,130.5794,3.10216,9.329264,-19.811361,-133.40953,-198.83632,12.431423,4.1620636,-1.753137,130.59998,710000
|
| 44 |
+
0.6494521,130.47012,0.009513267,0.003691751,-12.111937,0.17453521,-130.35489,130.64835,2.8536537,9.036019,-6.046004,-132.59647,-201.63753,11.889673,2.8878353,-2.7299511,121.02315,715000
|
| 45 |
+
0.63751924,128.94087,0.009495959,0.0004991515,-12.447435,0.1709806,-128.82266,129.11235,2.7440877,10.132121,-15.233045,-132.01883,-203.34052,12.876209,2.5892663,-3.4068785,113.636925,720000
|
| 46 |
+
0.63608587,125.13534,0.009639305,0.0042457213,-12.059541,0.15226942,-125.01909,125.29185,3.0672326,12.592521,-5.66239,-128.0989,-192.41238,15.659754,1.830749,-1.8175281,123.68656,725000
|
| 47 |
+
0.6481874,130.2086,0.009423355,0.014987386,-10.909549,0.20120822,-130.1058,130.42479,4.10511,9.548141,-9.315554,-133.3861,-200.31711,13.653251,2.308039,-1.867134,122.67647,730000
|
| 48 |
+
0.6401909,128.1512,0.009587195,-0.011452361,-13.694548,0.18353856,-128.01991,128.32327,3.3128114,9.980926,-8.273938,-131.01846,-191.5406,13.293737,3.3038483,-3.7900805,127.10757,735000
|
| 49 |
+
0.6543422,125.632645,0.009379869,0.0068577304,-11.768888,0.14226973,-125.52225,125.78178,3.4949837,8.317082,0.7344019,-128.73317,-199.19594,11.812066,1.7023914,-0.9026097,101.38617,740000
|
| 50 |
+
0.6469857,126.99939,0.009337007,-0.001142042,-12.6223135,0.1494716,-126.88154,127.14772,3.6622016,10.625549,-4.6786838,-129.92085,-205.61522,14.287751,4.3080053,-4.838219,130.03244,745000
|
| 51 |
+
0.6416046,121.11925,0.009281994,0.00056796195,-12.43881,0.14800216,-121.003784,121.267815,5.2783923,13.970772,-1.1186365,-124.62206,-202.39465,19.249165,2.722152,-2.7329423,212.81836,750000
|
| 52 |
+
0.65340817,129.89816,0.009302744,0.0060321237,-11.851576,0.16234894,-129.78792,130.06654,3.723863,8.804921,2.0030198,-132.88872,-199.9468,12.528784,3.870852,-3.5189717,138.11124,755000
|
| 53 |
+
0.6475883,126.73375,0.009519633,-0.0040962594,-12.930296,0.1884712,-126.610664,126.91812,3.348128,10.320706,2.3890426,-129.83727,-188.40704,13.668835,1.7519842,-1.881941,125.45193,760000
|
| 54 |
+
0.64391804,125.1855,0.009422811,0.0040838923,-12.066595,0.1768919,-125.0718,125.36648,2.9711025,10.100297,-3.8676596,-128.21713,-193.67088,13.0714,1.8664325,-2.7640946,113.72586,765000
|
| 55 |
+
0.6420822,128.57314,0.009316932,-0.0032667231,-12.850622,0.17318459,-128.45341,128.74306,7.376024,9.565112,-11.459131,-131.29901,-198.26384,16.941135,6.531716,-6.013642,298.45206,770000
|
| 56 |
+
0.6406972,123.877045,0.009575874,-0.0067146528,-13.201205,0.17665374,-123.750626,124.04698,3.1382947,10.020911,-14.770311,-126.85561,-197.53236,13.159206,1.0711468,-0.781445,116.921425,775000
|
| 57 |
+
0.63243484,123.741714,0.00928333,-0.016671404,-14.295843,0.17305627,-123.60901,123.8981,3.9745483,12.430615,-4.8354936,-127.31313,-197.9491,16.405163,4.884416,-4.679324,147.10388,780000
|
| 58 |
+
0.6465733,122.78073,0.009317638,-0.0038751813,-12.915897,0.1692524,-122.660385,122.946106,3.0946367,6.60384,-3.4745245,-124.74153,-201.23607,9.698477,0.88683355,-0.6646373,91.36621,785000
|
| 59 |
+
0.63916713,120.31384,0.009533852,-0.0021078605,-12.721092,0.17329103,-120.192566,120.48503,5.24846,10.563865,-8.61488,-123.15566,-198.66965,15.812325,1.2715528,-1.1284006,123.277534,790000
|
| 60 |
+
0.64890516,121.77678,0.0092748795,0.011753432,-11.232767,0.15371849,-121.67259,121.94225,4.095108,11.039172,1.0874373,-124.26125,-195.86133,15.13428,2.8280551,-5.6451206,176.46153,795000
|
| 61 |
+
0.637367,124.09254,0.009339243,-0.0036530495,-12.89115,0.15591718,-123.972145,124.2448,4.2530627,8.901825,-8.814355,-127.239746,-196.4571,13.154888,2.2850523,-2.037319,121.42115,800000
|
| 62 |
+
0.6443135,123.790504,0.009473296,-0.0021175279,-12.723526,0.15993667,-123.669975,123.94832,3.3667035,13.746569,-3.625892,-127.050316,-196.08029,17.113272,1.3697973,-1.3131655,154.15573,805000
|
| 63 |
+
0.65009594,119.774254,0.009438396,0.0044958796,-12.023661,0.16341773,-119.66077,119.94216,4.326635,12.567731,-5.9381337,-123.12648,-198.67242,16.894365,3.9336452,-3.8251333,202.73671,810000
|
| 64 |
+
0.6424965,121.031784,0.009450858,0.004897308,-11.981813,0.17728186,-120.91855,121.21397,2.5704005,11.462024,-6.761825,-123.30725,-190.32983,14.032424,1.9068158,-2.0599833,149.21323,815000
|
| 65 |
+
0.63710713,120.56851,0.009610647,0.0016643866,-12.326818,0.1593282,-120.45005,120.7295,3.6971073,23.16978,-5.9290733,-124.06866,-203.9021,26.866888,4.5873737,-5.077392,261.38492,820000
|
| 66 |
+
0.6462773,122.87613,0.009500107,-0.0008346895,-12.587861,0.15695092,-122.75654,123.03225,2.67559,11.320803,-3.6617436,-125.7409,-200.66006,13.996393,2.1536672,-3.091761,136.16693,825000
|
| 67 |
+
0.6393799,115.25131,0.009541907,0.010506294,-11.3989315,0.1729065,-115.14255,115.43472,3.154124,11.03641,-7.131429,-117.55519,-197.11263,14.190535,1.5667274,-1.6702949,115.54337,830000
|
| 68 |
+
0.6440687,117.645775,0.009408264,0.009135575,-11.528984,0.17701219,-117.53731,117.83192,3.2160847,9.205414,-4.3175673,-120.474815,-196.9428,12.421498,5.246868,-5.2474213,150.49692,835000
|
| 69 |
+
0.6495659,122.84931,0.009444281,0.010233113,-11.416475,0.18673888,-122.74149,123.04628,3.3032746,10.260089,-7.213843,-125.866165,-192.41402,13.563364,2.3875465,-1.7395334,129.38898,840000
|
| 70 |
+
0.63684666,122.48055,0.009685291,-0.018351672,-14.394798,0.15852027,-122.34113,122.62073,2.598279,14.521106,-4.0492835,-125.513405,-197.03293,17.119385,6.9928565,-6.6658516,179.26176,845000
|
| 71 |
+
0.6416665,115.96068,0.009498726,0.0178901,-10.616579,0.15444508,-115.85983,116.13301,3.6024914,8.620467,-1.6335251,-118.515236,-200.45207,12.222959,4.012233,-4.9722614,156.00189,850000
|
| 72 |
+
0.64871114,120.02832,0.009413901,0.0088048475,-11.564697,0.14782083,-119.91945,120.184944,8.662666,10.341872,-4.0812445,-122.81695,-197.22516,19.00454,3.161993,-3.0323794,185.94951,855000
|
| 73 |
+
0.63883734,117.57738,0.00943554,-0.0003626818,-12.538438,0.15350541,-117.459076,117.730515,5.0954847,14.271598,-1.9055194,-120.51843,-194.0712,19.367083,2.5982742,-2.7737124,201.2472,860000
|
| 74 |
+
0.63888824,118.8931,0.009444101,-0.011681465,-13.736906,0.16070572,-118.76337,119.04212,2.605388,10.990046,-0.29166335,-121.41976,-199.57327,13.595433,2.945791,-2.4275472,147.84744,865000
|
| 75 |
+
0.64641494,119.32585,0.009415575,-0.006529015,-13.193427,0.14087653,-119.20163,119.4602,5.7958508,15.635269,-4.724848,-122.34292,-198.32414,21.43112,9.879428,-10.589703,228.91516,870000
|
| 76 |
+
0.6491601,112.93011,0.0097892815,0.0008001889,-12.418259,0.144052,-112.80854,113.07496,2.9193199,10.488506,1.3696377,-116.29241,-194.88577,13.407826,3.2304866,-3.0692139,177.84384,875000
|
| 77 |
+
0.64649564,114.27639,0.009640454,0.020963311,-10.325485,0.15488006,-114.17685,114.45223,3.904085,9.3024435,0.57135075,-117.50402,-195.83545,13.206529,1.9796354,-1.5406276,141.93921,880000
|
| 78 |
+
0.6455101,119.22926,0.009321593,-0.0049662488,-13.032768,0.12464798,-119.10778,119.348946,3.356363,10.258151,-2.5418446,-122.430786,-201.86865,13.614514,1.5661674,-1.6245717,114.233734,885000
|
| 79 |
+
0.6371798,122.80914,0.009370343,-0.010477714,-13.618178,0.17730519,-122.68154,122.975975,3.7526207,10.953334,-4.2014294,-125.22351,-203.13278,14.705955,1.7949674,-1.1990622,130.48651,890000
|
| 80 |
+
0.6414218,117.12268,0.009573294,-0.008928356,-13.4326315,0.1325323,-116.994095,117.246284,7.0479097,12.575999,-2.6929233,-120.310135,-195.81969,19.623909,3.558292,-2.649505,222.62866,895000
|
| 81 |
+
0.6408136,114.70831,0.00928511,-0.012335922,-13.82857,0.16886692,-114.57991,114.864845,5.479026,12.507359,-2.3703885,-117.82826,-197.88046,17.986385,7.713042,-7.81921,183.21956,900000
|
| 82 |
+
0.64120543,117.89312,0.0095293205,0.013899967,-11.0413475,0.16801552,-117.787895,118.075035,4.820117,11.63515,-3.3836436,-120.715675,-199.40741,16.455267,1.5992495,-1.3222691,151.39867,905000
|
| 83 |
+
0.64592564,121.51994,0.0095179,-0.0022765058,-12.7391815,0.14761661,-121.3987,121.66528,4.91865,11.571672,7.243404,-124.25183,-201.00058,16.490322,4.934762,-4.90159,198.85747,910000
|
| 84 |
+
0.65647995,114.81821,0.009766697,0.0012573489,-12.371262,0.16875248,-114.69738,114.98822,3.4133675,9.5693865,-1.3751962,-117.55005,-194.19745,12.982754,2.2836144,-2.0160208,141.97025,915000
|
| 85 |
+
0.64578134,117.678055,0.009541201,-0.0044967784,-12.971301,0.16405153,-117.5543,117.837616,4.569065,10.270363,-2.868859,-120.38928,-198.004,14.839428,3.2167072,-3.0077124,139.04904,920000
|
| 86 |
+
0.64717245,113.64228,0.009463928,-0.006794382,-13.217924,0.14366406,-113.51718,113.779144,5.0050693,17.51408,0.06483639,-117.33633,-201.9487,22.51915,4.8363285,-3.9367647,210.68793,925000
|
| 87 |
+
0.6556228,114.401245,0.009435162,0.014645135,-10.947813,0.14739919,-114.29796,114.56329,3.0109458,8.561332,-4.094603,-116.87925,-203.1488,11.572277,1.0943211,-1.3321385,116.714325,930000
|
| 88 |
+
0.6595001,116.578,0.009641636,0.023274528,-10.08604,0.16877814,-116.48076,116.77006,4.1667366,12.217608,-6.0564957,-118.79618,-202.37694,16.384346,3.2843807,-2.8842525,158.62328,935000
|
| 89 |
+
0.64175683,112.41008,0.009440913,-0.010032266,-13.562637,0.19525327,-112.28204,112.5953,5.6239963,10.909836,-1.0641075,-115.5169,-201.6677,16.533833,6.1284795,-3.6818862,215.45636,940000
|
| 90 |
+
0.6470103,115.78818,0.009609278,0.0029855426,-12.189306,0.15507972,-115.67105,115.94624,3.5520966,9.21227,5.078501,-119.22228,-196.35178,12.764366,1.2940526,-1.2713069,129.78502,945000
|
| 91 |
+
0.64584637,112.18138,0.009572002,0.0009818876,-12.397421,0.1757039,-112.06271,112.35807,5.085865,11.219294,-6.930212,-115.69,-197.56198,16.305159,2.827618,-3.0576813,185.97943,950000
|
| 92 |
+
0.6429365,114.632645,0.009526118,-0.008232023,-13.364153,0.1510723,-114.50533,114.77548,4.273542,10.166087,-2.4667594,-117.468765,-194.1475,14.439629,2.3866143,-2.7430317,146.55641,955000
|
| 93 |
+
0.6426695,113.780045,0.009461978,-0.0075667873,-13.299705,0.15507652,-113.6542,113.92755,4.492087,13.244295,-3.0991054,-116.22095,-200.17648,17.736382,5.164081,-5.032467,204.30852,960000
|
| 94 |
+
0.6469474,111.39033,0.009804824,0.009335442,-11.547873,0.16244766,-111.2771,111.56211,4.219217,9.205934,-2.2469501,-114.551895,-202.24544,13.42515,1.0681547,-1.4270226,112.53923,965000
|
| 95 |
+
0.64476967,109.80739,0.009678287,0.01631963,-10.813789,0.17435864,-109.70273,109.99807,3.6924608,13.060326,-6.93413,-112.35186,-197.67938,16.752787,2.3390026,-2.3840513,153.21286,970000
|
| 96 |
+
0.6487332,111.198425,0.009741454,0.0055994764,-11.925191,0.14091155,-111.08226,111.34494,7.4732056,21.624422,0.9021272,-114.31066,-203.17764,29.097628,6.4860435,-8.222426,282.0349,975000
|
| 97 |
+
0.63769406,114.44853,0.0095910765,-0.019059092,-14.487169,0.14898652,-114.30957,114.57846,5.2746615,11.539787,1.5297862,-118.058205,-188.22485,16.81445,3.8123424,-4.3512263,195.09262,980000
|
| 98 |
+
0.64049834,113.83164,0.009647656,0.00052204897,-12.4458885,0.14947167,-113.71157,113.981636,4.67142,12.702911,-5.5749316,-115.94297,-193.79695,17.374332,2.9837499,-2.6974895,167.11714,985000
|
| 99 |
+
0.6462904,112.9897,0.009707484,0.002975839,-12.193449,0.14664578,-112.87133,113.13932,4.781112,11.211001,-3.204215,-115.05391,-200.40112,15.992113,2.8311548,-2.9297924,214.21262,990000
|
| 100 |
+
0.63646966,106.66548,0.009640096,-0.01213801,-13.759117,0.1621923,-106.53285,106.81554,14.406348,16.549025,-0.38510764,-110.42413,-205.37886,30.955372,3.7113402,-5.122575,263.7284,995000
|
| 101 |
+
0.63828653,107.92594,0.009692868,-0.0032843177,-12.838839,0.13152093,-107.80149,108.054184,7.8299,9.276622,-5.193653,-111.06506,-201.32422,17.106522,2.6275022,-1.9431015,157.3268,1000000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c346c957937309eb3177507196b3786a25953008da72e705460e698c92661eb5
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9fb49f351314224d96d54109c04ec28b9f0051b4d8160c5e2aa61a1b14106349
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a63297ebd465752b390707a12e8e1c99897e44bdc3bd4b5be374f45c90fdc0df
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:456f76371e7fef1766b0c84c9c3736bea48dbff9c7053cda8dfdc15a98929862
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98972491ce4170a52464cfaa649abb5888c991187633bb343e17a981ca2e596e
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ff87c2c6a51f8111987e63c96593bbabc2ba7bc9f821b495e9abbd27ca77b5d
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8ff238e54b9e9f0514f6bb5cba4726fc992b6c4f0d427c14d6ca02b44587d82
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f481737cac0489ecbd5aeaf7f7eaa48c50cba5f1a09e17917b31aa5d45e7619
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d4276da404c20a0b3ecde7546f5033dc3edf9d87fe5e02627e982be5dd901ca
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb2b485b8b2cdda22e34bbbeabf3021aa935ec4d2168079cabbf7a6aa64b8aa8
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_105154/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/a29ntbju
|