Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.06315714530372765,-0.0056378145267543455,-0.06309449140991447,-0.0009054537668175043,30.42675828983812,12.878999999999133,0.74,6031.24,-0.38,-383.1,255.58,0.8834370756149292,650000
|
| 3 |
+
0.0,0.0,-0.050882851406333765,0.00583191216121456,-0.05049870386994986,-0.003443690112795333,33.31454550980502,7.515999999999687,0.96,17193.28,-0.08,-232.18,148.32,0.4931029224395752,700000
|
| 4 |
+
0.0,0.0,-0.060840541310470876,0.0020255183661433847,-0.060195486396065666,0.0011200656301256727,32.857264314103006,6.802999999999797,1.0,24426.94,0.0,-201.32,134.06,0.48034269332885743,750000
|
| 5 |
+
0.0,0.0,-0.05702395709877929,0.05136840895374753,-0.056395023118587025,-0.0015764847725582888,33.36039406607582,5.659999999999655,0.98,30760.72,-0.04,-163.0,111.2,0.3797770595550537,800000
|
| 6 |
+
0.0,0.0,-0.051793976328267155,0.004741257035009317,-0.05086365986045667,0.002937900882424317,32.808313199420674,6.768999999999631,0.96,37112.9,-0.04,-189.0,133.38,0.44366607189178464,850000
|
| 7 |
+
0.0,0.0,-0.06340244327301088,0.010831251711723862,-0.06250790380194834,0.014459994785602243,32.273500898255946,6.581999999999658,0.96,43744.98,-0.04,-182.48,129.64,0.42889143943786623,900000
|
| 8 |
+
0.0,0.0,-0.05596592691412014,0.0052475249345267875,-0.055083951199347836,0.0018255945677322413,33.16682442012888,4.7979999999997345,0.98,49665.12,-0.02,-128.9,93.96,0.3230148696899414,950000
|
| 9 |
+
0.0,0.0,-0.045224109113456104,0.010653571119293364,-0.04452791919908719,0.009906061396591266,32.4711020393902,4.850999999999789,0.98,54587.1,-0.02,-134.98,95.02,0.31771321773529054,1000000
|
| 10 |
+
0.0,0.0,-0.05360750668701584,0.015591523770851259,-0.052682185825191304,-0.005845894941136392,34.03260366732331,4.603999999999783,1.0,59148.54,0.0,-126.16,90.08,0.3040682029724121,1050000
|
| 11 |
+
0.0,0.0,-0.052826061740312055,0.013485659460586294,-0.05111217679436544,-0.00808834849681005,33.934515002603426,5.194999999999673,0.98,64147.34,-0.04,-148.68,101.9,0.35953640460968017,1100000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.06315714530372765,-0.0056378145267543455,-0.06309449140991447,-0.0009054537668175043,30.42675828983812,12.878999999999133,0.74,6031.24,-0.38,-383.1,255.58,0.8834370756149292,650000
|
| 3 |
+
0.0,0.0,-0.050882851406333765,0.00583191216121456,-0.05049870386994986,-0.003443690112795333,33.31454550980502,7.515999999999687,0.96,17193.28,-0.08,-232.18,148.32,0.4931029224395752,700000
|
| 4 |
+
0.0,0.0,-0.060840541310470876,0.0020255183661433847,-0.060195486396065666,0.0011200656301256727,32.857264314103006,6.802999999999797,1.0,24426.94,0.0,-201.32,134.06,0.48034269332885743,750000
|
| 5 |
+
0.0,0.0,-0.05702395709877929,0.05136840895374753,-0.056395023118587025,-0.0015764847725582888,33.36039406607582,5.659999999999655,0.98,30760.72,-0.04,-163.0,111.2,0.3797770595550537,800000
|
| 6 |
+
0.0,0.0,-0.051793976328267155,0.004741257035009317,-0.05086365986045667,0.002937900882424317,32.808313199420674,6.768999999999631,0.96,37112.9,-0.04,-189.0,133.38,0.44366607189178464,850000
|
| 7 |
+
0.0,0.0,-0.06340244327301088,0.010831251711723862,-0.06250790380194834,0.014459994785602243,32.273500898255946,6.581999999999658,0.96,43744.98,-0.04,-182.48,129.64,0.42889143943786623,900000
|
| 8 |
+
0.0,0.0,-0.05596592691412014,0.0052475249345267875,-0.055083951199347836,0.0018255945677322413,33.16682442012888,4.7979999999997345,0.98,49665.12,-0.02,-128.9,93.96,0.3230148696899414,950000
|
| 9 |
+
0.0,0.0,-0.045224109113456104,0.010653571119293364,-0.04452791919908719,0.009906061396591266,32.4711020393902,4.850999999999789,0.98,54587.1,-0.02,-134.98,95.02,0.31771321773529054,1000000
|
| 10 |
+
0.0,0.0,-0.05360750668701584,0.015591523770851259,-0.052682185825191304,-0.005845894941136392,34.03260366732331,4.603999999999783,1.0,59148.54,0.0,-126.16,90.08,0.3040682029724121,1050000
|
| 11 |
+
0.0,0.0,-0.052826061740312055,0.013485659460586294,-0.05111217679436544,-0.00808834849681005,33.934515002603426,5.194999999999673,0.98,64147.34,-0.04,-148.68,101.9,0.35953640460968017,1100000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.64548874,150.8104,0.007411091,0.0018006833,-12.257029,0.18355003,-150.71957,150.99574,1.5090442,4.427874,-73.06295,-153.39738,-195.3517,5.9369183,3.287911,-3.295326,78.81692,605000
|
| 3 |
+
0.63423616,147.82486,0.0076426268,-0.018300582,-14.894541,0.18814299,-147.71103,147.9947,4.2588763,4.7889543,-47.9112,-150.74266,-192.67285,9.047831,2.5537255,-2.3811214,99.48657,610000
|
| 4 |
+
0.639863,149.47968,0.007312117,-0.0044536176,-13.109074,0.16253623,-149.38382,149.63776,1.4235862,5.0489764,-43.21124,-152.39522,-193.74557,6.472563,1.1103185,-1.2106696,65.73044,615000
|
| 5 |
+
0.63298196,147.56223,0.007908308,-0.027477149,-15.974466,0.16959476,-147.43588,147.70435,3.5900161,8.055021,-27.037195,-151.03006,-199.27751,11.645038,4.4638305,-4.987754,104.6268,620000
|
| 6 |
+
0.6469342,145.00229,0.008432505,-0.006142906,-13.228479,0.17114368,-144.89075,145.16728,1.4469994,4.977134,-66.52871,-147.77979,-200.19734,6.424134,2.8047082,-2.9369755,64.77774,625000
|
| 7 |
+
0.6472643,145.10797,0.008104044,-0.006337869,-13.282063,0.15032524,-145.00034,145.25197,2.294285,8.901448,-74.52154,-147.27081,-198.0986,11.195733,1.7084754,-1.9771442,108.10998,630000
|
| 8 |
+
0.6511408,145.14078,0.008370342,0.00048269064,-12.442333,0.17101362,-145.03664,145.31229,2.5787854,5.6908092,0.79983056,-147.7023,-197.49547,8.269594,2.8985553,-2.5658002,87.08915,635000
|
| 9 |
+
0.6374728,142.1056,0.008681536,-0.0050503006,-13.081729,0.17243233,-141.99203,142.273,6.754686,10.061877,-32.35202,-145.5514,-199.22653,16.816563,4.5398574,-5.049078,143.66249,640000
|
| 10 |
+
0.6506496,142.71524,0.008732287,0.0043611303,-12.000574,0.17827627,-142.61046,142.89789,1.8652642,6.910888,-45.194366,-145.0459,-198.23778,8.776153,3.7506757,-2.9279935,108.083725,645000
|
| 11 |
+
0.6440315,142.9573,0.00898228,-0.00015367709,-12.517109,0.21335231,-142.84486,143.1705,2.7191968,6.883962,-42.644394,-145.5739,-197.42274,9.603159,1.2063502,-1.8371133,94.4332,650000
|
| 12 |
+
0.63567984,138.0719,0.008831696,-0.014373379,-14.127477,0.21752667,-137.94714,138.27505,5.6974854,12.709803,-24.64603,-141.67342,-197.87817,18.407288,4.7303963,-3.2033749,158.51172,655000
|
| 13 |
+
0.63623804,137.46638,0.009263666,-0.013421749,-13.948859,0.20607637,-137.33716,137.65903,3.4032981,8.21361,-36.06813,-141.75467,-200.98817,11.616908,4.929565,-4.8117085,131.04234,660000
|
| 14 |
+
0.63963604,137.9961,0.009014813,-0.010593808,-13.675156,0.18530455,-137.8728,138.1708,3.2476585,7.109079,-8.5246,-140.88858,-199.55827,10.356737,2.2371557,-3.0394223,89.55348,665000
|
| 15 |
+
0.6395569,133.2652,0.009211847,-0.00073787826,-12.580101,0.18402633,-133.1493,133.44849,2.76834,9.373946,-19.889765,-136.00107,-198.4503,12.142286,1.6813269,-2.7929866,89.21693,670000
|
| 16 |
+
0.6485966,137.42767,0.009250066,0.00029897116,-12.467679,0.19743922,-137.31235,137.62541,2.389283,6.9309244,-33.421967,-140.37593,-201.18857,9.320208,2.026956,-1.9043684,87.8613,675000
|
| 17 |
+
0.63144016,137.75407,0.0094066,-0.021223987,-14.756287,0.160401,-137.61526,137.89325,4.9168634,10.215121,-20.492874,-140.98744,-200.64006,15.131985,2.0726125,-1.1277361,120.462875,680000
|
| 18 |
+
0.64020646,134.79355,0.009014654,0.0071165296,-11.71056,0.1742867,-134.68797,134.97495,4.6740317,12.454428,-8.539329,-137.54997,-199.57382,17.12846,4.7329793,-4.216344,185.3577,685000
|
| 19 |
+
0.6400877,135.00232,0.009060658,-0.0025740943,-12.784096,0.17599024,-134.88649,135.17574,3.350991,6.0773544,-8.33259,-137.62027,-203.55818,9.428346,2.7665098,-2.657054,109.92705,690000
|
| 20 |
+
0.64428806,133.97093,0.009122755,0.005186065,-11.931524,0.19546847,-133.86208,134.17159,2.4467533,7.3109775,-22.847443,-136.44743,-197.77386,9.7577305,2.4789689,-2.2731714,88.84099,695000
|
| 21 |
+
0.6358364,132.32816,0.009273592,-0.004794396,-13.016994,0.19637382,-132.20746,132.51974,2.6462228,8.906959,-7.49915,-135.56044,-202.05284,11.553182,1.6759752,-2.4750898,109.19887,700000
|
| 22 |
+
0.641631,135.57135,0.00913897,-0.005520287,-13.104038,0.19505444,-135.4516,135.76088,4.864945,13.727114,-4.7191224,-138.92064,-198.05759,18.592058,16.528944,-16.858261,241.32285,705000
|
| 23 |
+
0.63747144,130.89128,0.009281861,-0.007475043,-13.305339,0.17376587,-130.76778,131.05757,15.929665,8.838729,-28.309315,-133.51329,-198.48114,24.768394,3.0550013,-2.3479598,214.55525,710000
|
| 24 |
+
0.63731545,130.81732,0.009317149,-0.0038833304,-12.916794,0.17139229,-130.69698,130.98483,3.3586495,11.358935,1.769184,-134.70714,-196.91167,14.717585,5.336236,-6.138225,151.36894,715000
|
| 25 |
+
0.6488781,132.60677,0.009136835,0.011130899,-11.281755,0.17180052,-132.5037,132.78969,4.5275,9.924003,-19.114908,-135.4191,-201.0254,14.451503,5.203011,-3.6412268,153.43999,720000
|
| 26 |
+
0.6339715,135.63205,0.009069442,-0.025362894,-15.296522,0.14736578,-135.49333,135.75406,4.769716,11.583646,-7.742432,-138.97955,-194.85439,16.353361,1.9706419,-1.8785528,123.86465,725000
|
| 27 |
+
0.6472691,133.68213,0.009241253,0.0021044118,-12.272281,0.17676659,-133.5687,133.86101,2.9813726,8.96508,-43.672585,-137.2423,-199.53987,11.946453,4.289259,-3.8572793,113.941956,730000
|
| 28 |
+
0.6377163,133.26378,0.008962398,-0.0054894793,-13.112501,0.17783363,-133.14627,133.43613,2.862576,9.5964575,1.8333483,-136.51292,-196.37254,12.459034,6.4120765,-6.50399,154.62837,735000
|
| 29 |
+
0.65132284,130.89178,0.008833182,0.0059564942,-11.825668,0.14519161,-130.78734,131.04292,2.4271212,11.587679,-2.6682057,-134.21355,-203.25717,14.0148,2.6723654,-2.6984668,120.36099,740000
|
| 30 |
+
0.6547223,130.85564,0.009386276,0.008814278,-11.56094,0.14451587,-130.74713,131.00897,2.9675004,11.91864,-6.1773787,-133.17308,-194.92763,14.886141,4.473335,-4.6739044,143.28828,745000
|
| 31 |
+
0.6434861,132.57846,0.009218438,-0.0055969576,-13.107148,0.145913,-132.45763,132.71878,3.3122292,8.402913,-20.754156,-134.658,-200.42552,11.715142,1.0374793,-1.378666,97.07616,750000
|
| 32 |
+
0.65002954,129.66797,0.009129588,0.004979422,-11.954584,0.16181304,-129.55884,129.83476,2.349222,10.220754,-6.5027156,-132.43071,-194.83855,12.569976,3.2709618,-3.5807002,138.312,755000
|
| 33 |
+
0.65691954,130.73676,0.009181536,0.015227006,-10.841562,0.19725296,-130.6372,130.94923,4.703281,10.733401,-9.078466,-133.80426,-198.36879,15.436682,5.0775704,-3.7356696,150.82072,760000
|
| 34 |
+
0.6402673,131.39703,0.009042452,-0.011730363,-13.797255,0.18026003,-131.27228,131.56557,4.5546393,9.1648,-1.0650238,-134.56265,-200.21355,13.719439,3.5508714,-5.6338196,136.7819,765000
|
| 35 |
+
0.65127105,127.7375,0.009180651,0.017035034,-10.644464,0.16157572,-127.639786,127.916115,2.1526682,9.328837,-4.0051427,-130.26881,-197.85461,11.481505,1.6420817,-1.3943172,112.51332,770000
|
| 36 |
+
0.6432563,133.17017,0.00914138,-0.005879761,-13.143203,0.17637259,-133.05,133.34067,2.2674065,8.031833,-18.445778,-135.65042,-199.41968,10.299239,9.26328,-11.214177,149.73338,775000
|
| 37 |
+
0.6530268,129.02579,0.008986389,0.009331833,-11.461559,0.1676651,-128.92279,129.20279,2.520272,6.2087703,2.140582,-131.39546,-197.90439,8.729042,0.86676055,-1.0517943,81.686745,780000
|
| 38 |
+
0.63350284,125.86957,0.009225276,-0.02093663,-14.769485,0.19145401,-125.73332,126.040085,5.9003406,18.683432,-5.3717127,-129.31273,-194.9881,24.583773,5.1506743,-9.939047,223.73534,785000
|
| 39 |
+
0.6474864,127.1162,0.008985348,-0.0063554756,-13.207315,0.16013876,-126.99753,127.26999,4.512806,9.524898,-17.225616,-130.42265,-198.807,14.0377035,4.1561427,-3.2830482,180.8898,790000
|
| 40 |
+
0.64104253,127.81647,0.008956341,0.0007995464,-12.410728,0.16590819,-127.70532,127.98318,2.6771793,10.851982,-2.3091707,-130.50037,-197.1586,13.529161,4.252534,-4.037526,135.28267,795000
|
| 41 |
+
0.63548076,125.29637,0.009454649,-0.00980903,-13.537482,0.17146337,-125.168365,125.45802,3.7408092,9.673207,-1.389225,-129.13518,-198.72536,13.414017,5.6821203,-5.879489,162.60222,800000
|
| 42 |
+
0.63899374,127.279495,0.009020782,-0.016528634,-14.332284,0.18117389,-127.150215,127.444145,8.012087,9.635006,-5.063979,-130.98106,-196.29861,17.647093,2.5219657,-1.9213657,140.23526,805000
|
| 43 |
+
0.64677685,127.41939,0.009245198,-0.00030763957,-12.533276,0.16849852,-127.30351,127.58758,3.4464867,8.778473,0.9862002,-130.08478,-196.41269,12.224959,2.413326,-2.3847232,138.82446,810000
|
| 44 |
+
0.64065903,126.25369,0.009134617,-0.005545587,-13.107096,0.19197187,-126.13396,126.44012,2.803569,8.252367,-6.3219295,-128.96205,-201.7502,11.055936,1.3146433,-1.4739548,105.44423,815000
|
| 45 |
+
0.64454246,126.270874,0.00918372,-0.009831141,-13.570497,0.17664635,-126.14624,126.43768,3.0130792,9.440401,-3.2358665,-129.4868,-204.0863,12.45348,2.146763,-1.1137861,127.39749,820000
|
| 46 |
+
0.64130354,123.32402,0.009165368,0.004420464,-12.017699,0.18294431,-123.21387,123.51138,4.138459,11.64889,-1.6862003,-126.26951,-201.81102,15.787349,1.865061,-2.059171,158.98172,825000
|
| 47 |
+
0.64637834,125.81641,0.009112291,0.0078845285,-11.634737,0.17286256,-125.71039,125.99715,5.856348,10.683692,1.0740206,-129.04979,-201.28378,16.54004,3.195845,-3.817934,202.48907,830000
|
| 48 |
+
0.64171875,122.19771,0.009167968,-0.0062717474,-13.184093,0.17234871,-122.07684,122.363785,3.7944763,10.263959,-3.0644274,-125.36111,-195.38364,14.058435,4.6528625,-3.0885413,145.36685,835000
|
| 49 |
+
0.6504628,122.401535,0.009196626,0.01302639,-11.083569,0.18059237,-122.29961,122.59515,4.627168,9.75995,1.8155544,-125.49221,-204.72063,14.387117,0.9990605,-2.5302176,128.31845,840000
|
| 50 |
+
0.64520234,125.32684,0.0090018315,-0.013717574,-14.023865,0.1582903,-125.20061,125.47141,3.0980787,8.542325,-13.051948,-128.40956,-202.07146,11.640404,3.8898757,-4.3408732,124.64845,845000
|
| 51 |
+
0.63875604,114.513214,0.009333949,0.0069309403,-11.757448,0.1563901,-114.40348,114.67653,5.88703,11.777609,-5.403043,-118.07809,-201.68835,17.664639,3.1603963,-2.318939,161.62549,850000
|
| 52 |
+
0.65294385,129.08485,0.009076337,0.013357946,-11.028267,0.16223311,-128.98476,129.26044,4.2800765,10.5362215,-4.1386614,-132.07788,-199.70778,14.816298,4.888151,-6.351162,190.76434,855000
|
| 53 |
+
0.6455894,123.8411,0.009124527,-0.0058215046,-13.138006,0.17406857,-123.72123,124.00935,4.873342,10.267796,2.473476,-127.057884,-201.75064,15.141138,2.4737313,-2.397577,147.68564,860000
|
| 54 |
+
0.6344453,122.76438,0.009071885,-0.001893875,-12.708763,0.16047941,-122.649086,122.922966,4.1681647,11.218053,-5.9951468,-126.31189,-199.79445,15.386217,3.1480517,-4.94325,164.71046,865000
|
| 55 |
+
0.63795453,123.594086,0.009235439,-0.0045989063,-12.997963,0.13446747,-123.47405,123.72395,3.2970989,11.840903,-0.17041,-126.25713,-202.18724,15.138002,6.957887,-7.564168,215.81961,870000
|
| 56 |
+
0.63864315,120.118866,0.009210995,-0.007063658,-13.266872,0.1602009,-119.99667,120.272,4.5095067,10.843558,-1.8745737,-123.236084,-200.16522,15.3530655,2.0017357,-2.2630987,149.66716,875000
|
| 57 |
+
0.6359637,122.25983,0.009252929,-0.0012322844,-12.633178,0.17291602,-122.14293,122.4315,5.2595115,13.089539,-3.086068,-126.13259,-196.95357,18.34905,1.2724829,-1.1992205,154.65877,880000
|
| 58 |
+
0.6389341,120.109955,0.0091346735,0.002109142,-12.269106,0.122403264,-119.99788,120.23447,3.0179207,7.7200465,-9.786167,-122.49385,-200.29872,10.7379675,1.2558672,-1.3635117,111.45168,885000
|
| 59 |
+
0.6366698,114.80873,0.009273885,-0.005594679,-13.103272,0.14845562,-114.68721,114.95159,18.624197,14.464503,-6.539571,-118.15574,-201.17245,33.0887,2.1601722,-3.1501546,211.17096,890000
|
| 60 |
+
0.637873,117.059975,0.00916664,0.008028765,-11.624132,0.15113187,-116.95343,117.21913,3.3696008,9.533362,1.7814546,-119.80444,-202.93019,12.902964,1.1460733,-1.0049744,116.964355,895000
|
| 61 |
+
0.64138305,124.40807,0.009077662,-5.2921052e-05,-12.50583,0.18280141,-124.294556,124.59082,3.7288482,9.256257,-4.963084,-127.56963,-201.8019,12.9851055,1.4125638,-1.3084403,125.78841,900000
|
| 62 |
+
0.6483187,122.25958,0.009011689,0.0012154799,-12.365122,0.16807923,-122.14815,122.42887,3.7509563,10.321571,-0.64834744,-125.87691,-202.76593,14.072528,2.9678566,-2.6001115,140.40321,905000
|
| 63 |
+
0.6489439,119.10069,0.008961117,0.009954399,-11.389156,0.14155737,-118.998634,119.252205,8.453976,12.007688,-1.5034701,-122.3147,-199.25432,20.461662,4.565872,-4.8924956,268.87323,910000
|
| 64 |
+
0.63995427,120.2769,0.009030836,0.004367645,-12.016363,0.19290213,-120.16838,120.47417,2.9330673,11.471274,-3.8694277,-122.93245,-189.55621,14.404342,1.8233845,-1.8417668,131.72485,915000
|
| 65 |
+
0.63723844,118.721924,0.009076212,-0.0029920763,-12.829661,0.16113754,-118.60547,118.88007,4.861753,9.15174,-6.3458557,-121.92263,-193.60193,14.013493,1.1292986,-1.2244055,115.96152,920000
|
| 66 |
+
0.6484327,119.39964,0.009134948,0.0033438632,-12.133948,0.14715075,-119.2888,119.55013,4.795069,11.370532,-1.4909977,-121.53896,-198.96725,16.165602,5.176269,-4.3091927,193.72958,925000
|
| 67 |
+
0.64355636,118.65789,0.009056213,0.01024576,-11.368649,0.15799467,-118.55493,118.82613,3.299549,11.186944,-2.1969748,-121.12079,-195.13264,14.486493,1.8859658,-1.936069,122.21677,930000
|
| 68 |
+
0.6437866,118.91379,0.009137236,0.007217344,-11.710117,0.17481932,-118.806786,119.095825,4.002647,9.55947,2.8167555,-121.20066,-195.75401,13.562117,1.5318805,-1.2796526,137.35007,935000
|
| 69 |
+
0.64837974,118.85625,0.009071413,0.009312911,-11.473378,0.19926715,-118.75217,119.06483,5.0346694,15.887601,4.121621,-122.38323,-191.41768,20.92227,3.1165411,-2.9369977,294.34402,940000
|
| 70 |
+
0.64472455,126.47232,0.009166483,-0.015910095,-14.235682,0.16174683,-126.34183,126.61816,6.8243966,11.855559,-15.79392,-129.65784,-192.10088,18.679956,3.807382,-2.5643764,163.40152,945000
|
| 71 |
+
0.64496046,114.40094,0.009073888,0.0039024928,-12.069921,0.18235412,-114.29141,114.587204,4.476023,10.666323,-3.7646537,-116.83506,-201.7976,15.142345,3.6598384,-3.330017,154.28336,950000
|
| 72 |
+
0.645682,118.20758,0.008798594,0.006616516,-11.748003,0.1629672,-118.10422,118.37716,5.3422103,14.81799,-6.5057716,-120.94395,-195.5204,20.1602,5.2396717,-4.6692615,203.50403,955000
|
| 73 |
+
0.63369757,116.93909,0.008985574,0.002340296,-12.23955,0.14599863,-116.82911,117.087425,3.0614898,9.726741,-4.070353,-119.73114,-197.76974,12.788231,1.9773062,-1.2617353,111.10201,960000
|
| 74 |
+
0.64459586,118.777626,0.009016115,-0.010724651,-13.689498,0.16647708,-118.6542,118.93337,3.4700325,11.4828825,-0.22997528,-121.56573,-198.85333,14.952915,3.833399,-4.0033984,141.10706,965000
|
| 75 |
+
0.6442967,117.66928,0.009140146,-0.0002736615,-12.529941,0.1691444,-117.554756,117.83815,3.4219162,11.356181,0.18007255,-120.75474,-195.20703,14.778097,8.848051,-8.476851,204.867,970000
|
| 76 |
+
0.64540464,115.15419,0.008967323,0.006092378,-11.820602,0.14788702,-115.048195,115.308174,4.6522136,13.720438,0.8138359,-119.08605,-198.23894,18.372652,3.8114145,-3.888458,166.44426,975000
|
| 77 |
+
0.6470643,114.40196,0.009039805,0.001965595,-12.282562,0.15707147,-114.290924,114.561005,4.923786,16.705473,-1.1280168,-117.83555,-194.9676,21.62926,1.7891672,-1.5491067,196.01204,980000
|
| 78 |
+
0.64754117,115.56478,0.008944297,-0.0039106393,-12.937222,0.15714747,-115.44908,115.71802,3.0029457,9.37005,-0.50882584,-119.13,-192.77493,12.372996,2.7185116,-2.9024599,128.16049,985000
|
| 79 |
+
0.63874596,121.17827,0.008960809,-0.009602812,-13.571646,0.15379451,-121.05665,121.32246,3.1221414,10.728148,-4.8191285,-123.80271,-201.3842,13.85029,1.8158121,-1.8504375,133.22241,990000
|
| 80 |
+
0.6454062,117.05056,0.008956042,-0.0066101816,-13.23807,0.16767833,-116.93199,117.21163,4.758899,17.488749,5.338298,-120.91976,-196.3003,22.247648,3.0382419,-2.8560388,185.99777,995000
|
| 81 |
+
0.64731824,112.451416,0.008760965,0.00075338007,-12.414007,0.13154456,-112.34266,112.58372,8.1284275,9.773252,-4.9251156,-116.04305,-193.1701,17.90168,10.449256,-14.791387,166.94571,1000000
|
| 82 |
+
0.6415385,113.43013,0.008863633,0.0046134125,-11.979512,0.15292776,-113.323944,113.58768,5.5877395,11.670615,-0.73797745,-116.19031,-197.6764,17.258354,1.9099387,-2.100515,165.17464,1005000
|
| 83 |
+
0.6406224,118.62348,0.009015222,7.204777e-06,-12.499201,0.15410139,-118.5108,118.77759,3.0084012,9.1436405,-1.2859694,-120.75701,-194.61945,12.152041,0.88140893,-0.8382842,102.03757,1010000
|
| 84 |
+
0.65473694,117.18089,0.008878814,-0.0020890161,-12.735281,0.15644641,-117.067825,117.33525,3.9475312,8.235858,-4.8435917,-119.5333,-203.98254,12.18339,1.3828522,-0.933365,118.28592,1015000
|
| 85 |
+
0.64421433,117.49155,0.008670602,0.0019436369,-12.275836,0.1713018,-117.3851,117.664795,4.6867366,8.131165,-2.1649141,-120.32354,-196.46684,12.817902,0.90966547,-1.4106151,111.5549,1020000
|
| 86 |
+
0.64330924,114.57077,0.008634423,-0.0063225334,-13.232247,0.17857243,-114.45651,114.74302,5.4503846,11.879647,-0.32574785,-117.411156,-202.63498,17.330032,2.1401463,-1.9885571,168.686,1025000
|
| 87 |
+
0.6485826,112.4044,0.008814249,0.020358061,-10.190324,0.13645092,-112.31458,112.56121,3.0476525,8.479595,-3.36713,-114.95812,-192.06801,11.527247,2.6978247,-2.3827279,117.92287,1030000
|
| 88 |
+
0.6554735,118.58715,0.008526496,0.013309574,-10.9390335,0.1673339,-118.49388,118.7678,3.5174844,8.221016,-4.6501703,-120.27338,-199.64618,11.738501,1.3702745,-3.4708037,129.0237,1035000
|
| 89 |
+
0.633036,111.119705,0.008712473,-0.012938751,-13.985084,0.12545459,-110.997856,111.23222,5.3714027,12.101888,-3.867026,-115.047134,-202.09631,17.47329,3.5277996,-2.9393957,161.1915,1040000
|
| 90 |
+
0.640777,118.052185,0.008811244,-0.015225196,-14.227928,0.16139978,-117.92683,118.19836,4.349827,14.192024,-2.576127,-121.55572,-193.63931,18.541851,1.9507523,-2.3820186,162.47781,1045000
|
| 91 |
+
0.6472975,112.533264,0.008659835,0.0061951857,-11.784607,0.14986864,-112.43121,112.68933,4.9959583,11.984378,-2.633475,-114.76267,-197.88487,16.980335,2.4883854,-2.2352924,167.89854,1050000
|
| 92 |
+
0.63827443,113.466675,0.008592984,-0.0073416214,-13.354374,0.15324846,-113.35192,113.61259,4.05825,11.200887,-1.8257453,-116.93023,-193.59686,15.259136,1.9416494,-1.2063519,134.68027,1055000
|
| 93 |
+
0.6422363,111.698456,0.0087209195,-0.009334766,-13.570388,0.1417098,-111.58011,111.830826,4.0812454,12.43888,-5.621551,-114.869995,-202.29312,16.520126,4.1657343,-3.5756934,216.34358,1060000
|
| 94 |
+
0.64424145,115.002945,0.008727608,-0.007835609,-13.397796,0.15186536,-114.88602,115.14697,7.718065,10.620399,0.12972409,-117.40154,-203.41165,18.338465,2.3159292,-2.1204224,157.53412,1065000
|
| 95 |
+
0.6430882,109.730286,0.008566355,0.003785164,-12.058136,0.15722358,-109.62699,109.8913,3.9252992,17.025846,-3.1793075,-112.711845,-191.17403,20.951145,3.7029743,-4.373851,195.96883,1070000
|
| 96 |
+
0.64453286,113.31501,0.00859536,-0.008975193,-13.54419,0.14798376,-113.19859,113.454025,5.76289,14.078921,-7.0185328,-116.84789,-198.46365,19.841812,1.7990748,-2.007161,166.03069,1075000
|
| 97 |
+
0.6395069,115.98883,0.008536161,-0.008576986,-13.504783,0.16949692,-115.87355,116.14975,3.6858838,9.744466,0.58442235,-119.34639,-203.1849,13.430349,2.7388535,-3.0055685,124.05796,1080000
|
| 98 |
+
0.6403822,110.18609,0.008587385,0.0011805262,-12.362528,0.15526359,-110.079926,110.34254,3.804751,8.920447,-3.3337824,-112.99873,-201.88206,12.725199,2.0302877,-1.831586,113.27369,1085000
|
| 99 |
+
0.6467378,110.739456,0.00842496,0.013753616,-10.867516,0.12504458,-110.647896,110.87826,4.344004,20.284718,-7.0690207,-113.395164,-194.65454,24.628721,6.9020777,-6.8882017,221.74237,1090000
|
| 100 |
+
0.6404147,102.25562,0.008424615,-0.0011237228,-12.633386,0.12712602,-102.149185,102.38163,3.9435203,10.842885,7.8170795,-105.79122,-198.07872,14.786406,3.5977685,-4.390843,150.91971,1095000
|
| 101 |
+
0.6354557,105.13481,0.008491043,-0.008430958,-13.492924,0.14605631,-105.02025,105.27244,6.1955996,13.703727,-0.72251415,-107.570206,-198.51451,19.899326,2.4226484,-3.291892,183.64966,1100000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.64548874,150.8104,0.007411091,0.0018006833,-12.257029,0.18355003,-150.71957,150.99574,1.5090442,4.427874,-73.06295,-153.39738,-195.3517,5.9369183,3.287911,-3.295326,78.81692,605000
|
| 3 |
+
0.63423616,147.82486,0.0076426268,-0.018300582,-14.894541,0.18814299,-147.71103,147.9947,4.2588763,4.7889543,-47.9112,-150.74266,-192.67285,9.047831,2.5537255,-2.3811214,99.48657,610000
|
| 4 |
+
0.639863,149.47968,0.007312117,-0.0044536176,-13.109074,0.16253623,-149.38382,149.63776,1.4235862,5.0489764,-43.21124,-152.39522,-193.74557,6.472563,1.1103185,-1.2106696,65.73044,615000
|
| 5 |
+
0.63298196,147.56223,0.007908308,-0.027477149,-15.974466,0.16959476,-147.43588,147.70435,3.5900161,8.055021,-27.037195,-151.03006,-199.27751,11.645038,4.4638305,-4.987754,104.6268,620000
|
| 6 |
+
0.6469342,145.00229,0.008432505,-0.006142906,-13.228479,0.17114368,-144.89075,145.16728,1.4469994,4.977134,-66.52871,-147.77979,-200.19734,6.424134,2.8047082,-2.9369755,64.77774,625000
|
| 7 |
+
0.6472643,145.10797,0.008104044,-0.006337869,-13.282063,0.15032524,-145.00034,145.25197,2.294285,8.901448,-74.52154,-147.27081,-198.0986,11.195733,1.7084754,-1.9771442,108.10998,630000
|
| 8 |
+
0.6511408,145.14078,0.008370342,0.00048269064,-12.442333,0.17101362,-145.03664,145.31229,2.5787854,5.6908092,0.79983056,-147.7023,-197.49547,8.269594,2.8985553,-2.5658002,87.08915,635000
|
| 9 |
+
0.6374728,142.1056,0.008681536,-0.0050503006,-13.081729,0.17243233,-141.99203,142.273,6.754686,10.061877,-32.35202,-145.5514,-199.22653,16.816563,4.5398574,-5.049078,143.66249,640000
|
| 10 |
+
0.6506496,142.71524,0.008732287,0.0043611303,-12.000574,0.17827627,-142.61046,142.89789,1.8652642,6.910888,-45.194366,-145.0459,-198.23778,8.776153,3.7506757,-2.9279935,108.083725,645000
|
| 11 |
+
0.6440315,142.9573,0.00898228,-0.00015367709,-12.517109,0.21335231,-142.84486,143.1705,2.7191968,6.883962,-42.644394,-145.5739,-197.42274,9.603159,1.2063502,-1.8371133,94.4332,650000
|
| 12 |
+
0.63567984,138.0719,0.008831696,-0.014373379,-14.127477,0.21752667,-137.94714,138.27505,5.6974854,12.709803,-24.64603,-141.67342,-197.87817,18.407288,4.7303963,-3.2033749,158.51172,655000
|
| 13 |
+
0.63623804,137.46638,0.009263666,-0.013421749,-13.948859,0.20607637,-137.33716,137.65903,3.4032981,8.21361,-36.06813,-141.75467,-200.98817,11.616908,4.929565,-4.8117085,131.04234,660000
|
| 14 |
+
0.63963604,137.9961,0.009014813,-0.010593808,-13.675156,0.18530455,-137.8728,138.1708,3.2476585,7.109079,-8.5246,-140.88858,-199.55827,10.356737,2.2371557,-3.0394223,89.55348,665000
|
| 15 |
+
0.6395569,133.2652,0.009211847,-0.00073787826,-12.580101,0.18402633,-133.1493,133.44849,2.76834,9.373946,-19.889765,-136.00107,-198.4503,12.142286,1.6813269,-2.7929866,89.21693,670000
|
| 16 |
+
0.6485966,137.42767,0.009250066,0.00029897116,-12.467679,0.19743922,-137.31235,137.62541,2.389283,6.9309244,-33.421967,-140.37593,-201.18857,9.320208,2.026956,-1.9043684,87.8613,675000
|
| 17 |
+
0.63144016,137.75407,0.0094066,-0.021223987,-14.756287,0.160401,-137.61526,137.89325,4.9168634,10.215121,-20.492874,-140.98744,-200.64006,15.131985,2.0726125,-1.1277361,120.462875,680000
|
| 18 |
+
0.64020646,134.79355,0.009014654,0.0071165296,-11.71056,0.1742867,-134.68797,134.97495,4.6740317,12.454428,-8.539329,-137.54997,-199.57382,17.12846,4.7329793,-4.216344,185.3577,685000
|
| 19 |
+
0.6400877,135.00232,0.009060658,-0.0025740943,-12.784096,0.17599024,-134.88649,135.17574,3.350991,6.0773544,-8.33259,-137.62027,-203.55818,9.428346,2.7665098,-2.657054,109.92705,690000
|
| 20 |
+
0.64428806,133.97093,0.009122755,0.005186065,-11.931524,0.19546847,-133.86208,134.17159,2.4467533,7.3109775,-22.847443,-136.44743,-197.77386,9.7577305,2.4789689,-2.2731714,88.84099,695000
|
| 21 |
+
0.6358364,132.32816,0.009273592,-0.004794396,-13.016994,0.19637382,-132.20746,132.51974,2.6462228,8.906959,-7.49915,-135.56044,-202.05284,11.553182,1.6759752,-2.4750898,109.19887,700000
|
| 22 |
+
0.641631,135.57135,0.00913897,-0.005520287,-13.104038,0.19505444,-135.4516,135.76088,4.864945,13.727114,-4.7191224,-138.92064,-198.05759,18.592058,16.528944,-16.858261,241.32285,705000
|
| 23 |
+
0.63747144,130.89128,0.009281861,-0.007475043,-13.305339,0.17376587,-130.76778,131.05757,15.929665,8.838729,-28.309315,-133.51329,-198.48114,24.768394,3.0550013,-2.3479598,214.55525,710000
|
| 24 |
+
0.63731545,130.81732,0.009317149,-0.0038833304,-12.916794,0.17139229,-130.69698,130.98483,3.3586495,11.358935,1.769184,-134.70714,-196.91167,14.717585,5.336236,-6.138225,151.36894,715000
|
| 25 |
+
0.6488781,132.60677,0.009136835,0.011130899,-11.281755,0.17180052,-132.5037,132.78969,4.5275,9.924003,-19.114908,-135.4191,-201.0254,14.451503,5.203011,-3.6412268,153.43999,720000
|
| 26 |
+
0.6339715,135.63205,0.009069442,-0.025362894,-15.296522,0.14736578,-135.49333,135.75406,4.769716,11.583646,-7.742432,-138.97955,-194.85439,16.353361,1.9706419,-1.8785528,123.86465,725000
|
| 27 |
+
0.6472691,133.68213,0.009241253,0.0021044118,-12.272281,0.17676659,-133.5687,133.86101,2.9813726,8.96508,-43.672585,-137.2423,-199.53987,11.946453,4.289259,-3.8572793,113.941956,730000
|
| 28 |
+
0.6377163,133.26378,0.008962398,-0.0054894793,-13.112501,0.17783363,-133.14627,133.43613,2.862576,9.5964575,1.8333483,-136.51292,-196.37254,12.459034,6.4120765,-6.50399,154.62837,735000
|
| 29 |
+
0.65132284,130.89178,0.008833182,0.0059564942,-11.825668,0.14519161,-130.78734,131.04292,2.4271212,11.587679,-2.6682057,-134.21355,-203.25717,14.0148,2.6723654,-2.6984668,120.36099,740000
|
| 30 |
+
0.6547223,130.85564,0.009386276,0.008814278,-11.56094,0.14451587,-130.74713,131.00897,2.9675004,11.91864,-6.1773787,-133.17308,-194.92763,14.886141,4.473335,-4.6739044,143.28828,745000
|
| 31 |
+
0.6434861,132.57846,0.009218438,-0.0055969576,-13.107148,0.145913,-132.45763,132.71878,3.3122292,8.402913,-20.754156,-134.658,-200.42552,11.715142,1.0374793,-1.378666,97.07616,750000
|
| 32 |
+
0.65002954,129.66797,0.009129588,0.004979422,-11.954584,0.16181304,-129.55884,129.83476,2.349222,10.220754,-6.5027156,-132.43071,-194.83855,12.569976,3.2709618,-3.5807002,138.312,755000
|
| 33 |
+
0.65691954,130.73676,0.009181536,0.015227006,-10.841562,0.19725296,-130.6372,130.94923,4.703281,10.733401,-9.078466,-133.80426,-198.36879,15.436682,5.0775704,-3.7356696,150.82072,760000
|
| 34 |
+
0.6402673,131.39703,0.009042452,-0.011730363,-13.797255,0.18026003,-131.27228,131.56557,4.5546393,9.1648,-1.0650238,-134.56265,-200.21355,13.719439,3.5508714,-5.6338196,136.7819,765000
|
| 35 |
+
0.65127105,127.7375,0.009180651,0.017035034,-10.644464,0.16157572,-127.639786,127.916115,2.1526682,9.328837,-4.0051427,-130.26881,-197.85461,11.481505,1.6420817,-1.3943172,112.51332,770000
|
| 36 |
+
0.6432563,133.17017,0.00914138,-0.005879761,-13.143203,0.17637259,-133.05,133.34067,2.2674065,8.031833,-18.445778,-135.65042,-199.41968,10.299239,9.26328,-11.214177,149.73338,775000
|
| 37 |
+
0.6530268,129.02579,0.008986389,0.009331833,-11.461559,0.1676651,-128.92279,129.20279,2.520272,6.2087703,2.140582,-131.39546,-197.90439,8.729042,0.86676055,-1.0517943,81.686745,780000
|
| 38 |
+
0.63350284,125.86957,0.009225276,-0.02093663,-14.769485,0.19145401,-125.73332,126.040085,5.9003406,18.683432,-5.3717127,-129.31273,-194.9881,24.583773,5.1506743,-9.939047,223.73534,785000
|
| 39 |
+
0.6474864,127.1162,0.008985348,-0.0063554756,-13.207315,0.16013876,-126.99753,127.26999,4.512806,9.524898,-17.225616,-130.42265,-198.807,14.0377035,4.1561427,-3.2830482,180.8898,790000
|
| 40 |
+
0.64104253,127.81647,0.008956341,0.0007995464,-12.410728,0.16590819,-127.70532,127.98318,2.6771793,10.851982,-2.3091707,-130.50037,-197.1586,13.529161,4.252534,-4.037526,135.28267,795000
|
| 41 |
+
0.63548076,125.29637,0.009454649,-0.00980903,-13.537482,0.17146337,-125.168365,125.45802,3.7408092,9.673207,-1.389225,-129.13518,-198.72536,13.414017,5.6821203,-5.879489,162.60222,800000
|
| 42 |
+
0.63899374,127.279495,0.009020782,-0.016528634,-14.332284,0.18117389,-127.150215,127.444145,8.012087,9.635006,-5.063979,-130.98106,-196.29861,17.647093,2.5219657,-1.9213657,140.23526,805000
|
| 43 |
+
0.64677685,127.41939,0.009245198,-0.00030763957,-12.533276,0.16849852,-127.30351,127.58758,3.4464867,8.778473,0.9862002,-130.08478,-196.41269,12.224959,2.413326,-2.3847232,138.82446,810000
|
| 44 |
+
0.64065903,126.25369,0.009134617,-0.005545587,-13.107096,0.19197187,-126.13396,126.44012,2.803569,8.252367,-6.3219295,-128.96205,-201.7502,11.055936,1.3146433,-1.4739548,105.44423,815000
|
| 45 |
+
0.64454246,126.270874,0.00918372,-0.009831141,-13.570497,0.17664635,-126.14624,126.43768,3.0130792,9.440401,-3.2358665,-129.4868,-204.0863,12.45348,2.146763,-1.1137861,127.39749,820000
|
| 46 |
+
0.64130354,123.32402,0.009165368,0.004420464,-12.017699,0.18294431,-123.21387,123.51138,4.138459,11.64889,-1.6862003,-126.26951,-201.81102,15.787349,1.865061,-2.059171,158.98172,825000
|
| 47 |
+
0.64637834,125.81641,0.009112291,0.0078845285,-11.634737,0.17286256,-125.71039,125.99715,5.856348,10.683692,1.0740206,-129.04979,-201.28378,16.54004,3.195845,-3.817934,202.48907,830000
|
| 48 |
+
0.64171875,122.19771,0.009167968,-0.0062717474,-13.184093,0.17234871,-122.07684,122.363785,3.7944763,10.263959,-3.0644274,-125.36111,-195.38364,14.058435,4.6528625,-3.0885413,145.36685,835000
|
| 49 |
+
0.6504628,122.401535,0.009196626,0.01302639,-11.083569,0.18059237,-122.29961,122.59515,4.627168,9.75995,1.8155544,-125.49221,-204.72063,14.387117,0.9990605,-2.5302176,128.31845,840000
|
| 50 |
+
0.64520234,125.32684,0.0090018315,-0.013717574,-14.023865,0.1582903,-125.20061,125.47141,3.0980787,8.542325,-13.051948,-128.40956,-202.07146,11.640404,3.8898757,-4.3408732,124.64845,845000
|
| 51 |
+
0.63875604,114.513214,0.009333949,0.0069309403,-11.757448,0.1563901,-114.40348,114.67653,5.88703,11.777609,-5.403043,-118.07809,-201.68835,17.664639,3.1603963,-2.318939,161.62549,850000
|
| 52 |
+
0.65294385,129.08485,0.009076337,0.013357946,-11.028267,0.16223311,-128.98476,129.26044,4.2800765,10.5362215,-4.1386614,-132.07788,-199.70778,14.816298,4.888151,-6.351162,190.76434,855000
|
| 53 |
+
0.6455894,123.8411,0.009124527,-0.0058215046,-13.138006,0.17406857,-123.72123,124.00935,4.873342,10.267796,2.473476,-127.057884,-201.75064,15.141138,2.4737313,-2.397577,147.68564,860000
|
| 54 |
+
0.6344453,122.76438,0.009071885,-0.001893875,-12.708763,0.16047941,-122.649086,122.922966,4.1681647,11.218053,-5.9951468,-126.31189,-199.79445,15.386217,3.1480517,-4.94325,164.71046,865000
|
| 55 |
+
0.63795453,123.594086,0.009235439,-0.0045989063,-12.997963,0.13446747,-123.47405,123.72395,3.2970989,11.840903,-0.17041,-126.25713,-202.18724,15.138002,6.957887,-7.564168,215.81961,870000
|
| 56 |
+
0.63864315,120.118866,0.009210995,-0.007063658,-13.266872,0.1602009,-119.99667,120.272,4.5095067,10.843558,-1.8745737,-123.236084,-200.16522,15.3530655,2.0017357,-2.2630987,149.66716,875000
|
| 57 |
+
0.6359637,122.25983,0.009252929,-0.0012322844,-12.633178,0.17291602,-122.14293,122.4315,5.2595115,13.089539,-3.086068,-126.13259,-196.95357,18.34905,1.2724829,-1.1992205,154.65877,880000
|
| 58 |
+
0.6389341,120.109955,0.0091346735,0.002109142,-12.269106,0.122403264,-119.99788,120.23447,3.0179207,7.7200465,-9.786167,-122.49385,-200.29872,10.7379675,1.2558672,-1.3635117,111.45168,885000
|
| 59 |
+
0.6366698,114.80873,0.009273885,-0.005594679,-13.103272,0.14845562,-114.68721,114.95159,18.624197,14.464503,-6.539571,-118.15574,-201.17245,33.0887,2.1601722,-3.1501546,211.17096,890000
|
| 60 |
+
0.637873,117.059975,0.00916664,0.008028765,-11.624132,0.15113187,-116.95343,117.21913,3.3696008,9.533362,1.7814546,-119.80444,-202.93019,12.902964,1.1460733,-1.0049744,116.964355,895000
|
| 61 |
+
0.64138305,124.40807,0.009077662,-5.2921052e-05,-12.50583,0.18280141,-124.294556,124.59082,3.7288482,9.256257,-4.963084,-127.56963,-201.8019,12.9851055,1.4125638,-1.3084403,125.78841,900000
|
| 62 |
+
0.6483187,122.25958,0.009011689,0.0012154799,-12.365122,0.16807923,-122.14815,122.42887,3.7509563,10.321571,-0.64834744,-125.87691,-202.76593,14.072528,2.9678566,-2.6001115,140.40321,905000
|
| 63 |
+
0.6489439,119.10069,0.008961117,0.009954399,-11.389156,0.14155737,-118.998634,119.252205,8.453976,12.007688,-1.5034701,-122.3147,-199.25432,20.461662,4.565872,-4.8924956,268.87323,910000
|
| 64 |
+
0.63995427,120.2769,0.009030836,0.004367645,-12.016363,0.19290213,-120.16838,120.47417,2.9330673,11.471274,-3.8694277,-122.93245,-189.55621,14.404342,1.8233845,-1.8417668,131.72485,915000
|
| 65 |
+
0.63723844,118.721924,0.009076212,-0.0029920763,-12.829661,0.16113754,-118.60547,118.88007,4.861753,9.15174,-6.3458557,-121.92263,-193.60193,14.013493,1.1292986,-1.2244055,115.96152,920000
|
| 66 |
+
0.6484327,119.39964,0.009134948,0.0033438632,-12.133948,0.14715075,-119.2888,119.55013,4.795069,11.370532,-1.4909977,-121.53896,-198.96725,16.165602,5.176269,-4.3091927,193.72958,925000
|
| 67 |
+
0.64355636,118.65789,0.009056213,0.01024576,-11.368649,0.15799467,-118.55493,118.82613,3.299549,11.186944,-2.1969748,-121.12079,-195.13264,14.486493,1.8859658,-1.936069,122.21677,930000
|
| 68 |
+
0.6437866,118.91379,0.009137236,0.007217344,-11.710117,0.17481932,-118.806786,119.095825,4.002647,9.55947,2.8167555,-121.20066,-195.75401,13.562117,1.5318805,-1.2796526,137.35007,935000
|
| 69 |
+
0.64837974,118.85625,0.009071413,0.009312911,-11.473378,0.19926715,-118.75217,119.06483,5.0346694,15.887601,4.121621,-122.38323,-191.41768,20.92227,3.1165411,-2.9369977,294.34402,940000
|
| 70 |
+
0.64472455,126.47232,0.009166483,-0.015910095,-14.235682,0.16174683,-126.34183,126.61816,6.8243966,11.855559,-15.79392,-129.65784,-192.10088,18.679956,3.807382,-2.5643764,163.40152,945000
|
| 71 |
+
0.64496046,114.40094,0.009073888,0.0039024928,-12.069921,0.18235412,-114.29141,114.587204,4.476023,10.666323,-3.7646537,-116.83506,-201.7976,15.142345,3.6598384,-3.330017,154.28336,950000
|
| 72 |
+
0.645682,118.20758,0.008798594,0.006616516,-11.748003,0.1629672,-118.10422,118.37716,5.3422103,14.81799,-6.5057716,-120.94395,-195.5204,20.1602,5.2396717,-4.6692615,203.50403,955000
|
| 73 |
+
0.63369757,116.93909,0.008985574,0.002340296,-12.23955,0.14599863,-116.82911,117.087425,3.0614898,9.726741,-4.070353,-119.73114,-197.76974,12.788231,1.9773062,-1.2617353,111.10201,960000
|
| 74 |
+
0.64459586,118.777626,0.009016115,-0.010724651,-13.689498,0.16647708,-118.6542,118.93337,3.4700325,11.4828825,-0.22997528,-121.56573,-198.85333,14.952915,3.833399,-4.0033984,141.10706,965000
|
| 75 |
+
0.6442967,117.66928,0.009140146,-0.0002736615,-12.529941,0.1691444,-117.554756,117.83815,3.4219162,11.356181,0.18007255,-120.75474,-195.20703,14.778097,8.848051,-8.476851,204.867,970000
|
| 76 |
+
0.64540464,115.15419,0.008967323,0.006092378,-11.820602,0.14788702,-115.048195,115.308174,4.6522136,13.720438,0.8138359,-119.08605,-198.23894,18.372652,3.8114145,-3.888458,166.44426,975000
|
| 77 |
+
0.6470643,114.40196,0.009039805,0.001965595,-12.282562,0.15707147,-114.290924,114.561005,4.923786,16.705473,-1.1280168,-117.83555,-194.9676,21.62926,1.7891672,-1.5491067,196.01204,980000
|
| 78 |
+
0.64754117,115.56478,0.008944297,-0.0039106393,-12.937222,0.15714747,-115.44908,115.71802,3.0029457,9.37005,-0.50882584,-119.13,-192.77493,12.372996,2.7185116,-2.9024599,128.16049,985000
|
| 79 |
+
0.63874596,121.17827,0.008960809,-0.009602812,-13.571646,0.15379451,-121.05665,121.32246,3.1221414,10.728148,-4.8191285,-123.80271,-201.3842,13.85029,1.8158121,-1.8504375,133.22241,990000
|
| 80 |
+
0.6454062,117.05056,0.008956042,-0.0066101816,-13.23807,0.16767833,-116.93199,117.21163,4.758899,17.488749,5.338298,-120.91976,-196.3003,22.247648,3.0382419,-2.8560388,185.99777,995000
|
| 81 |
+
0.64731824,112.451416,0.008760965,0.00075338007,-12.414007,0.13154456,-112.34266,112.58372,8.1284275,9.773252,-4.9251156,-116.04305,-193.1701,17.90168,10.449256,-14.791387,166.94571,1000000
|
| 82 |
+
0.6415385,113.43013,0.008863633,0.0046134125,-11.979512,0.15292776,-113.323944,113.58768,5.5877395,11.670615,-0.73797745,-116.19031,-197.6764,17.258354,1.9099387,-2.100515,165.17464,1005000
|
| 83 |
+
0.6406224,118.62348,0.009015222,7.204777e-06,-12.499201,0.15410139,-118.5108,118.77759,3.0084012,9.1436405,-1.2859694,-120.75701,-194.61945,12.152041,0.88140893,-0.8382842,102.03757,1010000
|
| 84 |
+
0.65473694,117.18089,0.008878814,-0.0020890161,-12.735281,0.15644641,-117.067825,117.33525,3.9475312,8.235858,-4.8435917,-119.5333,-203.98254,12.18339,1.3828522,-0.933365,118.28592,1015000
|
| 85 |
+
0.64421433,117.49155,0.008670602,0.0019436369,-12.275836,0.1713018,-117.3851,117.664795,4.6867366,8.131165,-2.1649141,-120.32354,-196.46684,12.817902,0.90966547,-1.4106151,111.5549,1020000
|
| 86 |
+
0.64330924,114.57077,0.008634423,-0.0063225334,-13.232247,0.17857243,-114.45651,114.74302,5.4503846,11.879647,-0.32574785,-117.411156,-202.63498,17.330032,2.1401463,-1.9885571,168.686,1025000
|
| 87 |
+
0.6485826,112.4044,0.008814249,0.020358061,-10.190324,0.13645092,-112.31458,112.56121,3.0476525,8.479595,-3.36713,-114.95812,-192.06801,11.527247,2.6978247,-2.3827279,117.92287,1030000
|
| 88 |
+
0.6554735,118.58715,0.008526496,0.013309574,-10.9390335,0.1673339,-118.49388,118.7678,3.5174844,8.221016,-4.6501703,-120.27338,-199.64618,11.738501,1.3702745,-3.4708037,129.0237,1035000
|
| 89 |
+
0.633036,111.119705,0.008712473,-0.012938751,-13.985084,0.12545459,-110.997856,111.23222,5.3714027,12.101888,-3.867026,-115.047134,-202.09631,17.47329,3.5277996,-2.9393957,161.1915,1040000
|
| 90 |
+
0.640777,118.052185,0.008811244,-0.015225196,-14.227928,0.16139978,-117.92683,118.19836,4.349827,14.192024,-2.576127,-121.55572,-193.63931,18.541851,1.9507523,-2.3820186,162.47781,1045000
|
| 91 |
+
0.6472975,112.533264,0.008659835,0.0061951857,-11.784607,0.14986864,-112.43121,112.68933,4.9959583,11.984378,-2.633475,-114.76267,-197.88487,16.980335,2.4883854,-2.2352924,167.89854,1050000
|
| 92 |
+
0.63827443,113.466675,0.008592984,-0.0073416214,-13.354374,0.15324846,-113.35192,113.61259,4.05825,11.200887,-1.8257453,-116.93023,-193.59686,15.259136,1.9416494,-1.2063519,134.68027,1055000
|
| 93 |
+
0.6422363,111.698456,0.0087209195,-0.009334766,-13.570388,0.1417098,-111.58011,111.830826,4.0812454,12.43888,-5.621551,-114.869995,-202.29312,16.520126,4.1657343,-3.5756934,216.34358,1060000
|
| 94 |
+
0.64424145,115.002945,0.008727608,-0.007835609,-13.397796,0.15186536,-114.88602,115.14697,7.718065,10.620399,0.12972409,-117.40154,-203.41165,18.338465,2.3159292,-2.1204224,157.53412,1065000
|
| 95 |
+
0.6430882,109.730286,0.008566355,0.003785164,-12.058136,0.15722358,-109.62699,109.8913,3.9252992,17.025846,-3.1793075,-112.711845,-191.17403,20.951145,3.7029743,-4.373851,195.96883,1070000
|
| 96 |
+
0.64453286,113.31501,0.00859536,-0.008975193,-13.54419,0.14798376,-113.19859,113.454025,5.76289,14.078921,-7.0185328,-116.84789,-198.46365,19.841812,1.7990748,-2.007161,166.03069,1075000
|
| 97 |
+
0.6395069,115.98883,0.008536161,-0.008576986,-13.504783,0.16949692,-115.87355,116.14975,3.6858838,9.744466,0.58442235,-119.34639,-203.1849,13.430349,2.7388535,-3.0055685,124.05796,1080000
|
| 98 |
+
0.6403822,110.18609,0.008587385,0.0011805262,-12.362528,0.15526359,-110.079926,110.34254,3.804751,8.920447,-3.3337824,-112.99873,-201.88206,12.725199,2.0302877,-1.831586,113.27369,1085000
|
| 99 |
+
0.6467378,110.739456,0.00842496,0.013753616,-10.867516,0.12504458,-110.647896,110.87826,4.344004,20.284718,-7.0690207,-113.395164,-194.65454,24.628721,6.9020777,-6.8882017,221.74237,1090000
|
| 100 |
+
0.6404147,102.25562,0.008424615,-0.0011237228,-12.633386,0.12712602,-102.149185,102.38163,3.9435203,10.842885,7.8170795,-105.79122,-198.07872,14.786406,3.5977685,-4.390843,150.91971,1095000
|
| 101 |
+
0.6354557,105.13481,0.008491043,-0.008430958,-13.492924,0.14605631,-105.02025,105.27244,6.1955996,13.703727,-0.72251415,-107.570206,-198.51451,19.899326,2.4226484,-3.291892,183.64966,1100000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d092fad2e28f990ad923fc25f6cf96e9f979583433f1aecca7b908f2729a9ab9
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7352a402a73759b0b617217265d95452a5dbc0aa73ceffbafd749b3dd40c5c19
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d34060b15c46b12596e20e49e6b9560bed5a09c86415fd695bc0149474bc7bb
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be93fce5cdafa9e70314a6facae9247a69c868c1edb23de071cf4327be2bfa5c
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc39935326b1b3c5dcd2801106636035af0d3094aa3ea16c651be37e45d4c708
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:990a01686ae0a046b620fb24386a46193b5ce2a7b3f60ec1f922b2570acc0289
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:506257e273cbe06a2c4488ac86ce4c89ef5d4f8b509b15106cec859656639f2a
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b1072536bf4f34b33e536de1fe301f3de20bec3217c8e0d7e7cfa72c47153c00
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1e56c2984cd3097a0a5d902ae6c06777754779b5e2409e9148c678e5b6cc35d
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4cb1b32c5c5f5866e2f87cf1892edca722b2ac89bf35805acdd1454162599dd0
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260318_180457/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/1d2bf09z
|