Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1150000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1200000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1250000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1300000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.0037141819402860513,-0.009289666404831093,-0.0034901066756813388,-0.016999899443163036,29.95688333980875,8.420999999999397,0.88,3915.44,-0.22,-255.48,166.42,0.5122157192230224,850000
|
| 3 |
+
0.0,0.0,-0.02658017874024795,0.046486118340035264,-0.024917546389204712,0.019864161811453465,33.82047865722125,6.303999999999486,0.88,11723.44,-0.16,-202.78,124.08,0.39333457469940186,900000
|
| 4 |
+
0.0,0.0,-0.04197597927671605,0.056187300576824466,-0.03913382518229806,0.0455235340605454,34.2417699365257,5.427999999999692,0.94,17627.9,-0.08,-150.06,106.56,0.33767960548400877,950000
|
| 5 |
+
0.0,0.0,-0.021750175747535384,0.051829630244757126,-0.017914033468986613,0.0724665683540855,35.034315037742985,3.346999999999843,0.98,22633.9,-0.04,-101.72,64.94,0.21160626411437988,1000000
|
| 6 |
+
0.0,0.0,-0.025794843796654365,0.05589373991454091,-0.02286788870067844,0.05027851675338094,35.092480262648984,3.3319999999998777,0.98,25891.64,-0.02,-90.42,64.64,0.21178954124450683,1050000
|
| 7 |
+
0.0,0.0,-0.032187042773301804,0.0544784425440621,-0.027843778158183435,0.05528217541841143,35.36108935273834,2.947999999999887,0.98,28813.42,-0.02,-78.68,56.96,0.19253294467926024,1100000
|
| 8 |
+
0.0,0.0,-0.043726193858877646,0.05492452542655791,-0.039622267185384176,0.05168214281144776,34.87713305226147,2.982999999999994,1.0,32272.1,0.0,-83.46,57.66,0.18976866722106933,1150000
|
| 9 |
+
0.0,0.0,-0.030863250085507263,0.03285654907643072,-0.027995632740576135,0.03973955857695757,35.52488315508173,2.615999999999933,1.0,35126.06,0.0,-74.22,50.32,0.16743730068206786,1200000
|
| 10 |
+
0.0,0.0,-0.03771843582007817,0.058275073658081517,-0.03362099612239974,0.04850245855705484,35.47649560288758,2.410999999999956,1.0,37646.76,0.0,-67.74,46.22,0.1603921604156494,1250000
|
| 11 |
+
0.0,0.0,-0.04037502866839213,0.06706707377473228,-0.03641735791310133,0.06655941541558974,35.56324940651917,3.3609999999998315,0.96,40734.28,-0.06,-100.74,65.22,0.2126008701324463,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.0037141819402860513,-0.009289666404831093,-0.0034901066756813388,-0.016999899443163036,29.95688333980875,8.420999999999397,0.88,3915.44,-0.22,-255.48,166.42,0.5122157192230224,850000
|
| 3 |
+
0.0,0.0,-0.02658017874024795,0.046486118340035264,-0.024917546389204712,0.019864161811453465,33.82047865722125,6.303999999999486,0.88,11723.44,-0.16,-202.78,124.08,0.39333457469940186,900000
|
| 4 |
+
0.0,0.0,-0.04197597927671605,0.056187300576824466,-0.03913382518229806,0.0455235340605454,34.2417699365257,5.427999999999692,0.94,17627.9,-0.08,-150.06,106.56,0.33767960548400877,950000
|
| 5 |
+
0.0,0.0,-0.021750175747535384,0.051829630244757126,-0.017914033468986613,0.0724665683540855,35.034315037742985,3.346999999999843,0.98,22633.9,-0.04,-101.72,64.94,0.21160626411437988,1000000
|
| 6 |
+
0.0,0.0,-0.025794843796654365,0.05589373991454091,-0.02286788870067844,0.05027851675338094,35.092480262648984,3.3319999999998777,0.98,25891.64,-0.02,-90.42,64.64,0.21178954124450683,1050000
|
| 7 |
+
0.0,0.0,-0.032187042773301804,0.0544784425440621,-0.027843778158183435,0.05528217541841143,35.36108935273834,2.947999999999887,0.98,28813.42,-0.02,-78.68,56.96,0.19253294467926024,1100000
|
| 8 |
+
0.0,0.0,-0.043726193858877646,0.05492452542655791,-0.039622267185384176,0.05168214281144776,34.87713305226147,2.982999999999994,1.0,32272.1,0.0,-83.46,57.66,0.18976866722106933,1150000
|
| 9 |
+
0.0,0.0,-0.030863250085507263,0.03285654907643072,-0.027995632740576135,0.03973955857695757,35.52488315508173,2.615999999999933,1.0,35126.06,0.0,-74.22,50.32,0.16743730068206786,1200000
|
| 10 |
+
0.0,0.0,-0.03771843582007817,0.058275073658081517,-0.03362099612239974,0.04850245855705484,35.47649560288758,2.410999999999956,1.0,37646.76,0.0,-67.74,46.22,0.1603921604156494,1250000
|
| 11 |
+
0.0,0.0,-0.04037502866839213,0.06706707377473228,-0.03641735791310133,0.06655941541558974,35.56324940651917,3.3609999999998315,0.96,40734.28,-0.06,-100.74,65.22,0.2126008701324463,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,0.9999999,0.02410361,2.4103608,1.0241035,1.9091374,-23.43616,-105.48879,-183.12996,0.3193689,-0.26776817,14.730891,805000
|
| 3 |
+
1.0,1.0,0.02380301,2.380301,1.023803,0.63779444,-19.59643,-103.25744,-178.30934,0.17955501,-0.20740387,9.6517935,810000
|
| 4 |
+
1.0,1.0,0.021237172,2.1237173,1.0212371,0.6028103,-29.289673,-107.38372,-177.52257,0.067119695,-0.10765349,6.445495,815000
|
| 5 |
+
1.0,1.0,0.021798328,2.1798327,1.0217984,1.0461649,-19.682823,-108.66001,-191.23906,0.12859859,-0.17938888,10.883982,820000
|
| 6 |
+
1.0,1.0,0.021467896,2.1467896,1.0214679,1.0746031,-45.20725,-108.43286,-187.32812,0.17011768,-0.20696712,12.279442,825000
|
| 7 |
+
1.0,1.0000001,0.021989597,2.19896,1.0219897,1.2194186,-28.921995,-107.67217,-194.63306,0.3559876,-0.34644085,18.425617,830000
|
| 8 |
+
1.0,1.0,0.023784399,2.3784401,1.0237844,1.0930882,-3.1446528,-105.84029,-183.90959,0.5489834,-0.70402634,21.732082,835000
|
| 9 |
+
1.0,1.0,0.022845447,2.2845447,1.0228455,1.1617107,-20.739492,-105.533035,-195.2949,0.2514022,-0.27630228,15.18858,840000
|
| 10 |
+
1.0,1.0,0.02214571,2.2145712,1.0221457,1.0246687,-12.891713,-104.629654,-204.23555,0.29006028,-0.1701543,14.682644,845000
|
| 11 |
+
1.0,1.0,0.026822837,2.6822839,1.0268228,1.5776218,-27.90459,-103.158936,-177.78853,0.43840292,-0.36219645,25.57153,850000
|
| 12 |
+
1.0,1.0,0.02487234,2.4872344,1.0248723,1.8112202,-6.64865,-100.07806,-186.64462,0.30563253,-0.380165,22.543392,855000
|
| 13 |
+
1.0,1.0,0.025530342,2.5530343,1.0255303,1.8197628,-11.423798,-98.85901,-197.05936,0.42484275,-0.38403285,21.27657,860000
|
| 14 |
+
1.0,0.99999994,0.025199259,2.519926,1.0251992,1.3544217,-14.683274,-96.66158,-196.8271,0.5492832,-0.43808,24.157415,865000
|
| 15 |
+
1.0,1.0,0.025838764,2.5838766,1.0258387,1.0243921,-9.718414,-94.69698,-203.35918,0.1120887,-0.16515662,10.502487,870000
|
| 16 |
+
1.0,0.9999999,0.026386408,2.6386406,1.0263863,1.8566955,-5.803877,-98.53196,-202.72218,0.288699,-0.30139923,17.357609,875000
|
| 17 |
+
1.0,0.9999999,0.026414484,2.6414485,1.0264144,1.3589294,-5.9641685,-99.2282,-198.88034,0.32935855,-0.3784812,15.693888,880000
|
| 18 |
+
1.0,1.0,0.02575148,2.575148,1.0257515,1.794418,-16.33981,-98.48187,-196.0891,0.2273706,-0.28211713,19.674442,885000
|
| 19 |
+
1.0,1.0,0.026709914,2.6709914,1.0267099,1.3998841,-17.18051,-97.0176,-198.82697,0.23145735,-0.21120808,15.720755,890000
|
| 20 |
+
1.0,0.9999888,0.02622561,2.622561,1.0262144,1.2723486,2.7037196,-97.409485,-198.91637,0.30216652,-0.1645944,16.31403,895000
|
| 21 |
+
1.0,1.0000001,0.026585024,2.6585026,1.0265851,1.2911261,-6.8098044,-91.00967,-174.95529,0.2362828,-0.18194292,15.0081215,900000
|
| 22 |
+
1.0,1.0,0.026594447,2.6594448,1.0265944,1.1429278,-4.050094,-95.38822,-202.42056,0.1419669,-0.1704781,13.195405,905000
|
| 23 |
+
1.0,1.0,0.026483906,2.6483908,1.0264839,0.97905505,1.2121545,-94.06665,-184.30733,0.10747885,-0.19091994,11.711199,910000
|
| 24 |
+
1.0,0.9999942,0.02572804,2.572804,1.0257223,1.1595924,1.5111568,-92.30213,-187.41649,0.12882903,-0.29800177,13.06944,915000
|
| 25 |
+
1.0,0.9999999,0.02692746,2.6927462,1.0269274,1.2043654,-4.751182,-90.24686,-162.6774,0.28412586,-0.26157898,15.384199,920000
|
| 26 |
+
1.0,1.0,0.0268546,2.68546,1.0268546,1.0888764,-1.7485965,-90.94399,-193.85298,0.24317265,-0.1228862,13.895265,925000
|
| 27 |
+
1.0,1.0,0.02812236,2.812236,1.0281223,4.518034,-13.943093,-93.157814,-186.87042,1.9493235,-1.6208564,51.138176,930000
|
| 28 |
+
1.0,0.99994934,0.026854776,2.6854777,1.0268041,1.4749054,2.3279257,-91.032906,-200.07137,0.6845144,-0.4231808,19.631756,935000
|
| 29 |
+
1.0,1.0,0.028163737,2.8163738,1.0281638,1.838271,1.5905452,-90.0653,-187.4637,0.22870138,-0.3578775,23.080559,940000
|
| 30 |
+
1.0,1.0,0.027880792,2.7880793,1.0278808,1.2045025,1.9804647,-89.935265,-198.53224,0.38935673,-0.1583278,15.457857,945000
|
| 31 |
+
1.0,1.0,0.0278222,2.7822201,1.0278223,1.5444173,-7.8328266,-91.02927,-201.11586,1.0994151,-1.0327189,25.87619,950000
|
| 32 |
+
1.0,0.99999994,0.025508858,2.5508862,1.0255088,3.6661155,-9.278952,-89.51774,-171.5341,0.8341637,-0.55734116,39.27726,955000
|
| 33 |
+
1.0,1.0,0.027337873,2.7337875,1.0273379,1.3344606,-5.0243726,-92.6448,-201.80017,0.26704118,-0.30315393,16.471146,960000
|
| 34 |
+
1.0,1.0,0.025625892,2.5625892,1.025626,1.4673868,-0.57178795,-87.42965,-179.18938,0.17463446,-0.17264393,15.3209305,965000
|
| 35 |
+
1.0,0.99999994,0.028759431,2.8759432,1.0287594,1.3849434,-4.4453197,-89.08459,-200.34576,0.19579662,-0.29231024,21.097317,970000
|
| 36 |
+
1.0,1.0,0.027680473,2.7680473,1.0276805,0.94592,-5.615648,-92.13196,-196.51187,0.17338726,-0.12570286,11.878268,975000
|
| 37 |
+
1.0,0.9999543,0.026159452,2.6159453,1.0261137,3.8358307,1.3802553,-88.78031,-199.75237,4.244095,-4.2476616,100.88022,980000
|
| 38 |
+
1.0,0.99999994,0.029272322,2.9272323,1.0292723,0.98873484,0.29833764,-87.59891,-191.22249,0.17490108,-0.50172913,14.716304,985000
|
| 39 |
+
1.0,1.0,0.027006544,2.7006545,1.0270065,1.478874,-5.2570996,-88.1299,-202.8943,0.19663839,-0.42494738,23.0531,990000
|
| 40 |
+
1.0,1.0,0.027398303,2.73983,1.0273983,1.3263129,-7.3087096,-88.00531,-202.00954,0.20980613,-0.106129535,12.981856,995000
|
| 41 |
+
1.0,0.9999999,0.02758297,2.758297,1.0275829,1.156066,2.0123827,-85.99822,-202.29607,0.20731233,-0.27509582,15.95223,1000000
|
| 42 |
+
1.0,0.99999994,0.02840494,2.8404942,1.0284048,1.1819504,-2.949977,-85.01765,-197.52666,0.28943932,-0.21426341,15.668646,1005000
|
| 43 |
+
1.0,1.0,0.029072225,2.9072225,1.0290723,1.2035801,-5.5902543,-87.78769,-169.65141,0.25580984,-0.12875043,14.730901,1010000
|
| 44 |
+
1.0,1.0,0.03051268,3.051268,1.0305127,1.5635412,-6.253939,-87.56074,-191.10498,0.24542692,-0.17928849,16.90411,1015000
|
| 45 |
+
1.0,1.0,0.027650677,2.7650676,1.0276507,1.1588738,-3.5886083,-84.179634,-194.71281,0.291935,-0.39546272,19.399126,1020000
|
| 46 |
+
1.0,0.9999999,0.029216282,2.921628,1.0292162,0.9481535,-2.66734,-81.281334,-162.45715,0.14313228,-0.17854276,11.602129,1025000
|
| 47 |
+
1.0,0.99999994,0.03013879,3.013879,1.0301387,1.1779976,0.12067218,-86.52738,-169.82628,0.14696845,-0.17708358,12.521473,1030000
|
| 48 |
+
1.0,1.0,0.028147578,2.8147578,1.0281476,1.874497,-3.753836,-81.959015,-174.15164,1.1648431,-1.0007125,36.18038,1035000
|
| 49 |
+
1.0,1.0,0.028468922,2.8468924,1.028469,1.2965643,1.53752,-85.57175,-188.52634,0.23975125,-0.18645357,16.854118,1040000
|
| 50 |
+
1.0,1.0,0.031447463,3.1447463,1.0314474,1.2081183,-1.688546,-85.07387,-177.73816,0.20183364,-0.24944961,15.6082,1045000
|
| 51 |
+
1.0,1.0,0.026308257,2.6308255,1.0263083,1.7783566,-2.1014814,-79.8583,-190.85182,0.7923367,-0.7265445,28.220688,1050000
|
| 52 |
+
1.0,1.0,0.028486082,2.8486083,1.0284861,1.1333393,-0.15658858,-86.24452,-190.41249,0.14912944,-0.3790294,16.48212,1055000
|
| 53 |
+
1.0,1.0,0.02872777,2.872777,1.0287278,1.2299031,0.92720354,-80.925224,-191.72128,0.37867957,-0.2589805,15.436908,1060000
|
| 54 |
+
1.0,1.0,0.02957786,2.957786,1.0295779,1.08959,-4.9060955,-84.02163,-201.15358,0.26207647,-0.13344666,12.699772,1065000
|
| 55 |
+
1.0,1.0,0.028453149,2.845315,1.0284531,1.0091734,-2.4246533,-81.91949,-164.98116,0.1869911,-0.22520712,11.340364,1070000
|
| 56 |
+
1.0,1.0,0.026629947,2.6629946,1.0266299,1.3216813,-2.9514027,-83.30842,-203.57175,0.24107005,-0.33764654,17.410635,1075000
|
| 57 |
+
1.0,1.0,0.028455796,2.8455796,1.0284559,1.2046213,-8.961839,-83.774414,-190.82774,0.12978865,-0.3406704,13.700312,1080000
|
| 58 |
+
1.0,1.0,0.028488662,2.848866,1.0284886,1.2936741,-1.1913927,-79.097374,-158.88066,0.18888363,-0.2508616,14.776207,1085000
|
| 59 |
+
1.0,1.0,0.02846583,2.8465831,1.0284659,1.3511019,-1.1688342,-78.458145,-191.40349,0.38997006,-0.3957321,17.081982,1090000
|
| 60 |
+
1.0,0.99999994,0.028188035,2.8188038,1.028188,1.1219037,0.89476395,-77.98512,-177.16919,0.16934058,-0.23914768,14.945656,1095000
|
| 61 |
+
1.0,1.0,0.02676082,2.6760821,1.0267608,0.9075324,-4.5654683,-82.61029,-172.79932,0.10339762,-0.13725029,9.866718,1100000
|
| 62 |
+
1.0,1.0000001,0.030250352,3.0250351,1.0302504,2.6628182,-2.9716854,-83.00551,-177.32939,0.596265,-0.7174866,26.92434,1105000
|
| 63 |
+
1.0,1.0,0.03213961,3.2139611,1.0321397,1.1516432,-3.5491974,-79.270325,-191.36688,0.8391836,-0.8282829,18.952702,1110000
|
| 64 |
+
1.0,0.9999998,0.02807482,2.8074822,1.0280746,1.1628659,-4.4387555,-79.92703,-163.53581,0.16011095,-0.2888382,16.356178,1115000
|
| 65 |
+
1.0,1.0,0.028499074,2.8499076,1.0284991,1.3380702,-1.7178695,-80.566505,-183.29852,0.30179745,-0.22225456,16.128666,1120000
|
| 66 |
+
1.0,0.9999999,0.030178145,3.0178146,1.0301781,0.89896435,-1.9377646,-78.30114,-167.58029,0.15899986,-0.18136847,11.935469,1125000
|
| 67 |
+
1.0,1.0,0.02781725,2.781725,1.0278172,1.29538,2.6289089,-74.859764,-182.39056,0.22651467,-0.24372941,16.315674,1130000
|
| 68 |
+
1.0,1.0,0.030926492,3.0926492,1.0309265,1.716401,-0.23301135,-76.810875,-200.80482,0.39863804,-0.33516392,24.925766,1135000
|
| 69 |
+
1.0,0.9999999,0.030366203,3.0366206,1.0303661,1.2152563,-2.468185,-78.17031,-170.4856,0.31099916,-0.29580683,15.880432,1140000
|
| 70 |
+
1.0,0.9999999,0.030128393,3.0128396,1.0301282,0.8468012,-2.0958297,-82.2239,-184.58897,0.14410515,-0.21615106,11.852083,1145000
|
| 71 |
+
1.0,0.99999994,0.027594794,2.7594795,1.0275947,1.680952,0.35136867,-74.69525,-183.61014,0.6418698,-0.72181183,26.003872,1150000
|
| 72 |
+
1.0,1.0,0.03006816,3.006816,1.0300682,0.924746,-0.25669122,-80.83091,-174.65176,0.34838358,-0.15688168,12.000358,1155000
|
| 73 |
+
1.0,1.0,0.028254047,2.8254046,1.028254,1.466363,1.1734523,-74.56835,-195.79265,0.24552226,-0.2584075,19.539204,1160000
|
| 74 |
+
1.0,1.0,0.02859028,2.8590283,1.0285903,1.0310937,-0.20960355,-78.48393,-182.68034,0.25074357,-0.14760591,13.582213,1165000
|
| 75 |
+
1.0,1.0,0.029276432,2.9276433,1.0292765,1.0159237,-5.6357927,-77.24181,-177.89029,0.14679231,-0.5055061,14.373636,1170000
|
| 76 |
+
1.0,1.0,0.028866805,2.8866806,1.0288668,1.2225064,0.6839527,-74.79818,-198.15187,0.29366404,-0.31396753,17.150095,1175000
|
| 77 |
+
1.0,1.0,0.02713696,2.7136958,1.0271369,1.6237978,-1.2452569,-77.52636,-178.07689,0.37828296,-0.37598723,16.76959,1180000
|
| 78 |
+
1.0,1.0,0.028936177,2.8936179,1.0289361,0.7920421,1.2362982,-76.67555,-181.70906,0.110951714,-0.20024571,10.141432,1185000
|
| 79 |
+
1.0,1.0,0.03239873,3.2398734,1.0323987,0.9608206,-3.8412406,-80.61489,-177.72766,0.23019694,-0.39168304,16.526571,1190000
|
| 80 |
+
1.0,1.0,0.030598074,3.0598075,1.030598,1.202679,-4.773767,-78.36965,-161.75505,0.24627611,-0.37814817,17.769703,1195000
|
| 81 |
+
1.0,1.0000001,0.028449062,2.8449063,1.0284492,1.0357367,-1.0556793,-75.887566,-185.10309,0.24589923,-0.21604285,14.169531,1200000
|
| 82 |
+
1.0,1.0,0.030330122,3.0330124,1.0303302,0.9415167,-0.4582742,-77.47803,-173.94662,0.29593295,-0.26257968,13.230233,1205000
|
| 83 |
+
1.0,1.0,0.02906382,2.906382,1.0290638,1.3304344,-1.630199,-78.930534,-188.27322,0.45628884,-0.2339343,19.281055,1210000
|
| 84 |
+
1.0,1.0,0.02821558,2.821558,1.0282155,1.7465264,-5.3495994,-74.536354,-157.08803,0.7749874,-0.78746825,19.406725,1215000
|
| 85 |
+
1.0,1.0,0.031386077,3.138608,1.0313861,1.320227,1.5465013,-75.31381,-173.94577,0.12612827,-0.28249577,13.31835,1220000
|
| 86 |
+
1.0,1.0,0.028708294,2.8708296,1.0287083,1.6065212,-4.5836215,-72.45255,-197.12827,0.5800811,-0.34553543,23.466255,1225000
|
| 87 |
+
1.0,1.0000001,0.029934548,2.993455,1.0299346,1.6642891,-2.5047626,-70.16891,-156.56259,0.3276697,-0.32197854,20.784538,1230000
|
| 88 |
+
1.0,1.0,0.033349648,3.334965,1.0333496,1.222254,-6.6965213,-76.935326,-196.06874,0.14251712,-0.13907796,13.686083,1235000
|
| 89 |
+
1.0,0.9999999,0.03026352,3.026352,1.0302634,0.9269018,4.340566,-70.311745,-180.38322,0.3826728,-0.1935906,13.252422,1240000
|
| 90 |
+
1.0,1.0,0.03074823,3.074823,1.0307482,1.0598925,-2.8623817,-75.03533,-162.90001,0.45341796,-0.4570985,12.965721,1245000
|
| 91 |
+
1.0,1.0,0.028995546,2.8995547,1.0289955,0.8979678,-2.4398894,-73.82891,-178.77165,0.25564182,-0.14450528,13.346901,1250000
|
| 92 |
+
1.0,0.9999999,0.029063072,2.9063072,1.029063,0.87690157,-2.3838649,-74.12319,-155.9497,0.17950605,-0.16691108,11.488896,1255000
|
| 93 |
+
1.0,1.0,0.029767655,2.9767656,1.0297676,1.6096207,-3.153565,-70.48086,-144.95871,0.5189822,-0.79094136,23.26599,1260000
|
| 94 |
+
1.0,1.0,0.03140136,3.140136,1.0314014,1.0392185,-2.3279724,-70.23532,-153.92537,0.13538271,-0.1542456,12.497112,1265000
|
| 95 |
+
1.0,1.0,0.03153889,3.1538892,1.0315388,0.99915355,0.043501794,-71.25774,-166.37413,0.6275582,-0.6981232,18.812523,1270000
|
| 96 |
+
1.0,0.9999999,0.02799375,2.799375,1.0279937,1.3436955,-0.88075817,-70.6794,-166.75859,0.19288035,-0.13468301,13.970972,1275000
|
| 97 |
+
1.0,1.0,0.030890591,3.0890594,1.0308906,16.47075,0.9823109,-70.11011,-152.18504,1.9891517,-1.5257243,101.17121,1280000
|
| 98 |
+
1.0,0.9999999,0.029944956,2.9944956,1.0299449,2.2475736,0.07484229,-70.267,-195.94066,0.2640414,-0.27297005,20.908789,1285000
|
| 99 |
+
1.0,1.0,0.03083427,3.0834272,1.0308343,1.2790583,-0.50386167,-71.30391,-162.85318,0.32527977,-0.8129202,21.440079,1290000
|
| 100 |
+
1.0,0.99999994,0.030233573,3.0233574,1.0302335,1.2709656,-1.8874278,-68.87472,-173.6553,0.5272106,-0.3058184,21.133642,1295000
|
| 101 |
+
1.0,1.0,0.029598529,2.9598527,1.0295985,0.8845865,-1.6508212,-67.65377,-170.14865,0.18037783,-0.12003369,9.05088,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,0.9999999,0.02410361,2.4103608,1.0241035,1.9091374,-23.43616,-105.48879,-183.12996,0.3193689,-0.26776817,14.730891,805000
|
| 3 |
+
1.0,1.0,0.02380301,2.380301,1.023803,0.63779444,-19.59643,-103.25744,-178.30934,0.17955501,-0.20740387,9.6517935,810000
|
| 4 |
+
1.0,1.0,0.021237172,2.1237173,1.0212371,0.6028103,-29.289673,-107.38372,-177.52257,0.067119695,-0.10765349,6.445495,815000
|
| 5 |
+
1.0,1.0,0.021798328,2.1798327,1.0217984,1.0461649,-19.682823,-108.66001,-191.23906,0.12859859,-0.17938888,10.883982,820000
|
| 6 |
+
1.0,1.0,0.021467896,2.1467896,1.0214679,1.0746031,-45.20725,-108.43286,-187.32812,0.17011768,-0.20696712,12.279442,825000
|
| 7 |
+
1.0,1.0000001,0.021989597,2.19896,1.0219897,1.2194186,-28.921995,-107.67217,-194.63306,0.3559876,-0.34644085,18.425617,830000
|
| 8 |
+
1.0,1.0,0.023784399,2.3784401,1.0237844,1.0930882,-3.1446528,-105.84029,-183.90959,0.5489834,-0.70402634,21.732082,835000
|
| 9 |
+
1.0,1.0,0.022845447,2.2845447,1.0228455,1.1617107,-20.739492,-105.533035,-195.2949,0.2514022,-0.27630228,15.18858,840000
|
| 10 |
+
1.0,1.0,0.02214571,2.2145712,1.0221457,1.0246687,-12.891713,-104.629654,-204.23555,0.29006028,-0.1701543,14.682644,845000
|
| 11 |
+
1.0,1.0,0.026822837,2.6822839,1.0268228,1.5776218,-27.90459,-103.158936,-177.78853,0.43840292,-0.36219645,25.57153,850000
|
| 12 |
+
1.0,1.0,0.02487234,2.4872344,1.0248723,1.8112202,-6.64865,-100.07806,-186.64462,0.30563253,-0.380165,22.543392,855000
|
| 13 |
+
1.0,1.0,0.025530342,2.5530343,1.0255303,1.8197628,-11.423798,-98.85901,-197.05936,0.42484275,-0.38403285,21.27657,860000
|
| 14 |
+
1.0,0.99999994,0.025199259,2.519926,1.0251992,1.3544217,-14.683274,-96.66158,-196.8271,0.5492832,-0.43808,24.157415,865000
|
| 15 |
+
1.0,1.0,0.025838764,2.5838766,1.0258387,1.0243921,-9.718414,-94.69698,-203.35918,0.1120887,-0.16515662,10.502487,870000
|
| 16 |
+
1.0,0.9999999,0.026386408,2.6386406,1.0263863,1.8566955,-5.803877,-98.53196,-202.72218,0.288699,-0.30139923,17.357609,875000
|
| 17 |
+
1.0,0.9999999,0.026414484,2.6414485,1.0264144,1.3589294,-5.9641685,-99.2282,-198.88034,0.32935855,-0.3784812,15.693888,880000
|
| 18 |
+
1.0,1.0,0.02575148,2.575148,1.0257515,1.794418,-16.33981,-98.48187,-196.0891,0.2273706,-0.28211713,19.674442,885000
|
| 19 |
+
1.0,1.0,0.026709914,2.6709914,1.0267099,1.3998841,-17.18051,-97.0176,-198.82697,0.23145735,-0.21120808,15.720755,890000
|
| 20 |
+
1.0,0.9999888,0.02622561,2.622561,1.0262144,1.2723486,2.7037196,-97.409485,-198.91637,0.30216652,-0.1645944,16.31403,895000
|
| 21 |
+
1.0,1.0000001,0.026585024,2.6585026,1.0265851,1.2911261,-6.8098044,-91.00967,-174.95529,0.2362828,-0.18194292,15.0081215,900000
|
| 22 |
+
1.0,1.0,0.026594447,2.6594448,1.0265944,1.1429278,-4.050094,-95.38822,-202.42056,0.1419669,-0.1704781,13.195405,905000
|
| 23 |
+
1.0,1.0,0.026483906,2.6483908,1.0264839,0.97905505,1.2121545,-94.06665,-184.30733,0.10747885,-0.19091994,11.711199,910000
|
| 24 |
+
1.0,0.9999942,0.02572804,2.572804,1.0257223,1.1595924,1.5111568,-92.30213,-187.41649,0.12882903,-0.29800177,13.06944,915000
|
| 25 |
+
1.0,0.9999999,0.02692746,2.6927462,1.0269274,1.2043654,-4.751182,-90.24686,-162.6774,0.28412586,-0.26157898,15.384199,920000
|
| 26 |
+
1.0,1.0,0.0268546,2.68546,1.0268546,1.0888764,-1.7485965,-90.94399,-193.85298,0.24317265,-0.1228862,13.895265,925000
|
| 27 |
+
1.0,1.0,0.02812236,2.812236,1.0281223,4.518034,-13.943093,-93.157814,-186.87042,1.9493235,-1.6208564,51.138176,930000
|
| 28 |
+
1.0,0.99994934,0.026854776,2.6854777,1.0268041,1.4749054,2.3279257,-91.032906,-200.07137,0.6845144,-0.4231808,19.631756,935000
|
| 29 |
+
1.0,1.0,0.028163737,2.8163738,1.0281638,1.838271,1.5905452,-90.0653,-187.4637,0.22870138,-0.3578775,23.080559,940000
|
| 30 |
+
1.0,1.0,0.027880792,2.7880793,1.0278808,1.2045025,1.9804647,-89.935265,-198.53224,0.38935673,-0.1583278,15.457857,945000
|
| 31 |
+
1.0,1.0,0.0278222,2.7822201,1.0278223,1.5444173,-7.8328266,-91.02927,-201.11586,1.0994151,-1.0327189,25.87619,950000
|
| 32 |
+
1.0,0.99999994,0.025508858,2.5508862,1.0255088,3.6661155,-9.278952,-89.51774,-171.5341,0.8341637,-0.55734116,39.27726,955000
|
| 33 |
+
1.0,1.0,0.027337873,2.7337875,1.0273379,1.3344606,-5.0243726,-92.6448,-201.80017,0.26704118,-0.30315393,16.471146,960000
|
| 34 |
+
1.0,1.0,0.025625892,2.5625892,1.025626,1.4673868,-0.57178795,-87.42965,-179.18938,0.17463446,-0.17264393,15.3209305,965000
|
| 35 |
+
1.0,0.99999994,0.028759431,2.8759432,1.0287594,1.3849434,-4.4453197,-89.08459,-200.34576,0.19579662,-0.29231024,21.097317,970000
|
| 36 |
+
1.0,1.0,0.027680473,2.7680473,1.0276805,0.94592,-5.615648,-92.13196,-196.51187,0.17338726,-0.12570286,11.878268,975000
|
| 37 |
+
1.0,0.9999543,0.026159452,2.6159453,1.0261137,3.8358307,1.3802553,-88.78031,-199.75237,4.244095,-4.2476616,100.88022,980000
|
| 38 |
+
1.0,0.99999994,0.029272322,2.9272323,1.0292723,0.98873484,0.29833764,-87.59891,-191.22249,0.17490108,-0.50172913,14.716304,985000
|
| 39 |
+
1.0,1.0,0.027006544,2.7006545,1.0270065,1.478874,-5.2570996,-88.1299,-202.8943,0.19663839,-0.42494738,23.0531,990000
|
| 40 |
+
1.0,1.0,0.027398303,2.73983,1.0273983,1.3263129,-7.3087096,-88.00531,-202.00954,0.20980613,-0.106129535,12.981856,995000
|
| 41 |
+
1.0,0.9999999,0.02758297,2.758297,1.0275829,1.156066,2.0123827,-85.99822,-202.29607,0.20731233,-0.27509582,15.95223,1000000
|
| 42 |
+
1.0,0.99999994,0.02840494,2.8404942,1.0284048,1.1819504,-2.949977,-85.01765,-197.52666,0.28943932,-0.21426341,15.668646,1005000
|
| 43 |
+
1.0,1.0,0.029072225,2.9072225,1.0290723,1.2035801,-5.5902543,-87.78769,-169.65141,0.25580984,-0.12875043,14.730901,1010000
|
| 44 |
+
1.0,1.0,0.03051268,3.051268,1.0305127,1.5635412,-6.253939,-87.56074,-191.10498,0.24542692,-0.17928849,16.90411,1015000
|
| 45 |
+
1.0,1.0,0.027650677,2.7650676,1.0276507,1.1588738,-3.5886083,-84.179634,-194.71281,0.291935,-0.39546272,19.399126,1020000
|
| 46 |
+
1.0,0.9999999,0.029216282,2.921628,1.0292162,0.9481535,-2.66734,-81.281334,-162.45715,0.14313228,-0.17854276,11.602129,1025000
|
| 47 |
+
1.0,0.99999994,0.03013879,3.013879,1.0301387,1.1779976,0.12067218,-86.52738,-169.82628,0.14696845,-0.17708358,12.521473,1030000
|
| 48 |
+
1.0,1.0,0.028147578,2.8147578,1.0281476,1.874497,-3.753836,-81.959015,-174.15164,1.1648431,-1.0007125,36.18038,1035000
|
| 49 |
+
1.0,1.0,0.028468922,2.8468924,1.028469,1.2965643,1.53752,-85.57175,-188.52634,0.23975125,-0.18645357,16.854118,1040000
|
| 50 |
+
1.0,1.0,0.031447463,3.1447463,1.0314474,1.2081183,-1.688546,-85.07387,-177.73816,0.20183364,-0.24944961,15.6082,1045000
|
| 51 |
+
1.0,1.0,0.026308257,2.6308255,1.0263083,1.7783566,-2.1014814,-79.8583,-190.85182,0.7923367,-0.7265445,28.220688,1050000
|
| 52 |
+
1.0,1.0,0.028486082,2.8486083,1.0284861,1.1333393,-0.15658858,-86.24452,-190.41249,0.14912944,-0.3790294,16.48212,1055000
|
| 53 |
+
1.0,1.0,0.02872777,2.872777,1.0287278,1.2299031,0.92720354,-80.925224,-191.72128,0.37867957,-0.2589805,15.436908,1060000
|
| 54 |
+
1.0,1.0,0.02957786,2.957786,1.0295779,1.08959,-4.9060955,-84.02163,-201.15358,0.26207647,-0.13344666,12.699772,1065000
|
| 55 |
+
1.0,1.0,0.028453149,2.845315,1.0284531,1.0091734,-2.4246533,-81.91949,-164.98116,0.1869911,-0.22520712,11.340364,1070000
|
| 56 |
+
1.0,1.0,0.026629947,2.6629946,1.0266299,1.3216813,-2.9514027,-83.30842,-203.57175,0.24107005,-0.33764654,17.410635,1075000
|
| 57 |
+
1.0,1.0,0.028455796,2.8455796,1.0284559,1.2046213,-8.961839,-83.774414,-190.82774,0.12978865,-0.3406704,13.700312,1080000
|
| 58 |
+
1.0,1.0,0.028488662,2.848866,1.0284886,1.2936741,-1.1913927,-79.097374,-158.88066,0.18888363,-0.2508616,14.776207,1085000
|
| 59 |
+
1.0,1.0,0.02846583,2.8465831,1.0284659,1.3511019,-1.1688342,-78.458145,-191.40349,0.38997006,-0.3957321,17.081982,1090000
|
| 60 |
+
1.0,0.99999994,0.028188035,2.8188038,1.028188,1.1219037,0.89476395,-77.98512,-177.16919,0.16934058,-0.23914768,14.945656,1095000
|
| 61 |
+
1.0,1.0,0.02676082,2.6760821,1.0267608,0.9075324,-4.5654683,-82.61029,-172.79932,0.10339762,-0.13725029,9.866718,1100000
|
| 62 |
+
1.0,1.0000001,0.030250352,3.0250351,1.0302504,2.6628182,-2.9716854,-83.00551,-177.32939,0.596265,-0.7174866,26.92434,1105000
|
| 63 |
+
1.0,1.0,0.03213961,3.2139611,1.0321397,1.1516432,-3.5491974,-79.270325,-191.36688,0.8391836,-0.8282829,18.952702,1110000
|
| 64 |
+
1.0,0.9999998,0.02807482,2.8074822,1.0280746,1.1628659,-4.4387555,-79.92703,-163.53581,0.16011095,-0.2888382,16.356178,1115000
|
| 65 |
+
1.0,1.0,0.028499074,2.8499076,1.0284991,1.3380702,-1.7178695,-80.566505,-183.29852,0.30179745,-0.22225456,16.128666,1120000
|
| 66 |
+
1.0,0.9999999,0.030178145,3.0178146,1.0301781,0.89896435,-1.9377646,-78.30114,-167.58029,0.15899986,-0.18136847,11.935469,1125000
|
| 67 |
+
1.0,1.0,0.02781725,2.781725,1.0278172,1.29538,2.6289089,-74.859764,-182.39056,0.22651467,-0.24372941,16.315674,1130000
|
| 68 |
+
1.0,1.0,0.030926492,3.0926492,1.0309265,1.716401,-0.23301135,-76.810875,-200.80482,0.39863804,-0.33516392,24.925766,1135000
|
| 69 |
+
1.0,0.9999999,0.030366203,3.0366206,1.0303661,1.2152563,-2.468185,-78.17031,-170.4856,0.31099916,-0.29580683,15.880432,1140000
|
| 70 |
+
1.0,0.9999999,0.030128393,3.0128396,1.0301282,0.8468012,-2.0958297,-82.2239,-184.58897,0.14410515,-0.21615106,11.852083,1145000
|
| 71 |
+
1.0,0.99999994,0.027594794,2.7594795,1.0275947,1.680952,0.35136867,-74.69525,-183.61014,0.6418698,-0.72181183,26.003872,1150000
|
| 72 |
+
1.0,1.0,0.03006816,3.006816,1.0300682,0.924746,-0.25669122,-80.83091,-174.65176,0.34838358,-0.15688168,12.000358,1155000
|
| 73 |
+
1.0,1.0,0.028254047,2.8254046,1.028254,1.466363,1.1734523,-74.56835,-195.79265,0.24552226,-0.2584075,19.539204,1160000
|
| 74 |
+
1.0,1.0,0.02859028,2.8590283,1.0285903,1.0310937,-0.20960355,-78.48393,-182.68034,0.25074357,-0.14760591,13.582213,1165000
|
| 75 |
+
1.0,1.0,0.029276432,2.9276433,1.0292765,1.0159237,-5.6357927,-77.24181,-177.89029,0.14679231,-0.5055061,14.373636,1170000
|
| 76 |
+
1.0,1.0,0.028866805,2.8866806,1.0288668,1.2225064,0.6839527,-74.79818,-198.15187,0.29366404,-0.31396753,17.150095,1175000
|
| 77 |
+
1.0,1.0,0.02713696,2.7136958,1.0271369,1.6237978,-1.2452569,-77.52636,-178.07689,0.37828296,-0.37598723,16.76959,1180000
|
| 78 |
+
1.0,1.0,0.028936177,2.8936179,1.0289361,0.7920421,1.2362982,-76.67555,-181.70906,0.110951714,-0.20024571,10.141432,1185000
|
| 79 |
+
1.0,1.0,0.03239873,3.2398734,1.0323987,0.9608206,-3.8412406,-80.61489,-177.72766,0.23019694,-0.39168304,16.526571,1190000
|
| 80 |
+
1.0,1.0,0.030598074,3.0598075,1.030598,1.202679,-4.773767,-78.36965,-161.75505,0.24627611,-0.37814817,17.769703,1195000
|
| 81 |
+
1.0,1.0000001,0.028449062,2.8449063,1.0284492,1.0357367,-1.0556793,-75.887566,-185.10309,0.24589923,-0.21604285,14.169531,1200000
|
| 82 |
+
1.0,1.0,0.030330122,3.0330124,1.0303302,0.9415167,-0.4582742,-77.47803,-173.94662,0.29593295,-0.26257968,13.230233,1205000
|
| 83 |
+
1.0,1.0,0.02906382,2.906382,1.0290638,1.3304344,-1.630199,-78.930534,-188.27322,0.45628884,-0.2339343,19.281055,1210000
|
| 84 |
+
1.0,1.0,0.02821558,2.821558,1.0282155,1.7465264,-5.3495994,-74.536354,-157.08803,0.7749874,-0.78746825,19.406725,1215000
|
| 85 |
+
1.0,1.0,0.031386077,3.138608,1.0313861,1.320227,1.5465013,-75.31381,-173.94577,0.12612827,-0.28249577,13.31835,1220000
|
| 86 |
+
1.0,1.0,0.028708294,2.8708296,1.0287083,1.6065212,-4.5836215,-72.45255,-197.12827,0.5800811,-0.34553543,23.466255,1225000
|
| 87 |
+
1.0,1.0000001,0.029934548,2.993455,1.0299346,1.6642891,-2.5047626,-70.16891,-156.56259,0.3276697,-0.32197854,20.784538,1230000
|
| 88 |
+
1.0,1.0,0.033349648,3.334965,1.0333496,1.222254,-6.6965213,-76.935326,-196.06874,0.14251712,-0.13907796,13.686083,1235000
|
| 89 |
+
1.0,0.9999999,0.03026352,3.026352,1.0302634,0.9269018,4.340566,-70.311745,-180.38322,0.3826728,-0.1935906,13.252422,1240000
|
| 90 |
+
1.0,1.0,0.03074823,3.074823,1.0307482,1.0598925,-2.8623817,-75.03533,-162.90001,0.45341796,-0.4570985,12.965721,1245000
|
| 91 |
+
1.0,1.0,0.028995546,2.8995547,1.0289955,0.8979678,-2.4398894,-73.82891,-178.77165,0.25564182,-0.14450528,13.346901,1250000
|
| 92 |
+
1.0,0.9999999,0.029063072,2.9063072,1.029063,0.87690157,-2.3838649,-74.12319,-155.9497,0.17950605,-0.16691108,11.488896,1255000
|
| 93 |
+
1.0,1.0,0.029767655,2.9767656,1.0297676,1.6096207,-3.153565,-70.48086,-144.95871,0.5189822,-0.79094136,23.26599,1260000
|
| 94 |
+
1.0,1.0,0.03140136,3.140136,1.0314014,1.0392185,-2.3279724,-70.23532,-153.92537,0.13538271,-0.1542456,12.497112,1265000
|
| 95 |
+
1.0,1.0,0.03153889,3.1538892,1.0315388,0.99915355,0.043501794,-71.25774,-166.37413,0.6275582,-0.6981232,18.812523,1270000
|
| 96 |
+
1.0,0.9999999,0.02799375,2.799375,1.0279937,1.3436955,-0.88075817,-70.6794,-166.75859,0.19288035,-0.13468301,13.970972,1275000
|
| 97 |
+
1.0,1.0,0.030890591,3.0890594,1.0308906,16.47075,0.9823109,-70.11011,-152.18504,1.9891517,-1.5257243,101.17121,1280000
|
| 98 |
+
1.0,0.9999999,0.029944956,2.9944956,1.0299449,2.2475736,0.07484229,-70.267,-195.94066,0.2640414,-0.27297005,20.908789,1285000
|
| 99 |
+
1.0,1.0,0.03083427,3.0834272,1.0308343,1.2790583,-0.50386167,-71.30391,-162.85318,0.32527977,-0.8129202,21.440079,1290000
|
| 100 |
+
1.0,0.99999994,0.030233573,3.0233574,1.0302335,1.2709656,-1.8874278,-68.87472,-173.6553,0.5272106,-0.3058184,21.133642,1295000
|
| 101 |
+
1.0,1.0,0.029598529,2.9598527,1.0295985,0.8845865,-1.6508212,-67.65377,-170.14865,0.18037783,-0.12003369,9.05088,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:052cb44194eabf1bce806bee8609620a90b75eee0cbbf8339d1ed1e2a9506f56
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba97070910d40095f6c6ba86275955ec8bb7e735b3f2a9d1c82e4d0b1eacfd4d
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d53e5898aa9e6d75a24c8ba98ea964d35f84d1452bfeeee205d6f3b4b2172ac6
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e04bc57ddc455c5b6f1847fa366c0f60958bf8ccc03dda88a8eea2d012ca2775
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d401be0e0137a65cf2e7d0c75e60741380bf01e36b6ed6dec494e26bd030a979
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d0b8a7c77f99639ce4ceb31e8a2e37cca421badd2a11e49dd0d85967a5fedbfc
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_1300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:effe80dd851f39fda2b4c2307c3156e3f2fa352e2005ea77a1a5ce2ffc6ded04
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd1d3bcf87b0586b7b9c21feace91f5b6e401a0c99e946a6106193cf8fa01324
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:38d84798d677f024225ac3c5f1c18b270bc8adc455472c77c2fe67a20c1dd6ba
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:489b91f28e8da1251d6f0ae8515c9319f2201aa9ecfc7d881470128c07a6ecdd
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_183856/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/xcal32xu
|