Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/env.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.05712552604435312,0.0015704520905593575,-0.057138486090771656,0.0008089946214056917,28.215217202193443,48.23500000001452,0.06,24693.02,-0.96,-976.1,962.7,2.9817286205291746,650000
|
| 3 |
+
0.0,0.0,-0.05863619700061523,-0.0025006610676322305,-0.05871199042069875,-0.0015901827331341206,19.065921458226434,50.10000000001527,0.0,75635.0,-1.02,-1019.56,1000.0,3.0746968460083006,700000
|
| 4 |
+
0.0,0.0,-0.06987029751946698,0.001545646425902135,-0.0697254938365458,0.002955438800513621,6.095805723753126,50.10000000001527,0.0,127635.0,-1.02,-1019.54,1000.0,2.9496012496948243,750000
|
| 5 |
+
0.0,0.0,-0.04572518316659198,-0.002870355957222373,-0.045897444178700765,-0.0029638727224520984,11.225588277794193,50.10000000001527,0.0,179635.0,-1.0,-1000.0,1000.0,3.01509672164917,800000
|
| 6 |
+
0.0,0.0,-0.039923241164484834,0.00027932536425071696,-0.039916876160841615,6.940351690062607e-05,13.269760303169694,50.10000000001527,0.0,231635.0,-1.0,-1000.0,1000.0,3.027917199134827,850000
|
| 7 |
+
0.0,0.0,-0.04569142901956919,1.3866437109373371e-05,-0.045688577956766806,-0.00014369431661239912,18.17619031927948,50.10000000001527,0.0,283635.0,-1.04,-1015.46,1000.0,3.098211817741394,900000
|
| 8 |
+
0.0,0.0,-0.03585208166998389,-0.001968288062684646,-0.03594963809382633,-0.0016284100185153963,13.077191707467163,49.67300000001487,0.02,335404.42,-0.98,-991.44,991.46,3.008499851226807,950000
|
| 9 |
+
0.0,0.0,-0.04953088314073273,0.00027719758089047425,-0.04950684798449512,0.0003629821922244814,13.900090275291552,50.10000000001527,0.0,387208.0,-1.04,-1025.8,1000.0,3.0469428491592407,1000000
|
| 10 |
+
0.0,0.0,-0.042480020458023106,-0.0003683363891727848,-0.04249170164603074,-0.00014621267604678743,9.030377721244957,50.10000000001527,0.0,439208.0,-1.02,-1018.28,1000.0,2.9817713689804077,1050000
|
| 11 |
+
0.0,0.0,-0.052533800394744916,-0.0005942520426830409,-0.05256890692719791,-0.0006795108610470496,15.92815608365772,49.298000000014966,0.02,491047.6,-1.0,-987.48,983.96,3.0134100914001465,1100000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.05712552604435312,0.0015704520905593575,-0.057138486090771656,0.0008089946214056917,28.215217202193443,48.23500000001452,0.06,24693.02,-0.96,-976.1,962.7,2.9817286205291746,650000
|
| 3 |
+
0.0,0.0,-0.05863619700061523,-0.0025006610676322305,-0.05871199042069875,-0.0015901827331341206,19.065921458226434,50.10000000001527,0.0,75635.0,-1.02,-1019.56,1000.0,3.0746968460083006,700000
|
| 4 |
+
0.0,0.0,-0.06987029751946698,0.001545646425902135,-0.0697254938365458,0.002955438800513621,6.095805723753126,50.10000000001527,0.0,127635.0,-1.02,-1019.54,1000.0,2.9496012496948243,750000
|
| 5 |
+
0.0,0.0,-0.04572518316659198,-0.002870355957222373,-0.045897444178700765,-0.0029638727224520984,11.225588277794193,50.10000000001527,0.0,179635.0,-1.0,-1000.0,1000.0,3.01509672164917,800000
|
| 6 |
+
0.0,0.0,-0.039923241164484834,0.00027932536425071696,-0.039916876160841615,6.940351690062607e-05,13.269760303169694,50.10000000001527,0.0,231635.0,-1.0,-1000.0,1000.0,3.027917199134827,850000
|
| 7 |
+
0.0,0.0,-0.04569142901956919,1.3866437109373371e-05,-0.045688577956766806,-0.00014369431661239912,18.17619031927948,50.10000000001527,0.0,283635.0,-1.04,-1015.46,1000.0,3.098211817741394,900000
|
| 8 |
+
0.0,0.0,-0.03585208166998389,-0.001968288062684646,-0.03594963809382633,-0.0016284100185153963,13.077191707467163,49.67300000001487,0.02,335404.42,-0.98,-991.44,991.46,3.008499851226807,950000
|
| 9 |
+
0.0,0.0,-0.04953088314073273,0.00027719758089047425,-0.04950684798449512,0.0003629821922244814,13.900090275291552,50.10000000001527,0.0,387208.0,-1.04,-1025.8,1000.0,3.0469428491592407,1000000
|
| 10 |
+
0.0,0.0,-0.042480020458023106,-0.0003683363891727848,-0.04249170164603074,-0.00014621267604678743,9.030377721244957,50.10000000001527,0.0,439208.0,-1.02,-1018.28,1000.0,2.9817713689804077,1050000
|
| 11 |
+
0.0,0.0,-0.052533800394744916,-0.0005942520426830409,-0.05256890692719791,-0.0006795108610470496,15.92815608365772,49.298000000014966,0.02,491047.6,-1.0,-987.48,983.96,3.0134100914001465,1100000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.6504997,284.54138,0.004085998,-0.006619001,-14.119923,0.18388626,-284.4837,284.71866,3.3807702,28.504883,-90.47297,-285.5665,-302.4439,31.885653,10.357768,-9.98289,357.6926,605000
|
| 3 |
+
0.6478016,282.0464,0.0041553117,0.0011283954,-12.228445,0.1998589,-281.99554,282.24738,1.6476917,4.8711123,-150.77429,-283.01205,-302.34824,6.518804,0.42126134,-0.4458101,74.35222,610000
|
| 4 |
+
0.6428064,278.70673,0.003999462,-0.0025444117,-13.1361885,0.1751615,-278.65417,278.87936,1.5612558,5.9666696,-105.690865,-279.7839,-302.40845,7.5279255,1.1755121,-0.9647153,79.861786,615000
|
| 5 |
+
0.65051603,284.6095,0.00403049,-0.0007004203,-12.67378,0.18762535,-284.55844,284.79642,1.4117234,5.2962317,-170.39906,-285.60486,-302.07907,6.7079554,7.2454515,-8.526174,113.6392,620000
|
| 6 |
+
0.65095305,281.02594,0.004117626,-0.0033451552,-13.312399,0.18457477,-280.97113,281.20715,1.9785382,4.303195,-107.55443,-282.2463,-302.52435,6.281733,0.54824436,-0.39599818,64.1126,625000
|
| 7 |
+
0.6672955,281.88956,0.004308097,0.002936804,-11.818306,0.16768706,-281.83862,282.06018,1.7201141,3.3921661,1.635172,-282.88974,-302.20084,5.1122804,0.5732792,-0.49829602,60.24721,630000
|
| 8 |
+
0.6563405,285.43433,0.0044907224,0.0013745882,-12.193905,0.16701141,-285.37958,285.60272,1.2410973,6.4775863,-106.57421,-286.42197,-302.7244,7.7186837,0.51974833,-0.45442742,74.35426,635000
|
| 9 |
+
0.66647935,281.2837,0.0042677447,0.0053611523,-11.243797,0.17635617,-281.23572,281.46542,1.8867676,2.9301317,-100.42018,-282.05408,-302.1565,4.8168993,0.47594327,-0.4701286,54.659355,640000
|
| 10 |
+
0.65959454,282.0415,0.004293465,0.0077485754,-10.695263,0.18814553,-281.99557,282.2374,1.6822592,4.3437076,-100.66572,-282.64505,-302.84976,6.0259666,1.1514333,-0.97716403,75.38043,645000
|
| 11 |
+
0.6689639,280.47922,0.0039736377,0.005617475,-11.086314,0.20154971,-280.43518,280.68637,1.5160433,6.0953474,-101.79381,-281.1651,-302.23923,7.6113906,2.2220263,-1.7671739,116.399475,650000
|
| 12 |
+
0.6572093,280.24698,0.004085283,0.0025522965,-11.875246,0.21364272,-280.1985,280.4632,1.4064198,3.6725278,-95.70005,-281.22263,-302.1655,5.0789475,0.39335644,-0.36552173,54.769554,655000
|
| 13 |
+
0.6657053,280.43997,0.0040647928,0.003560799,-11.62399,0.21182105,-280.3927,280.65536,1.545876,4.971494,-101.13999,-281.2424,-302.2554,6.51737,0.9346866,-1.0780209,70.63568,660000
|
| 14 |
+
0.6591513,281.7384,0.0039912565,0.004345073,-11.411352,0.20291078,-281.69287,281.94565,1.2389992,3.0742466,-100.09523,-282.65137,-302.4358,4.313246,0.62534416,-0.61118966,63.528027,665000
|
| 15 |
+
0.65842336,274.20706,0.004229038,0.0036845137,-11.628758,0.19117351,-274.1579,274.40192,1.1736748,4.314482,-98.26389,-275.28586,-302.11145,5.4881573,0.6001086,-0.34835243,64.18293,670000
|
| 16 |
+
0.6333573,273.40933,0.004018726,-0.014900785,-16.207838,0.19432135,-273.3442,273.58878,3.2481675,6.4277163,-36.504097,-274.8353,-302.07788,9.675884,2.0589952,-2.1460817,125.88228,675000
|
| 17 |
+
0.64016646,275.03864,0.004235787,-0.013594109,-15.709347,0.18526626,-274.9721,275.21033,1.3921396,4.1134486,-101.48277,-276.3065,-302.10587,5.505588,0.4094207,-0.36997956,58.90889,680000
|
| 18 |
+
0.65633583,276.80267,0.0041421023,-0.00014315585,-12.534561,0.185472,-276.75073,276.988,1.932114,5.8326573,-69.66645,-277.55573,-302.93954,7.7647715,2.1212542,-2.6440485,123.62842,685000
|
| 19 |
+
0.6460991,278.14743,0.0040827747,-0.0017143452,-12.919897,0.17955594,-278.09467,278.3253,1.3917009,3.627028,-99.606125,-278.97775,-302.10345,5.0187287,0.5414173,-0.4970579,51.83245,690000
|
| 20 |
+
0.6518273,278.3634,0.004073792,-0.0006380841,-12.656631,0.21752767,-278.31186,278.5803,1.3495818,3.6974697,-100.43741,-279.07812,-302.2596,5.0470514,0.5975506,-0.59598887,60.641315,695000
|
| 21 |
+
0.6426185,274.3374,0.0041777957,-0.011646687,-15.287759,0.21071759,-274.27353,274.53647,1.5470618,5.1642427,-99.64983,-275.7501,-301.9394,6.7113047,0.9408855,-0.98743033,80.95,700000
|
| 22 |
+
0.6646004,278.33905,0.0042292015,0.00130375,-12.191727,0.19021134,-278.28748,278.53058,1.2506421,3.2056794,-100.340744,-279.20273,-302.38498,4.4563217,0.54955494,-0.45509213,55.71193,705000
|
| 23 |
+
0.6563952,278.41217,0.00397848,-0.0050121234,-13.759809,0.18463866,-278.35742,278.5918,1.7949384,3.8294868,-96.6458,-279.26117,-302.24255,5.6244254,0.436922,-0.6102747,69.45284,710000
|
| 24 |
+
0.6432556,274.26245,0.0039531756,-0.009997808,-15.0290575,0.18166175,-274.20306,274.4341,1.1201746,4.0488467,-100.46453,-275.58627,-302.2386,5.1690216,0.8554217,-0.78579766,57.415466,715000
|
| 25 |
+
0.6629102,271.6477,0.0043629864,0.011909936,-9.770233,0.18386328,-271.6051,271.84348,1.2721682,3.2004807,-100.518936,-272.09937,-302.2771,4.4726486,0.4227449,-0.5670564,64.25774,720000
|
| 26 |
+
0.67181593,278.6777,0.00396659,0.010518604,-9.8482,0.15314496,-278.63864,278.84137,1.5694951,5.0820017,-100.72572,-279.76205,-302.3493,6.651497,1.1189889,-0.83936894,70.42675,725000
|
| 27 |
+
0.66567016,276.03925,0.003949973,0.002528952,-11.859755,0.21087712,-275.99243,276.25266,1.2611805,3.2480752,-100.8085,-277.00754,-302.20322,4.509256,0.60976607,-0.5477825,52.63303,730000
|
| 28 |
+
0.6554237,277.1397,0.0037298677,0.0014420612,-12.113375,0.17121547,-277.09454,277.31235,1.3417376,4.2222295,-97.66419,-277.69467,-302.37436,5.563967,0.7630162,-0.7661927,70.9166,735000
|
| 29 |
+
0.65816236,273.05164,0.0039736964,0.0007909148,-12.300962,0.15830058,-273.00278,273.21072,1.0523132,2.92368,-100.41741,-273.71085,-302.07947,3.9759932,0.2418563,-0.33570126,41.563328,740000
|
| 30 |
+
0.65038824,269.95764,0.0040777046,0.005911154,-11.050372,0.1617017,-269.91254,270.12527,1.5199156,6.1452117,-100.90999,-270.91153,-302.12967,7.6651273,0.907551,-0.6612625,72.58172,745000
|
| 31 |
+
0.6583076,276.97766,0.0038434432,0.0060604415,-10.923174,0.16184947,-276.93567,277.14557,1.1972314,2.7274868,-100.85541,-277.5212,-302.00195,3.9247184,0.30106747,-0.31178424,47.47381,750000
|
| 32 |
+
0.66255355,274.28235,0.003938374,0.0006676046,-12.330487,0.17374106,-274.23376,274.45676,1.39605,3.6623726,-100.0489,-275.38913,-301.96262,5.0584226,0.4549357,-0.4355612,63.335648,755000
|
| 33 |
+
0.65908486,269.36945,0.003732257,0.005999233,-10.892599,0.21081056,-269.3288,269.58627,1.3376502,4.295505,-100.49804,-270.31723,-302.3182,5.6331553,0.43589658,-0.32912967,63.18409,760000
|
| 34 |
+
0.654271,270.6336,0.0038690357,0.00040097794,-12.396362,0.1748643,-270.58563,270.80887,1.4215109,3.1396298,-65.47958,-271.91568,-302.22836,4.561141,0.85873544,-0.3902073,63.998184,765000
|
| 35 |
+
0.6535411,270.37848,0.0037162814,0.0012282297,-12.1695,0.19127241,-270.33325,270.57098,9.628949,10.581454,-97.89274,-271.30173,-302.0192,20.210403,3.7526968,-4.461035,181.94443,770000
|
| 36 |
+
0.65444213,270.98657,0.0038277912,-0.0009124413,-12.738373,0.18418024,-270.93784,271.16983,1.7234051,10.418031,-66.42629,-272.03937,-302.20514,12.141436,1.9032061,-2.2997203,120.38511,775000
|
| 37 |
+
0.644589,271.7322,0.0037581518,-0.0015895489,-12.92296,0.18992153,-271.68365,271.92053,2.7545533,3.2652986,-100.53064,-272.47272,-302.20938,6.0198517,0.3402415,-0.45462695,60.52932,780000
|
| 38 |
+
0.65918934,267.29782,0.003657455,0.001175498,-12.178602,0.19614746,-267.25327,267.49515,1.1689037,2.72911,-100.53631,-267.92908,-302.15457,3.8980136,0.3721612,-0.2927095,47.185394,785000
|
| 39 |
+
0.6551297,267.60748,0.0037770476,-0.0014016604,-12.871099,0.18457575,-267.55884,267.79065,1.1505593,3.8500214,-92.784584,-268.28668,-302.09323,5.000581,0.46957052,-0.51787186,55.484776,790000
|
| 40 |
+
0.64437544,274.30844,0.0037624014,-0.002751668,-13.2313595,0.17728835,-274.25864,274.48297,1.0767606,3.2063332,-99.75592,-275.05817,-302.25314,4.283094,0.3948908,-0.35243744,53.785606,795000
|
| 41 |
+
0.65053517,267.83148,0.0037197846,-0.0017665621,-12.97491,0.18130696,-267.7832,268.01102,1.32043,3.9499817,-100.02249,-268.51007,-301.8238,5.2704115,0.63997614,-0.593239,71.694534,800000
|
| 42 |
+
0.64911443,266.47412,0.0038120935,-0.0040965127,-13.57461,0.19973576,-266.4224,266.66977,1.2004035,3.8844197,-100.1654,-266.97552,-301.8238,5.084823,0.53984654,-1.0335474,73.162186,805000
|
| 43 |
+
0.655495,269.58185,0.0038578957,0.0039517735,-11.475666,0.1841974,-269.5376,269.77,1.6872886,4.3029757,-64.073006,-270.49017,-301.93796,5.9902644,0.32790726,-0.4501238,57.56745,810000
|
| 44 |
+
0.6573909,266.58142,0.0039331736,-0.0014566542,-12.870351,0.19900122,-266.53082,266.77896,1.3577803,3.5429757,-99.69999,-267.13876,-301.8658,4.900756,1.1475478,-1.1596252,74.87616,815000
|
| 45 |
+
0.63936394,270.84436,0.0038150756,-0.007658297,-14.507378,0.18479577,-270.78903,271.02148,2.0919387,5.2788625,-100.3765,-271.8668,-302.6625,7.370801,1.3846251,-1.6038991,86.65119,820000
|
| 46 |
+
0.648729,272.79358,0.0037088124,-0.006062066,-14.134503,0.17409143,-272.74115,272.9616,1.2881786,3.2632987,-100.42457,-273.70084,-302.21527,4.5514774,0.41460955,-0.39032212,52.774597,825000
|
| 47 |
+
0.6610179,272.65576,0.0038955153,-0.001395998,-12.85836,0.1935377,-272.60565,272.8479,1.3838911,3.6604664,-100.497955,-273.98846,-302.25656,5.0443573,2.9671757,-3.3839705,117.773285,830000
|
| 48 |
+
0.6601801,269.15533,0.0037171321,0.0059726527,-10.893209,0.19334565,-269.11487,269.35468,1.3788083,3.7868855,-35.912914,-269.70132,-302.29657,5.1656938,0.48227572,-0.47729427,62.551277,835000
|
| 49 |
+
0.6527548,272.41525,0.0037419512,-0.0061187977,-14.135189,0.18249744,-272.36237,272.5916,1.8275216,4.13918,-100.51181,-273.72638,-302.16803,5.9667015,0.7288239,-0.54262584,83.50334,840000
|
| 50 |
+
0.6582282,263.89417,0.0037672666,0.0036577238,-11.529078,0.16643319,-263.8507,264.06427,1.1193393,3.2770524,-100.352936,-264.5088,-301.87292,4.396392,0.30061695,-0.6510931,49.94743,845000
|
| 51 |
+
0.67328995,273.64423,0.0036910675,0.008979313,-10.067286,0.17413989,-273.60706,273.82733,1.07295,2.4257796,-100.51886,-274.5745,-302.0506,3.4987297,0.37312174,-0.35395652,41.047,850000
|
| 52 |
+
0.6620949,267.72824,0.0035442256,0.006353452,-10.707379,0.15968688,-267.6903,267.8943,1.1134614,2.7622223,-100.443535,-268.42258,-301.9861,3.8756838,0.4541137,-0.40776974,45.2773,855000
|
| 53 |
+
0.6618397,266.52298,0.00393807,0.0030862617,-11.716301,0.18310657,-266.47684,266.70917,1.3041114,7.2750688,-100.46683,-267.1515,-301.76785,8.57918,2.2191865,-2.6580071,121.59244,860000
|
| 54 |
+
0.6533215,267.40057,0.003762342,-0.007454606,-14.481374,0.16725983,-267.34607,267.5604,1.1724706,6.3376794,-100.29237,-268.59262,-302.06616,7.51015,2.2160082,-2.8992822,124.3933,865000
|
| 55 |
+
0.6562492,271.96085,0.003866181,-0.004631611,-13.697981,0.15756208,-271.9079,272.11377,1.0999882,2.9069898,-100.504135,-272.65515,-302.09705,4.006978,0.65927917,-0.74607915,55.26154,870000
|
| 56 |
+
0.66913724,264.36664,0.003611368,0.004257561,-11.321067,0.1507858,-264.32574,264.5217,1.5345849,4.6152334,-46.244503,-265.6049,-302.18274,6.1498184,1.1026285,-1.3601733,86.59449,875000
|
| 57 |
+
0.6636683,264.8285,0.0036402615,0.0029365495,-11.693314,0.16008234,-264.7859,264.99152,0.9788808,2.366919,-100.44101,-265.53162,-301.95114,3.3458,0.26526368,-0.25968072,41.559334,880000
|
| 58 |
+
0.6468257,270.21588,0.0036241903,-0.004829083,-13.8324585,0.14689961,-270.16577,270.35797,1.1687931,9.422801,-100.35209,-270.97925,-302.22025,10.591594,2.018222,-3.1048057,110.07703,885000
|
| 59 |
+
0.6461447,263.09058,0.0037098632,0.0005012923,-12.364876,0.17943624,-263.0447,263.2705,1.6749378,5.9441333,-100.33116,-264.10522,-302.1419,7.619071,2.151794,-1.8088377,102.804405,890000
|
| 60 |
+
0.66021454,269.9526,0.0035095215,0.006792475,-10.564558,0.15969497,-269.91553,270.1191,0.9322872,3.10505,-100.58293,-270.9451,-302.07788,4.0373373,0.45424384,-0.43698892,54.323105,895000
|
| 61 |
+
0.66197664,265.7981,0.0033639732,0.006701088,-10.507984,0.19541635,-265.76276,266.0002,1.0816616,3.0193062,-100.48033,-266.77637,-301.99734,4.100968,0.4085725,-0.6530709,62.319313,900000
|
| 62 |
+
0.6671115,265.05884,0.003592237,0.0070099793,-10.548575,0.19399711,-265.02094,265.25986,0.93832505,2.6000278,-100.5473,-265.7778,-302.05096,3.538353,0.9639817,-0.9009894,55.30027,905000
|
| 63 |
+
0.66151917,262.91718,0.003659395,-0.0023302846,-13.136795,0.1573484,-262.8691,263.0722,1.1342088,2.7609224,-100.5795,-263.65567,-301.95334,3.895131,0.45977432,-0.4626112,50.46396,910000
|
| 64 |
+
0.653595,258.65723,0.0036228236,0.0018967156,-11.976454,0.19648008,-258.61386,258.8556,1.764592,3.58401,-100.4971,-259.36542,-302.02216,5.348602,0.62245154,-0.7341853,62.574986,915000
|
| 65 |
+
0.6483198,254.42593,0.0036639783,0.005047957,-11.122274,0.17202798,-254.38518,254.60301,1.5955162,4.5989075,-100.49905,-255.17793,-301.9841,6.1944237,2.6763644,-2.3275902,58.103752,920000
|
| 66 |
+
0.6476367,266.43842,0.0034137154,-0.004865089,-13.925159,0.17111172,-266.39087,266.60468,1.137902,3.1888254,-100.59291,-267.6923,-302.3684,4.3267274,0.705848,-0.570204,63.18871,925000
|
| 67 |
+
0.65318525,262.54663,0.0033162443,-0.0038323011,-13.655615,0.16889957,-262.50137,262.7117,1.1323286,4.0779185,-99.20918,-263.7438,-302.0204,5.210247,1.4590633,-1.5592431,58.879574,930000
|
| 68 |
+
0.66932404,259.51343,0.0033202062,0.004214187,-11.230745,0.19490075,-259.47614,259.71255,1.5599394,3.2903168,-100.100006,-260.10397,-302.09268,4.850256,0.5375072,-1.2153078,72.12131,935000
|
| 69 |
+
0.66374177,268.33942,0.0036102177,0.0020057033,-11.944437,0.22149695,-268.2963,268.56293,1.0244169,3.1041832,-76.29529,-269.1538,-302.13806,4.1286,0.29003885,-0.45158648,46.08079,940000
|
| 70 |
+
0.6504146,268.75314,0.0035731783,-0.005332145,-13.9922695,0.18293487,-268.70312,268.93073,1.3270473,3.0762575,-100.547104,-269.61417,-302.02628,4.403305,0.54000056,-0.5164204,53.686012,945000
|
| 71 |
+
0.6574165,260.4666,0.0034873101,0.00211318,-11.894037,0.19335115,-260.42517,260.66208,1.4661762,3.7327282,-100.40828,-261.40952,-302.10504,5.1989045,0.49723673,-0.49004614,57.166683,950000
|
| 72 |
+
0.65548146,262.17993,0.0035360537,-0.0051515875,-13.956875,0.16228181,-262.1306,262.33707,1.3766781,3.0639176,-100.202965,-263.32184,-301.86752,4.4405956,0.5528027,-0.39287478,51.95656,955000
|
| 73 |
+
0.65107197,261.82092,0.003388576,0.00159385,-12.02964,0.1729756,-261.78015,261.99548,1.1703867,3.114214,-100.347694,-262.77863,-301.9634,4.2846007,0.4648233,-0.3965727,48.606712,960000
|
| 74 |
+
0.6661549,265.3406,0.0035074237,0.0054434114,-10.948031,0.18667775,-265.30222,265.5327,0.9779215,2.6708443,-100.29151,-266.2422,-302.21854,3.6487658,0.51597095,-0.42489243,50.358677,965000
|
| 75 |
+
0.6575464,255.9065,0.0034098045,-0.00066408486,-12.694757,0.17721546,-255.86319,256.08304,0.90043783,2.6858575,-100.386986,-256.65182,-302.25586,3.5862954,0.4231449,-0.25437003,43.70842,970000
|
| 76 |
+
0.649308,266.07803,0.0034312573,-0.0066645863,-14.442316,0.16034284,-266.0285,266.23172,1.2724144,3.9939384,-100.48485,-266.4668,-302.31454,5.2663527,0.3400584,-0.46184403,54.462784,975000
|
| 77 |
+
0.6522926,261.80508,0.0036192944,0.0019656194,-11.956905,0.16428359,-261.76184,261.9713,0.9875607,2.919735,-100.33143,-262.27228,-302.10007,3.9072957,0.53268695,-0.78171146,61.83064,980000
|
| 78 |
+
0.6512202,262.42133,0.0035295177,-0.0071881423,-14.536579,0.17982444,-262.37006,262.59393,1.0968493,4.3913054,-49.4598,-262.97372,-301.75958,5.488155,0.5305307,-0.50646114,62.904163,985000
|
| 79 |
+
0.66661865,257.80447,0.00354901,0.0055935145,-10.923923,0.17467946,-257.7657,257.98474,1.313959,6.9371614,-99.07322,-258.62634,-302.39502,8.251121,1.8784924,-1.8434556,122.2343,990000
|
| 80 |
+
0.6636648,260.98584,0.0035597538,0.00076375203,-12.285448,0.1873773,-260.94214,261.17398,1.108559,4.47976,-83.279655,-261.97324,-302.2838,5.5883193,0.8410831,-0.46107504,67.765884,995000
|
| 81 |
+
0.66208524,259.30103,0.003445495,0.0014641915,-12.075042,0.14321694,-259.2594,259.4457,1.4018606,2.8618677,-100.24382,-260.07614,-302.0657,4.263728,0.62505955,-0.67501634,57.50255,1000000
|
| 82 |
+
0.6563843,261.56732,0.003291683,0.0008740645,-12.234463,0.16956082,-261.52704,261.73776,1.2287104,2.3021333,-98.687386,-262.32965,-301.73425,3.5308437,0.3339681,-0.20846432,40.827415,1005000
|
| 83 |
+
0.6575555,261.71902,0.0034246047,-0.002886303,-13.3428135,0.16029927,-261.67334,261.87643,1.0223477,3.6841028,-100.32084,-262.9382,-302.02954,4.7064505,0.5777801,-0.42657185,49.97992,1010000
|
| 84 |
+
0.65986913,253.97835,0.0032079625,0.004040791,-11.240387,0.1672875,-253.94228,254.14967,0.9039529,2.9982402,-77.38086,-254.51314,-301.83215,3.902193,0.37866285,-0.52929825,52.62655,1015000
|
| 85 |
+
0.65653205,261.25128,0.0035637603,-0.00025887645,-12.572641,0.17411378,-261.20648,261.42514,1.5223082,3.4719715,-87.04904,-261.87656,-301.99847,4.99428,0.35514015,-0.4967986,57.897858,1020000
|
| 86 |
+
0.6466819,262.68057,0.003413686,-0.006351027,-14.36046,0.1829174,-262.63153,262.85715,1.4623327,2.860129,-100.20497,-263.39075,-301.71704,4.322462,0.30967557,-0.55739844,46.266136,1025000
|
| 87 |
+
0.63788277,258.57867,0.0035358616,-0.0064326907,-14.319271,0.16495992,-258.528,258.73718,1.4346595,3.6145241,-100.49186,-259.68927,-302.07196,5.049184,0.6463211,-0.49093282,60.29489,1030000
|
| 88 |
+
0.66567755,255.84885,0.0033925078,0.0022620838,-11.833212,0.19438323,-255.80872,256.0455,1.970167,3.3068447,-100.24884,-256.7745,-302.01016,5.277012,0.37441555,-0.5104859,58.61408,1035000
|
| 89 |
+
0.66435033,255.17026,0.0033634163,0.0012540288,-12.127156,0.13133073,-255.12949,255.30284,1.1782786,3.4121118,-100.32861,-255.84526,-301.78882,4.59039,0.36319596,-0.36807364,50.360268,1040000
|
| 90 |
+
0.6757802,250.94873,0.003363038,0.007452863,-10.28389,0.162705,-250.91415,251.11888,1.2173586,3.2410038,-100.325714,-251.69609,-301.66815,4.4583626,0.3045745,-0.33514184,47.349785,1045000
|
| 91 |
+
0.65868413,256.05756,0.0033161256,-0.0014648307,-12.94173,0.17703392,-256.01468,256.23312,1.0264419,6.2512813,-100.41937,-257.07617,-301.8181,7.2777233,4.16162,-4.355138,157.3187,1050000
|
| 92 |
+
0.66043305,258.94485,0.0032934318,0.005597549,-10.80039,0.1677081,-258.9093,259.11813,1.2221743,2.8265827,-100.393105,-259.7606,-301.74634,4.048757,0.57991415,-0.5750266,43.316387,1055000
|
| 93 |
+
0.67259246,249.124,0.0033077463,0.008967727,-9.788871,0.14581458,-249.09161,249.27878,0.99595225,2.7984827,-100.28707,-249.64258,-301.91867,3.794435,0.46866822,-0.37264475,49.812122,1060000
|
| 94 |
+
0.6648399,253.57108,0.00321276,1.9814413e-05,-12.493833,0.17383426,-253.53094,253.74492,0.9703397,2.2629964,-76.37273,-254.23257,-301.6983,3.2333362,0.30220306,-0.27435437,41.834404,1065000
|
| 95 |
+
0.6508809,257.8426,0.0032236075,-0.004686635,-13.953848,0.19176298,-257.79764,258.02966,1.0857394,2.135378,-100.252884,-258.66818,-302.21246,3.2211173,0.61322963,-0.3952656,40.82026,1070000
|
| 96 |
+
0.6628362,252.9418,0.003208201,-0.0011395738,-12.8552065,0.172108,-252.90054,253.11276,0.9686883,3.159973,-98.78411,-253.5697,-301.7716,4.128661,0.43265274,-0.5022519,50.93865,1075000
|
| 97 |
+
0.6601302,261.19073,0.003412633,0.0012177253,-12.143171,0.17706582,-261.14926,261.36902,1.3875456,6.8427033,-100.40241,-262.5093,-302.16165,8.230249,0.96499413,-1.0618275,85.32804,1080000
|
| 98 |
+
0.65358746,260.44183,0.003528148,-0.0050064507,-13.919003,0.1806401,-260.3927,260.61746,1.5575346,3.9258919,-100.04229,-261.48953,-301.78098,5.4834266,0.67183113,-0.6458342,62.174324,1085000
|
| 99 |
+
0.6409463,253.99141,0.0033565736,-0.0072531854,-14.66089,0.148981,-253.9422,254.13315,1.1538728,4.4246626,-98.58921,-254.87425,-301.86902,5.5785356,0.36390615,-0.41233966,50.758873,1090000
|
| 100 |
+
0.6549215,252.58218,0.0031111427,-0.002677074,-13.360479,0.14474939,-252.5406,252.72426,1.5096258,3.3212554,-100.328896,-253.3897,-301.99347,4.830881,0.30282882,-0.45452234,52.2667,1095000
|
| 101 |
+
0.65415996,260.1411,0.0031734062,-0.007133554,-14.747917,0.17787759,-260.09427,260.31186,1.0177258,3.4760556,-100.3434,-260.94058,-302.06018,4.4937816,0.54474056,-0.6318835,54.95204,1100000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.6504997,284.54138,0.004085998,-0.006619001,-14.119923,0.18388626,-284.4837,284.71866,3.3807702,28.504883,-90.47297,-285.5665,-302.4439,31.885653,10.357768,-9.98289,357.6926,605000
|
| 3 |
+
0.6478016,282.0464,0.0041553117,0.0011283954,-12.228445,0.1998589,-281.99554,282.24738,1.6476917,4.8711123,-150.77429,-283.01205,-302.34824,6.518804,0.42126134,-0.4458101,74.35222,610000
|
| 4 |
+
0.6428064,278.70673,0.003999462,-0.0025444117,-13.1361885,0.1751615,-278.65417,278.87936,1.5612558,5.9666696,-105.690865,-279.7839,-302.40845,7.5279255,1.1755121,-0.9647153,79.861786,615000
|
| 5 |
+
0.65051603,284.6095,0.00403049,-0.0007004203,-12.67378,0.18762535,-284.55844,284.79642,1.4117234,5.2962317,-170.39906,-285.60486,-302.07907,6.7079554,7.2454515,-8.526174,113.6392,620000
|
| 6 |
+
0.65095305,281.02594,0.004117626,-0.0033451552,-13.312399,0.18457477,-280.97113,281.20715,1.9785382,4.303195,-107.55443,-282.2463,-302.52435,6.281733,0.54824436,-0.39599818,64.1126,625000
|
| 7 |
+
0.6672955,281.88956,0.004308097,0.002936804,-11.818306,0.16768706,-281.83862,282.06018,1.7201141,3.3921661,1.635172,-282.88974,-302.20084,5.1122804,0.5732792,-0.49829602,60.24721,630000
|
| 8 |
+
0.6563405,285.43433,0.0044907224,0.0013745882,-12.193905,0.16701141,-285.37958,285.60272,1.2410973,6.4775863,-106.57421,-286.42197,-302.7244,7.7186837,0.51974833,-0.45442742,74.35426,635000
|
| 9 |
+
0.66647935,281.2837,0.0042677447,0.0053611523,-11.243797,0.17635617,-281.23572,281.46542,1.8867676,2.9301317,-100.42018,-282.05408,-302.1565,4.8168993,0.47594327,-0.4701286,54.659355,640000
|
| 10 |
+
0.65959454,282.0415,0.004293465,0.0077485754,-10.695263,0.18814553,-281.99557,282.2374,1.6822592,4.3437076,-100.66572,-282.64505,-302.84976,6.0259666,1.1514333,-0.97716403,75.38043,645000
|
| 11 |
+
0.6689639,280.47922,0.0039736377,0.005617475,-11.086314,0.20154971,-280.43518,280.68637,1.5160433,6.0953474,-101.79381,-281.1651,-302.23923,7.6113906,2.2220263,-1.7671739,116.399475,650000
|
| 12 |
+
0.6572093,280.24698,0.004085283,0.0025522965,-11.875246,0.21364272,-280.1985,280.4632,1.4064198,3.6725278,-95.70005,-281.22263,-302.1655,5.0789475,0.39335644,-0.36552173,54.769554,655000
|
| 13 |
+
0.6657053,280.43997,0.0040647928,0.003560799,-11.62399,0.21182105,-280.3927,280.65536,1.545876,4.971494,-101.13999,-281.2424,-302.2554,6.51737,0.9346866,-1.0780209,70.63568,660000
|
| 14 |
+
0.6591513,281.7384,0.0039912565,0.004345073,-11.411352,0.20291078,-281.69287,281.94565,1.2389992,3.0742466,-100.09523,-282.65137,-302.4358,4.313246,0.62534416,-0.61118966,63.528027,665000
|
| 15 |
+
0.65842336,274.20706,0.004229038,0.0036845137,-11.628758,0.19117351,-274.1579,274.40192,1.1736748,4.314482,-98.26389,-275.28586,-302.11145,5.4881573,0.6001086,-0.34835243,64.18293,670000
|
| 16 |
+
0.6333573,273.40933,0.004018726,-0.014900785,-16.207838,0.19432135,-273.3442,273.58878,3.2481675,6.4277163,-36.504097,-274.8353,-302.07788,9.675884,2.0589952,-2.1460817,125.88228,675000
|
| 17 |
+
0.64016646,275.03864,0.004235787,-0.013594109,-15.709347,0.18526626,-274.9721,275.21033,1.3921396,4.1134486,-101.48277,-276.3065,-302.10587,5.505588,0.4094207,-0.36997956,58.90889,680000
|
| 18 |
+
0.65633583,276.80267,0.0041421023,-0.00014315585,-12.534561,0.185472,-276.75073,276.988,1.932114,5.8326573,-69.66645,-277.55573,-302.93954,7.7647715,2.1212542,-2.6440485,123.62842,685000
|
| 19 |
+
0.6460991,278.14743,0.0040827747,-0.0017143452,-12.919897,0.17955594,-278.09467,278.3253,1.3917009,3.627028,-99.606125,-278.97775,-302.10345,5.0187287,0.5414173,-0.4970579,51.83245,690000
|
| 20 |
+
0.6518273,278.3634,0.004073792,-0.0006380841,-12.656631,0.21752767,-278.31186,278.5803,1.3495818,3.6974697,-100.43741,-279.07812,-302.2596,5.0470514,0.5975506,-0.59598887,60.641315,695000
|
| 21 |
+
0.6426185,274.3374,0.0041777957,-0.011646687,-15.287759,0.21071759,-274.27353,274.53647,1.5470618,5.1642427,-99.64983,-275.7501,-301.9394,6.7113047,0.9408855,-0.98743033,80.95,700000
|
| 22 |
+
0.6646004,278.33905,0.0042292015,0.00130375,-12.191727,0.19021134,-278.28748,278.53058,1.2506421,3.2056794,-100.340744,-279.20273,-302.38498,4.4563217,0.54955494,-0.45509213,55.71193,705000
|
| 23 |
+
0.6563952,278.41217,0.00397848,-0.0050121234,-13.759809,0.18463866,-278.35742,278.5918,1.7949384,3.8294868,-96.6458,-279.26117,-302.24255,5.6244254,0.436922,-0.6102747,69.45284,710000
|
| 24 |
+
0.6432556,274.26245,0.0039531756,-0.009997808,-15.0290575,0.18166175,-274.20306,274.4341,1.1201746,4.0488467,-100.46453,-275.58627,-302.2386,5.1690216,0.8554217,-0.78579766,57.415466,715000
|
| 25 |
+
0.6629102,271.6477,0.0043629864,0.011909936,-9.770233,0.18386328,-271.6051,271.84348,1.2721682,3.2004807,-100.518936,-272.09937,-302.2771,4.4726486,0.4227449,-0.5670564,64.25774,720000
|
| 26 |
+
0.67181593,278.6777,0.00396659,0.010518604,-9.8482,0.15314496,-278.63864,278.84137,1.5694951,5.0820017,-100.72572,-279.76205,-302.3493,6.651497,1.1189889,-0.83936894,70.42675,725000
|
| 27 |
+
0.66567016,276.03925,0.003949973,0.002528952,-11.859755,0.21087712,-275.99243,276.25266,1.2611805,3.2480752,-100.8085,-277.00754,-302.20322,4.509256,0.60976607,-0.5477825,52.63303,730000
|
| 28 |
+
0.6554237,277.1397,0.0037298677,0.0014420612,-12.113375,0.17121547,-277.09454,277.31235,1.3417376,4.2222295,-97.66419,-277.69467,-302.37436,5.563967,0.7630162,-0.7661927,70.9166,735000
|
| 29 |
+
0.65816236,273.05164,0.0039736964,0.0007909148,-12.300962,0.15830058,-273.00278,273.21072,1.0523132,2.92368,-100.41741,-273.71085,-302.07947,3.9759932,0.2418563,-0.33570126,41.563328,740000
|
| 30 |
+
0.65038824,269.95764,0.0040777046,0.005911154,-11.050372,0.1617017,-269.91254,270.12527,1.5199156,6.1452117,-100.90999,-270.91153,-302.12967,7.6651273,0.907551,-0.6612625,72.58172,745000
|
| 31 |
+
0.6583076,276.97766,0.0038434432,0.0060604415,-10.923174,0.16184947,-276.93567,277.14557,1.1972314,2.7274868,-100.85541,-277.5212,-302.00195,3.9247184,0.30106747,-0.31178424,47.47381,750000
|
| 32 |
+
0.66255355,274.28235,0.003938374,0.0006676046,-12.330487,0.17374106,-274.23376,274.45676,1.39605,3.6623726,-100.0489,-275.38913,-301.96262,5.0584226,0.4549357,-0.4355612,63.335648,755000
|
| 33 |
+
0.65908486,269.36945,0.003732257,0.005999233,-10.892599,0.21081056,-269.3288,269.58627,1.3376502,4.295505,-100.49804,-270.31723,-302.3182,5.6331553,0.43589658,-0.32912967,63.18409,760000
|
| 34 |
+
0.654271,270.6336,0.0038690357,0.00040097794,-12.396362,0.1748643,-270.58563,270.80887,1.4215109,3.1396298,-65.47958,-271.91568,-302.22836,4.561141,0.85873544,-0.3902073,63.998184,765000
|
| 35 |
+
0.6535411,270.37848,0.0037162814,0.0012282297,-12.1695,0.19127241,-270.33325,270.57098,9.628949,10.581454,-97.89274,-271.30173,-302.0192,20.210403,3.7526968,-4.461035,181.94443,770000
|
| 36 |
+
0.65444213,270.98657,0.0038277912,-0.0009124413,-12.738373,0.18418024,-270.93784,271.16983,1.7234051,10.418031,-66.42629,-272.03937,-302.20514,12.141436,1.9032061,-2.2997203,120.38511,775000
|
| 37 |
+
0.644589,271.7322,0.0037581518,-0.0015895489,-12.92296,0.18992153,-271.68365,271.92053,2.7545533,3.2652986,-100.53064,-272.47272,-302.20938,6.0198517,0.3402415,-0.45462695,60.52932,780000
|
| 38 |
+
0.65918934,267.29782,0.003657455,0.001175498,-12.178602,0.19614746,-267.25327,267.49515,1.1689037,2.72911,-100.53631,-267.92908,-302.15457,3.8980136,0.3721612,-0.2927095,47.185394,785000
|
| 39 |
+
0.6551297,267.60748,0.0037770476,-0.0014016604,-12.871099,0.18457575,-267.55884,267.79065,1.1505593,3.8500214,-92.784584,-268.28668,-302.09323,5.000581,0.46957052,-0.51787186,55.484776,790000
|
| 40 |
+
0.64437544,274.30844,0.0037624014,-0.002751668,-13.2313595,0.17728835,-274.25864,274.48297,1.0767606,3.2063332,-99.75592,-275.05817,-302.25314,4.283094,0.3948908,-0.35243744,53.785606,795000
|
| 41 |
+
0.65053517,267.83148,0.0037197846,-0.0017665621,-12.97491,0.18130696,-267.7832,268.01102,1.32043,3.9499817,-100.02249,-268.51007,-301.8238,5.2704115,0.63997614,-0.593239,71.694534,800000
|
| 42 |
+
0.64911443,266.47412,0.0038120935,-0.0040965127,-13.57461,0.19973576,-266.4224,266.66977,1.2004035,3.8844197,-100.1654,-266.97552,-301.8238,5.084823,0.53984654,-1.0335474,73.162186,805000
|
| 43 |
+
0.655495,269.58185,0.0038578957,0.0039517735,-11.475666,0.1841974,-269.5376,269.77,1.6872886,4.3029757,-64.073006,-270.49017,-301.93796,5.9902644,0.32790726,-0.4501238,57.56745,810000
|
| 44 |
+
0.6573909,266.58142,0.0039331736,-0.0014566542,-12.870351,0.19900122,-266.53082,266.77896,1.3577803,3.5429757,-99.69999,-267.13876,-301.8658,4.900756,1.1475478,-1.1596252,74.87616,815000
|
| 45 |
+
0.63936394,270.84436,0.0038150756,-0.007658297,-14.507378,0.18479577,-270.78903,271.02148,2.0919387,5.2788625,-100.3765,-271.8668,-302.6625,7.370801,1.3846251,-1.6038991,86.65119,820000
|
| 46 |
+
0.648729,272.79358,0.0037088124,-0.006062066,-14.134503,0.17409143,-272.74115,272.9616,1.2881786,3.2632987,-100.42457,-273.70084,-302.21527,4.5514774,0.41460955,-0.39032212,52.774597,825000
|
| 47 |
+
0.6610179,272.65576,0.0038955153,-0.001395998,-12.85836,0.1935377,-272.60565,272.8479,1.3838911,3.6604664,-100.497955,-273.98846,-302.25656,5.0443573,2.9671757,-3.3839705,117.773285,830000
|
| 48 |
+
0.6601801,269.15533,0.0037171321,0.0059726527,-10.893209,0.19334565,-269.11487,269.35468,1.3788083,3.7868855,-35.912914,-269.70132,-302.29657,5.1656938,0.48227572,-0.47729427,62.551277,835000
|
| 49 |
+
0.6527548,272.41525,0.0037419512,-0.0061187977,-14.135189,0.18249744,-272.36237,272.5916,1.8275216,4.13918,-100.51181,-273.72638,-302.16803,5.9667015,0.7288239,-0.54262584,83.50334,840000
|
| 50 |
+
0.6582282,263.89417,0.0037672666,0.0036577238,-11.529078,0.16643319,-263.8507,264.06427,1.1193393,3.2770524,-100.352936,-264.5088,-301.87292,4.396392,0.30061695,-0.6510931,49.94743,845000
|
| 51 |
+
0.67328995,273.64423,0.0036910675,0.008979313,-10.067286,0.17413989,-273.60706,273.82733,1.07295,2.4257796,-100.51886,-274.5745,-302.0506,3.4987297,0.37312174,-0.35395652,41.047,850000
|
| 52 |
+
0.6620949,267.72824,0.0035442256,0.006353452,-10.707379,0.15968688,-267.6903,267.8943,1.1134614,2.7622223,-100.443535,-268.42258,-301.9861,3.8756838,0.4541137,-0.40776974,45.2773,855000
|
| 53 |
+
0.6618397,266.52298,0.00393807,0.0030862617,-11.716301,0.18310657,-266.47684,266.70917,1.3041114,7.2750688,-100.46683,-267.1515,-301.76785,8.57918,2.2191865,-2.6580071,121.59244,860000
|
| 54 |
+
0.6533215,267.40057,0.003762342,-0.007454606,-14.481374,0.16725983,-267.34607,267.5604,1.1724706,6.3376794,-100.29237,-268.59262,-302.06616,7.51015,2.2160082,-2.8992822,124.3933,865000
|
| 55 |
+
0.6562492,271.96085,0.003866181,-0.004631611,-13.697981,0.15756208,-271.9079,272.11377,1.0999882,2.9069898,-100.504135,-272.65515,-302.09705,4.006978,0.65927917,-0.74607915,55.26154,870000
|
| 56 |
+
0.66913724,264.36664,0.003611368,0.004257561,-11.321067,0.1507858,-264.32574,264.5217,1.5345849,4.6152334,-46.244503,-265.6049,-302.18274,6.1498184,1.1026285,-1.3601733,86.59449,875000
|
| 57 |
+
0.6636683,264.8285,0.0036402615,0.0029365495,-11.693314,0.16008234,-264.7859,264.99152,0.9788808,2.366919,-100.44101,-265.53162,-301.95114,3.3458,0.26526368,-0.25968072,41.559334,880000
|
| 58 |
+
0.6468257,270.21588,0.0036241903,-0.004829083,-13.8324585,0.14689961,-270.16577,270.35797,1.1687931,9.422801,-100.35209,-270.97925,-302.22025,10.591594,2.018222,-3.1048057,110.07703,885000
|
| 59 |
+
0.6461447,263.09058,0.0037098632,0.0005012923,-12.364876,0.17943624,-263.0447,263.2705,1.6749378,5.9441333,-100.33116,-264.10522,-302.1419,7.619071,2.151794,-1.8088377,102.804405,890000
|
| 60 |
+
0.66021454,269.9526,0.0035095215,0.006792475,-10.564558,0.15969497,-269.91553,270.1191,0.9322872,3.10505,-100.58293,-270.9451,-302.07788,4.0373373,0.45424384,-0.43698892,54.323105,895000
|
| 61 |
+
0.66197664,265.7981,0.0033639732,0.006701088,-10.507984,0.19541635,-265.76276,266.0002,1.0816616,3.0193062,-100.48033,-266.77637,-301.99734,4.100968,0.4085725,-0.6530709,62.319313,900000
|
| 62 |
+
0.6671115,265.05884,0.003592237,0.0070099793,-10.548575,0.19399711,-265.02094,265.25986,0.93832505,2.6000278,-100.5473,-265.7778,-302.05096,3.538353,0.9639817,-0.9009894,55.30027,905000
|
| 63 |
+
0.66151917,262.91718,0.003659395,-0.0023302846,-13.136795,0.1573484,-262.8691,263.0722,1.1342088,2.7609224,-100.5795,-263.65567,-301.95334,3.895131,0.45977432,-0.4626112,50.46396,910000
|
| 64 |
+
0.653595,258.65723,0.0036228236,0.0018967156,-11.976454,0.19648008,-258.61386,258.8556,1.764592,3.58401,-100.4971,-259.36542,-302.02216,5.348602,0.62245154,-0.7341853,62.574986,915000
|
| 65 |
+
0.6483198,254.42593,0.0036639783,0.005047957,-11.122274,0.17202798,-254.38518,254.60301,1.5955162,4.5989075,-100.49905,-255.17793,-301.9841,6.1944237,2.6763644,-2.3275902,58.103752,920000
|
| 66 |
+
0.6476367,266.43842,0.0034137154,-0.004865089,-13.925159,0.17111172,-266.39087,266.60468,1.137902,3.1888254,-100.59291,-267.6923,-302.3684,4.3267274,0.705848,-0.570204,63.18871,925000
|
| 67 |
+
0.65318525,262.54663,0.0033162443,-0.0038323011,-13.655615,0.16889957,-262.50137,262.7117,1.1323286,4.0779185,-99.20918,-263.7438,-302.0204,5.210247,1.4590633,-1.5592431,58.879574,930000
|
| 68 |
+
0.66932404,259.51343,0.0033202062,0.004214187,-11.230745,0.19490075,-259.47614,259.71255,1.5599394,3.2903168,-100.100006,-260.10397,-302.09268,4.850256,0.5375072,-1.2153078,72.12131,935000
|
| 69 |
+
0.66374177,268.33942,0.0036102177,0.0020057033,-11.944437,0.22149695,-268.2963,268.56293,1.0244169,3.1041832,-76.29529,-269.1538,-302.13806,4.1286,0.29003885,-0.45158648,46.08079,940000
|
| 70 |
+
0.6504146,268.75314,0.0035731783,-0.005332145,-13.9922695,0.18293487,-268.70312,268.93073,1.3270473,3.0762575,-100.547104,-269.61417,-302.02628,4.403305,0.54000056,-0.5164204,53.686012,945000
|
| 71 |
+
0.6574165,260.4666,0.0034873101,0.00211318,-11.894037,0.19335115,-260.42517,260.66208,1.4661762,3.7327282,-100.40828,-261.40952,-302.10504,5.1989045,0.49723673,-0.49004614,57.166683,950000
|
| 72 |
+
0.65548146,262.17993,0.0035360537,-0.0051515875,-13.956875,0.16228181,-262.1306,262.33707,1.3766781,3.0639176,-100.202965,-263.32184,-301.86752,4.4405956,0.5528027,-0.39287478,51.95656,955000
|
| 73 |
+
0.65107197,261.82092,0.003388576,0.00159385,-12.02964,0.1729756,-261.78015,261.99548,1.1703867,3.114214,-100.347694,-262.77863,-301.9634,4.2846007,0.4648233,-0.3965727,48.606712,960000
|
| 74 |
+
0.6661549,265.3406,0.0035074237,0.0054434114,-10.948031,0.18667775,-265.30222,265.5327,0.9779215,2.6708443,-100.29151,-266.2422,-302.21854,3.6487658,0.51597095,-0.42489243,50.358677,965000
|
| 75 |
+
0.6575464,255.9065,0.0034098045,-0.00066408486,-12.694757,0.17721546,-255.86319,256.08304,0.90043783,2.6858575,-100.386986,-256.65182,-302.25586,3.5862954,0.4231449,-0.25437003,43.70842,970000
|
| 76 |
+
0.649308,266.07803,0.0034312573,-0.0066645863,-14.442316,0.16034284,-266.0285,266.23172,1.2724144,3.9939384,-100.48485,-266.4668,-302.31454,5.2663527,0.3400584,-0.46184403,54.462784,975000
|
| 77 |
+
0.6522926,261.80508,0.0036192944,0.0019656194,-11.956905,0.16428359,-261.76184,261.9713,0.9875607,2.919735,-100.33143,-262.27228,-302.10007,3.9072957,0.53268695,-0.78171146,61.83064,980000
|
| 78 |
+
0.6512202,262.42133,0.0035295177,-0.0071881423,-14.536579,0.17982444,-262.37006,262.59393,1.0968493,4.3913054,-49.4598,-262.97372,-301.75958,5.488155,0.5305307,-0.50646114,62.904163,985000
|
| 79 |
+
0.66661865,257.80447,0.00354901,0.0055935145,-10.923923,0.17467946,-257.7657,257.98474,1.313959,6.9371614,-99.07322,-258.62634,-302.39502,8.251121,1.8784924,-1.8434556,122.2343,990000
|
| 80 |
+
0.6636648,260.98584,0.0035597538,0.00076375203,-12.285448,0.1873773,-260.94214,261.17398,1.108559,4.47976,-83.279655,-261.97324,-302.2838,5.5883193,0.8410831,-0.46107504,67.765884,995000
|
| 81 |
+
0.66208524,259.30103,0.003445495,0.0014641915,-12.075042,0.14321694,-259.2594,259.4457,1.4018606,2.8618677,-100.24382,-260.07614,-302.0657,4.263728,0.62505955,-0.67501634,57.50255,1000000
|
| 82 |
+
0.6563843,261.56732,0.003291683,0.0008740645,-12.234463,0.16956082,-261.52704,261.73776,1.2287104,2.3021333,-98.687386,-262.32965,-301.73425,3.5308437,0.3339681,-0.20846432,40.827415,1005000
|
| 83 |
+
0.6575555,261.71902,0.0034246047,-0.002886303,-13.3428135,0.16029927,-261.67334,261.87643,1.0223477,3.6841028,-100.32084,-262.9382,-302.02954,4.7064505,0.5777801,-0.42657185,49.97992,1010000
|
| 84 |
+
0.65986913,253.97835,0.0032079625,0.004040791,-11.240387,0.1672875,-253.94228,254.14967,0.9039529,2.9982402,-77.38086,-254.51314,-301.83215,3.902193,0.37866285,-0.52929825,52.62655,1015000
|
| 85 |
+
0.65653205,261.25128,0.0035637603,-0.00025887645,-12.572641,0.17411378,-261.20648,261.42514,1.5223082,3.4719715,-87.04904,-261.87656,-301.99847,4.99428,0.35514015,-0.4967986,57.897858,1020000
|
| 86 |
+
0.6466819,262.68057,0.003413686,-0.006351027,-14.36046,0.1829174,-262.63153,262.85715,1.4623327,2.860129,-100.20497,-263.39075,-301.71704,4.322462,0.30967557,-0.55739844,46.266136,1025000
|
| 87 |
+
0.63788277,258.57867,0.0035358616,-0.0064326907,-14.319271,0.16495992,-258.528,258.73718,1.4346595,3.6145241,-100.49186,-259.68927,-302.07196,5.049184,0.6463211,-0.49093282,60.29489,1030000
|
| 88 |
+
0.66567755,255.84885,0.0033925078,0.0022620838,-11.833212,0.19438323,-255.80872,256.0455,1.970167,3.3068447,-100.24884,-256.7745,-302.01016,5.277012,0.37441555,-0.5104859,58.61408,1035000
|
| 89 |
+
0.66435033,255.17026,0.0033634163,0.0012540288,-12.127156,0.13133073,-255.12949,255.30284,1.1782786,3.4121118,-100.32861,-255.84526,-301.78882,4.59039,0.36319596,-0.36807364,50.360268,1040000
|
| 90 |
+
0.6757802,250.94873,0.003363038,0.007452863,-10.28389,0.162705,-250.91415,251.11888,1.2173586,3.2410038,-100.325714,-251.69609,-301.66815,4.4583626,0.3045745,-0.33514184,47.349785,1045000
|
| 91 |
+
0.65868413,256.05756,0.0033161256,-0.0014648307,-12.94173,0.17703392,-256.01468,256.23312,1.0264419,6.2512813,-100.41937,-257.07617,-301.8181,7.2777233,4.16162,-4.355138,157.3187,1050000
|
| 92 |
+
0.66043305,258.94485,0.0032934318,0.005597549,-10.80039,0.1677081,-258.9093,259.11813,1.2221743,2.8265827,-100.393105,-259.7606,-301.74634,4.048757,0.57991415,-0.5750266,43.316387,1055000
|
| 93 |
+
0.67259246,249.124,0.0033077463,0.008967727,-9.788871,0.14581458,-249.09161,249.27878,0.99595225,2.7984827,-100.28707,-249.64258,-301.91867,3.794435,0.46866822,-0.37264475,49.812122,1060000
|
| 94 |
+
0.6648399,253.57108,0.00321276,1.9814413e-05,-12.493833,0.17383426,-253.53094,253.74492,0.9703397,2.2629964,-76.37273,-254.23257,-301.6983,3.2333362,0.30220306,-0.27435437,41.834404,1065000
|
| 95 |
+
0.6508809,257.8426,0.0032236075,-0.004686635,-13.953848,0.19176298,-257.79764,258.02966,1.0857394,2.135378,-100.252884,-258.66818,-302.21246,3.2211173,0.61322963,-0.3952656,40.82026,1070000
|
| 96 |
+
0.6628362,252.9418,0.003208201,-0.0011395738,-12.8552065,0.172108,-252.90054,253.11276,0.9686883,3.159973,-98.78411,-253.5697,-301.7716,4.128661,0.43265274,-0.5022519,50.93865,1075000
|
| 97 |
+
0.6601302,261.19073,0.003412633,0.0012177253,-12.143171,0.17706582,-261.14926,261.36902,1.3875456,6.8427033,-100.40241,-262.5093,-302.16165,8.230249,0.96499413,-1.0618275,85.32804,1080000
|
| 98 |
+
0.65358746,260.44183,0.003528148,-0.0050064507,-13.919003,0.1806401,-260.3927,260.61746,1.5575346,3.9258919,-100.04229,-261.48953,-301.78098,5.4834266,0.67183113,-0.6458342,62.174324,1085000
|
| 99 |
+
0.6409463,253.99141,0.0033565736,-0.0072531854,-14.66089,0.148981,-253.9422,254.13315,1.1538728,4.4246626,-98.58921,-254.87425,-301.86902,5.5785356,0.36390615,-0.41233966,50.758873,1090000
|
| 100 |
+
0.6549215,252.58218,0.0031111427,-0.002677074,-13.360479,0.14474939,-252.5406,252.72426,1.5096258,3.3212554,-100.328896,-253.3897,-301.99347,4.830881,0.30282882,-0.45452234,52.2667,1095000
|
| 101 |
+
0.65415996,260.1411,0.0031734062,-0.007133554,-14.747917,0.17787759,-260.09427,260.31186,1.0177258,3.4760556,-100.3434,-260.94058,-302.06018,4.4937816,0.54474056,-0.6318835,54.95204,1100000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3ae9ed44c79a316e7bbe03d5b001b236f0db89f7c4442eb1383e13fcdb50058
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff32c3a2e939f45d632c5b9a2a73cc1128ea00730e05084592851a8dacbf9409
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:859d164fae7daa9fa5c70589b952f70dce59db7b38e01564276a5b7bd0d440b1
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5da0e69fcc3a2f6fc9b8dd4a548c01273dc06fc601d1e7936ad1107335a1b0ed
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa2068e3e3ef57cecbb928d5ca8c1162d55fc527852d914d5bb2ac0292cdaee7
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d6ab9fe1854be08866761cd0573aa75a6629ff34ddbf0a96e537fde0ba216327
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04e47b32eab0b4ae2b1d28ba71647d9d85350ab8d5e37a52b0bbacee48cfa788
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f1cbbd2081dca6470225f68be89512af7358661ea392bbe28fdd14e2bcdc3c4
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32b704dfb67c6b33f9257b1c169e249d6b1c54cb5e657d4c564acd69160ac058
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:edaefbfd4687dbe178e63d3dd7510f13bcd68ee612770167fc3324b11c11812b
|
| 3 |
+
size 328782656
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260326_204045/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/3zxosq5o
|