Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/env.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_350000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_400000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_450000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_500000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.08937466593615219,-0.005615782414502466,-0.08937671056909942,0.0009815154215385292,16.0658406213652,42.82100000001025,0.3,21923.68,-0.7,-854.12,854.42,2.510898690223694,350000
|
| 3 |
+
0.0,0.0,-0.06512802088601903,-0.012288582558944843,-0.06561470579090241,-0.012245239071936491,23.80186652162872,20.66900000000412,0.74,56344.02,-0.26,-415.0,411.38,1.2676726484298706,400000
|
| 4 |
+
0.0,0.0,-0.019438184731233963,-0.0038353621132485266,-0.019393758808160484,-0.0029174762174196903,34.59172045991821,4.269000000000164,0.98,67701.4,-0.02,-82.4,83.38,0.2909025478363037,450000
|
| 5 |
+
0.0,0.0,-0.03779894249237325,0.009298536282358095,-0.03716815645892263,0.0013632462386282895,35.07498458153072,2.7149999999999337,1.0,70733.3,0.0,-51.3,52.3,0.18175065994262696,500000
|
| 6 |
+
0.0,0.0,-0.033219418977903044,0.012084468898178307,-0.0323219569947234,0.01172670463607988,35.68549431334374,1.8669999999999822,1.0,73238.94,0.0,-34.34,35.34,0.1271272373199463,550000
|
| 7 |
+
0.0,0.0,-0.03656118236958592,0.028101287598466335,-0.03503705235113229,0.021950300495383875,35.610860180647514,1.685999999999996,1.0,74950.84,0.0,-30.72,31.72,0.11518264770507812,600000
|
| 8 |
+
0.0,0.0,-0.030296507574174025,0.02548515101663337,-0.02868534295215926,0.024229313081812098,35.71053878093133,2.1789999999999723,1.0,76690.14,0.0,-40.58,41.58,0.14509506702423094,650000
|
| 9 |
+
0.0,0.0,-0.0443371192707943,0.02915653911915694,-0.04231464748281095,0.04184743401747342,35.66903232245783,2.2540000000000058,1.0,79059.92,0.0,-42.08,43.08,0.1489090585708618,700000
|
| 10 |
+
0.0,0.0,-0.02465517425055975,0.037639558934508044,-0.022692288568313325,0.03068106007624631,35.69426774327665,1.5649999999999933,1.0,80879.38,0.0,-28.3,29.3,0.10564068794250488,750000
|
| 11 |
+
0.0,0.0,-0.04162954510011876,0.0367857303340405,-0.03977567190645938,0.03756815756750879,35.58854449798936,1.6299999999999883,1.0,82464.12,0.0,-29.6,30.6,0.11070118427276611,800000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.08937466593615219,-0.005615782414502466,-0.08937671056909942,0.0009815154215385292,16.0658406213652,42.82100000001025,0.3,21923.68,-0.7,-854.12,854.42,2.510898690223694,350000
|
| 3 |
+
0.0,0.0,-0.06512802088601903,-0.012288582558944843,-0.06561470579090241,-0.012245239071936491,23.80186652162872,20.66900000000412,0.74,56344.02,-0.26,-415.0,411.38,1.2676726484298706,400000
|
| 4 |
+
0.0,0.0,-0.019438184731233963,-0.0038353621132485266,-0.019393758808160484,-0.0029174762174196903,34.59172045991821,4.269000000000164,0.98,67701.4,-0.02,-82.4,83.38,0.2909025478363037,450000
|
| 5 |
+
0.0,0.0,-0.03779894249237325,0.009298536282358095,-0.03716815645892263,0.0013632462386282895,35.07498458153072,2.7149999999999337,1.0,70733.3,0.0,-51.3,52.3,0.18175065994262696,500000
|
| 6 |
+
0.0,0.0,-0.033219418977903044,0.012084468898178307,-0.0323219569947234,0.01172670463607988,35.68549431334374,1.8669999999999822,1.0,73238.94,0.0,-34.34,35.34,0.1271272373199463,550000
|
| 7 |
+
0.0,0.0,-0.03656118236958592,0.028101287598466335,-0.03503705235113229,0.021950300495383875,35.610860180647514,1.685999999999996,1.0,74950.84,0.0,-30.72,31.72,0.11518264770507812,600000
|
| 8 |
+
0.0,0.0,-0.030296507574174025,0.02548515101663337,-0.02868534295215926,0.024229313081812098,35.71053878093133,2.1789999999999723,1.0,76690.14,0.0,-40.58,41.58,0.14509506702423094,650000
|
| 9 |
+
0.0,0.0,-0.0443371192707943,0.02915653911915694,-0.04231464748281095,0.04184743401747342,35.66903232245783,2.2540000000000058,1.0,79059.92,0.0,-42.08,43.08,0.1489090585708618,700000
|
| 10 |
+
0.0,0.0,-0.02465517425055975,0.037639558934508044,-0.022692288568313325,0.03068106007624631,35.69426774327665,1.5649999999999933,1.0,80879.38,0.0,-28.3,29.3,0.10564068794250488,750000
|
| 11 |
+
0.0,0.0,-0.04162954510011876,0.0367857303340405,-0.03977567190645938,0.03756815756750879,35.58854449798936,1.6299999999999883,1.0,82464.12,0.0,-29.6,30.6,0.11070118427276611,800000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0,0.00785593,0.7855931,1.0078559,4.702727,-117.951675,-277.43326,-308.47235,2.4461327,-1.2623036,73.72482,305000
|
| 3 |
+
1.0,1.0,0.008356346,0.8356347,1.0083563,3.0130782,-144.87886,-275.0844,-308.0339,0.5202177,-0.5235604,39.834656,310000
|
| 4 |
+
1.0,1.0,0.008402732,0.84027326,1.0084027,3.9131355,-110.53178,-270.7399,-309.8808,0.6785216,-0.4559435,54.76413,315000
|
| 5 |
+
1.0,1.0000001,0.008296741,0.8296742,1.0082968,3.4446914,-181.69012,-276.91116,-308.32666,0.54522634,-0.7216768,43.61008,320000
|
| 6 |
+
1.0,1.0,0.009025304,0.9025304,1.0090253,2.4588673,-106.25509,-276.1235,-308.50208,0.7244345,-0.32419902,35.097923,325000
|
| 7 |
+
1.0,1.0,0.0077135325,0.7713533,1.0077136,2.6787655,1.7600244,-275.22263,-308.09073,0.73953855,-0.760645,48.06979,330000
|
| 8 |
+
1.0,1.0,0.008454563,0.84545624,1.0084546,2.7475092,-105.449844,-278.58054,-309.9474,0.37052786,-0.5322874,38.241196,335000
|
| 9 |
+
1.0,0.99999994,0.008246486,0.8246486,1.0082464,3.120067,-100.266945,-275.2226,-309.602,0.40093112,-0.42960668,42.21204,340000
|
| 10 |
+
1.0,1.0,0.007723704,0.7723704,1.0077237,2.7239673,-101.18325,-276.57495,-308.72186,0.4877918,-0.60518676,38.10908,345000
|
| 11 |
+
1.0,1.0,0.007833427,0.7833428,1.0078335,2.8081405,-57.556915,-274.38205,-309.32922,0.7012021,-0.7899197,41.1869,350000
|
| 12 |
+
1.0,1.0,0.0075464062,0.75464064,1.0075464,2.6121807,-50.866753,-272.57544,-308.04034,0.4528672,-0.39407653,36.035812,355000
|
| 13 |
+
1.0,1.0,0.008711021,0.87110215,1.008711,2.9785614,-101.64322,-273.36935,-308.8308,0.36039454,-0.38567796,43.14878,360000
|
| 14 |
+
1.0,1.0,0.008991418,0.8991418,1.0089914,3.170436,-97.23434,-274.2341,-308.64233,0.6809511,-0.8693867,49.855453,365000
|
| 15 |
+
1.0,1.0,0.008614775,0.8614775,1.0086148,3.0229006,-16.063234,-267.24805,-308.01517,0.47216213,-0.39800018,38.18885,370000
|
| 16 |
+
1.0,1.0,0.008453641,0.8453641,1.0084536,3.4975793,-27.16941,-265.1312,-309.29816,4.2453666,-3.4748027,96.386765,375000
|
| 17 |
+
1.0,1.0,0.008816572,0.88165724,1.0088166,3.0952375,-89.88906,-267.72714,-307.62,0.56103116,-0.83132625,46.345787,380000
|
| 18 |
+
1.0,1.0,0.008921676,0.8921676,1.0089216,4.185446,-16.129288,-267.83344,-308.3797,0.658519,-0.6012849,53.02057,385000
|
| 19 |
+
1.0,0.99999994,0.008851864,0.88518643,1.0088518,2.9359376,-39.643433,-269.0025,-309.5515,0.4565323,-0.63322306,42.416374,390000
|
| 20 |
+
1.0,1.0,0.0091171935,0.91171944,1.0091172,2.9902508,-66.7269,-270.47345,-308.28265,0.3133789,-0.5125977,37.49151,395000
|
| 21 |
+
1.0,1.0,0.0079643065,0.7964306,1.0079643,3.4428918,-73.73259,-266.85696,-309.37723,0.8988309,-0.7043295,49.05326,400000
|
| 22 |
+
1.0,0.9999999,0.007886119,0.788612,1.007886,2.419428,-63.72022,-271.0032,-308.00168,0.43775457,-0.4580328,33.955868,405000
|
| 23 |
+
1.0,0.99999994,0.009078741,0.9078742,1.0090787,3.3152223,-33.234524,-271.93707,-308.04703,0.55414355,-0.64743036,42.39855,410000
|
| 24 |
+
1.0,0.99999994,0.008100722,0.81007224,1.0081006,3.543015,-17.628792,-265.05313,-308.26077,7.6353817,-8.643481,126.734146,415000
|
| 25 |
+
1.0,1.0,0.008181304,0.8181304,1.0081813,3.4564216,-40.191982,-263.79395,-308.077,0.8363586,-1.0858083,54.619514,420000
|
| 26 |
+
1.0,0.9999999,0.0079464,0.79463995,1.0079463,4.2154627,-5.482759,-270.74368,-308.87296,1.3652726,-1.1924601,72.653046,425000
|
| 27 |
+
1.0,1.0,0.008490477,0.84904766,1.0084904,3.2752922,-19.900806,-267.24738,-307.48126,0.9963584,-1.2265433,52.226692,430000
|
| 28 |
+
1.0,1.0,0.008225711,0.82257116,1.0082257,3.0927575,-29.382977,-266.71567,-308.47382,0.82282364,-0.46754977,41.39809,435000
|
| 29 |
+
1.0,1.0,0.008814504,0.8814504,1.0088145,3.1262653,-21.634598,-263.4785,-308.279,0.64281553,-0.60786945,44.1144,440000
|
| 30 |
+
1.0,0.9999999,0.009098262,0.90982616,1.0090982,3.2471406,-23.268078,-260.32022,-308.55524,0.7138075,-0.92641366,45.11567,445000
|
| 31 |
+
1.0,1.0,0.008174076,0.8174076,1.0081741,3.2823417,-31.918728,-264.49167,-308.54147,0.36804387,-0.53015107,41.314804,450000
|
| 32 |
+
1.0,1.0000001,0.008430123,0.84301233,1.0084302,2.8414676,-12.521734,-263.05722,-308.04565,0.49321267,-0.42278036,38.37408,455000
|
| 33 |
+
1.0,1.0,0.007996617,0.79966164,1.0079966,4.2213907,-15.178493,-257.82504,-307.44577,0.58802056,-0.8274279,53.648766,460000
|
| 34 |
+
1.0,0.9999999,0.009291027,0.9291027,1.0092909,3.8576562,-29.980982,-260.14468,-307.8513,0.6671751,-0.6901789,49.336143,465000
|
| 35 |
+
1.0,1.0,0.010190487,1.0190487,1.0101905,5.3030143,-33.790195,-259.3618,-307.84186,3.9271052,-4.644583,133.31926,470000
|
| 36 |
+
1.0,0.99999994,0.0088913385,0.88913393,1.0088912,2.759516,-22.699883,-260.6229,-307.7081,1.140947,-1.235324,46.245575,475000
|
| 37 |
+
1.0,1.0,0.010065379,1.0065379,1.0100654,3.79588,-18.596523,-257.60657,-307.79462,0.53756654,-0.66322017,49.01293,480000
|
| 38 |
+
1.0,1.0,0.008916997,0.89169973,1.008917,3.3668308,-12.396543,-253.7563,-307.43643,0.80684745,-1.0061558,49.43993,485000
|
| 39 |
+
1.0,1.0000001,0.008659607,0.8659607,1.0086597,3.2869918,-8.342705,-256.95377,-307.978,0.5285134,-0.70570505,41.65285,490000
|
| 40 |
+
1.0,1.0,0.008686377,0.8686377,1.0086864,2.7866414,-14.470641,-262.3191,-307.38303,0.41415468,-0.6785805,38.636494,495000
|
| 41 |
+
1.0,1.0000001,0.01015677,1.015677,1.0101569,3.101947,-12.437152,-254.71806,-309.06583,0.80873364,-0.5659415,38.87712,500000
|
| 42 |
+
1.0,1.0,0.010326498,1.0326499,1.0103265,5.087914,-6.4758415,-252.82393,-307.65274,1.1039551,-1.3740246,71.79954,505000
|
| 43 |
+
1.0,1.0,0.009073533,0.9073532,1.0090735,3.3254478,-10.679778,-257.78494,-308.61325,0.977865,-0.7173711,46.933662,510000
|
| 44 |
+
1.0,0.99999994,0.0094210245,0.94210243,1.009421,3.3178048,-8.799489,-252.21207,-309.67346,0.6801572,-0.45887184,42.902603,515000
|
| 45 |
+
1.0,0.99999994,0.009526489,0.9526489,1.0095264,3.9016912,-15.923454,-258.89044,-307.83267,0.6373737,-0.6349619,49.257244,520000
|
| 46 |
+
1.0,1.0,0.008543294,0.85432947,1.0085433,3.3495736,-3.0127976,-258.78635,-309.60968,0.9985571,-0.5816699,44.12215,525000
|
| 47 |
+
1.0,0.9999999,0.008479835,0.8479836,1.0084797,4.374055,-2.3834414,-259.83292,-306.89746,0.71525615,-0.78255314,52.708755,530000
|
| 48 |
+
1.0,1.0,0.009523101,0.9523101,1.0095232,3.1473794,-12.465159,-256.7303,-307.30618,0.6289184,-0.42370695,41.44025,535000
|
| 49 |
+
1.0,0.99999994,0.009056784,0.9056784,1.0090567,5.0916553,-13.668211,-258.8898,-307.70306,1.1565529,-1.194078,71.96095,540000
|
| 50 |
+
1.0,1.0,0.008975025,0.89750254,1.008975,3.0393894,-3.0611427,-250.32524,-308.40964,1.387765,-0.8497225,45.549088,545000
|
| 51 |
+
1.0,1.0,0.008721847,0.8721847,1.0087218,3.4251516,-10.170684,-263.94022,-309.6008,0.5910192,-0.48101568,41.645576,550000
|
| 52 |
+
1.0,1.0,0.008025066,0.8025066,1.008025,4.4145164,-6.2212877,-253.52132,-307.66052,1.4652073,-0.81934136,52.170425,555000
|
| 53 |
+
1.0,1.0,0.008100238,0.81002384,1.0081003,4.1577706,-4.347078,-254.4943,-308.83627,1.0665087,-0.8480296,52.697483,560000
|
| 54 |
+
1.0,0.99999994,0.008869037,0.88690364,1.0088689,2.93138,-5.4848995,-254.11546,-307.7971,0.92098737,-0.9755837,50.523834,565000
|
| 55 |
+
1.0,0.99999994,0.008595247,0.85952467,1.0085952,3.5953834,-3.5627196,-258.65097,-308.24323,0.5893711,-0.9080859,47.654602,570000
|
| 56 |
+
1.0,1.0000001,0.009083425,0.9083425,1.0090835,3.6636512,-9.965988,-250.88379,-308.1318,0.8959178,-2.2244518,54.25733,575000
|
| 57 |
+
1.0,1.0,0.009250335,0.92503357,1.0092503,3.891436,-5.3719835,-249.48462,-307.43576,0.55107033,-0.6562445,47.463085,580000
|
| 58 |
+
1.0,1.0,0.008368658,0.83686584,1.0083686,3.4764752,-3.1309905,-257.39532,-308.5103,1.643563,-0.81552106,42.80628,585000
|
| 59 |
+
1.0,1.0,0.009151539,0.9151539,1.0091516,3.2299173,-12.838133,-249.62373,-308.4405,0.9740074,-1.1616461,53.439884,590000
|
| 60 |
+
1.0,1.0,0.009351702,0.93517023,1.0093517,2.5728707,-8.773279,-255.62315,-308.61395,0.5249576,-0.48927724,36.920155,595000
|
| 61 |
+
1.0,1.0000001,0.009864879,0.98648787,1.009865,2.658858,-2.8194811,-249.51476,-307.447,0.36746243,-0.64136994,32.620094,600000
|
| 62 |
+
1.0,1.0000001,0.008525873,0.8525873,1.008526,3.2646272,-4.5251184,-249.31438,-308.9289,1.1814493,-0.9229969,48.301746,605000
|
| 63 |
+
1.0,1.0,0.009636126,0.9636127,1.0096362,4.4293833,-4.409541,-247.40239,-308.47736,0.81613696,-1.297333,51.435883,610000
|
| 64 |
+
1.0,1.0,0.010194886,1.0194886,1.0101949,4.3336535,-1.7642816,-243.85562,-308.47452,0.84476274,-1.310475,62.825043,615000
|
| 65 |
+
1.0,1.0,0.009248164,0.9248163,1.0092481,3.3315415,-2.7860012,-236.03496,-307.24783,0.7335463,-0.51876193,38.94253,620000
|
| 66 |
+
1.0,1.0000001,0.009072296,0.90722966,1.0090724,3.1952102,-4.4206877,-252.76323,-308.33444,0.59968454,-0.74100405,43.33814,625000
|
| 67 |
+
1.0,1.0,0.010183897,1.0183896,1.0101839,5.562764,-3.7290096,-245.48315,-307.17014,0.92904377,-0.7738714,48.86163,630000
|
| 68 |
+
1.0,0.99999994,0.008801086,0.8801086,1.008801,3.7996926,-3.2540002,-244.81157,-308.8446,0.56598777,-1.0225701,54.57209,635000
|
| 69 |
+
1.0,0.9999999,0.009801201,0.9801201,1.009801,2.6049469,-5.0259666,-255.13525,-307.1581,0.3677331,-0.84278506,33.17868,640000
|
| 70 |
+
1.0,1.0,0.008967355,0.8967355,1.0089674,2.958796,-4.086124,-254.85425,-308.9256,1.44717,-0.76133347,48.89281,645000
|
| 71 |
+
1.0,1.0,0.009939823,0.9939823,1.0099398,3.1035047,-4.604482,-243.80937,-307.79144,0.6121385,-1.500116,45.66456,650000
|
| 72 |
+
1.0,1.0,0.009191365,0.9191365,1.0091914,2.6049368,-6.5639057,-248.92174,-306.95813,0.49030876,-0.829157,36.30104,655000
|
| 73 |
+
1.0,1.0,0.009631756,0.96317565,1.0096318,9.944594,-5.3428235,-247.44678,-307.37555,3.446837,-4.9693146,157.95544,660000
|
| 74 |
+
1.0,0.9999999,0.008536801,0.8536801,1.0085367,2.5057862,-6.36908,-251.19742,-308.04843,1.3449281,-0.43434024,34.566406,665000
|
| 75 |
+
1.0,1.0,0.009419918,0.9419918,1.0094199,3.5329025,-1.35811,-239.11226,-307.78195,2.120259,-0.916797,58.930847,670000
|
| 76 |
+
1.0,1.0,0.008477688,0.8477688,1.0084777,2.6519277,-5.2959614,-250.52122,-307.88333,0.5841159,-0.38301232,33.531662,675000
|
| 77 |
+
1.0,0.99999994,0.008195851,0.8195851,1.0081958,2.6619713,0.12420201,-248.07994,-307.18442,0.44843492,-1.0610954,36.460793,680000
|
| 78 |
+
1.0,1.0,0.00884612,0.88461196,1.0088462,4.7210693,-4.407738,-246.19505,-307.7681,0.8080863,-0.48033643,47.94139,685000
|
| 79 |
+
1.0,1.0000001,0.01025916,1.025916,1.0102593,3.4668312,-5.8578825,-240.92847,-307.35205,1.3070061,-1.1277702,44.765373,690000
|
| 80 |
+
1.0,1.0,0.00916224,0.9162241,1.0091622,2.9837897,-2.926696,-245.40157,-307.8804,0.86676013,-1.1294924,44.55094,695000
|
| 81 |
+
1.0,1.0,0.009536259,0.9536259,1.0095363,2.8661785,-5.543932,-243.45445,-307.8719,0.55518365,-0.48128554,36.56855,700000
|
| 82 |
+
1.0,1.0,0.00921509,0.921509,1.0092151,2.440123,-5.0327907,-245.3908,-306.93027,0.7779575,-0.24579504,31.579025,705000
|
| 83 |
+
1.0,1.0,0.008812979,0.88129795,1.008813,5.238676,1.278112,-246.36375,-307.549,1.8078866,-1.817775,73.88407,710000
|
| 84 |
+
1.0,1.0,0.009854284,0.9854285,1.0098543,2.5699766,-4.267187,-235.84293,-307.82907,0.5441705,-0.6731831,38.490746,715000
|
| 85 |
+
1.0,1.0,0.008964989,0.896499,1.008965,3.1504152,-3.2432752,-243.40747,-308.3661,0.70773095,-0.7078953,39.844795,720000
|
| 86 |
+
1.0,1.0000001,0.00876451,0.876451,1.0087646,2.7766702,-2.2141962,-246.8872,-307.29294,0.38993728,-0.434227,33.7341,725000
|
| 87 |
+
1.0,1.0000001,0.009903256,0.99032557,1.0099034,3.589093,-6.1247873,-243.40413,-307.77313,0.9387083,-1.3462713,54.624985,730000
|
| 88 |
+
1.0,1.0,0.009551233,0.9551233,1.0095513,2.6431885,-3.235449,-238.36406,-307.49545,0.842038,-0.71996826,35.77782,735000
|
| 89 |
+
1.0,1.0,0.009458975,0.9458975,1.009459,2.7324343,-1.1407855,-237.28027,-307.52255,0.4667683,-0.41225672,33.71316,740000
|
| 90 |
+
1.0,1.0,0.009987749,0.99877495,1.0099877,4.952407,1.262779,-232.95825,-307.8991,0.7059569,-1.527515,55.418327,745000
|
| 91 |
+
1.0,1.0000001,0.009547141,0.95471406,1.0095472,3.0161066,-1.5366853,-239.37564,-307.27112,1.3902466,-1.0244315,43.57731,750000
|
| 92 |
+
1.0,1.0,0.00890668,0.8906681,1.0089067,2.9437907,-2.8316295,-242.29932,-308.97043,0.8471869,-0.5724305,38.34799,755000
|
| 93 |
+
1.0,1.0,0.009747673,0.9747673,1.0097476,3.4154365,-0.050124794,-229.42598,-306.87198,1.6249788,-1.6564052,46.733418,760000
|
| 94 |
+
1.0,1.0,0.009048451,0.9048451,1.0090485,3.7148812,-2.5049996,-235.74132,-307.04254,1.8739394,-0.5578582,42.463676,765000
|
| 95 |
+
1.0,0.99999994,0.0089579,0.8957901,1.0089579,3.436948,-3.1817245,-239.8147,-307.74954,0.8160521,-0.73104066,46.573883,770000
|
| 96 |
+
1.0,1.0,0.009433816,0.94338167,1.0094339,2.8478096,-3.2269096,-235.25198,-307.84012,0.79513824,-0.40423095,40.35383,775000
|
| 97 |
+
1.0,1.0,0.009460151,0.9460151,1.0094602,3.0416298,-0.68303764,-247.26407,-307.47238,0.5960729,-0.6934618,38.188835,780000
|
| 98 |
+
1.0,0.99999994,0.008602859,0.860286,1.0086029,2.8764222,-4.839858,-245.70596,-307.37,0.8399459,-1.1304666,41.669174,785000
|
| 99 |
+
1.0,1.0,0.010084756,1.0084755,1.0100847,3.614376,0.23395225,-234.41113,-307.33347,1.0512754,-0.70257217,45.65798,790000
|
| 100 |
+
1.0,1.0,0.009170068,0.91700685,1.00917,2.7953625,-0.33901995,-233.82935,-307.3443,0.6757382,-0.70509124,33.448433,795000
|
| 101 |
+
1.0,1.0,0.008968448,0.89684486,1.0089685,2.3449218,-5.3463917,-242.90019,-307.5466,0.39603162,-0.5807388,30.336462,800000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0,0.00785593,0.7855931,1.0078559,4.702727,-117.951675,-277.43326,-308.47235,2.4461327,-1.2623036,73.72482,305000
|
| 3 |
+
1.0,1.0,0.008356346,0.8356347,1.0083563,3.0130782,-144.87886,-275.0844,-308.0339,0.5202177,-0.5235604,39.834656,310000
|
| 4 |
+
1.0,1.0,0.008402732,0.84027326,1.0084027,3.9131355,-110.53178,-270.7399,-309.8808,0.6785216,-0.4559435,54.76413,315000
|
| 5 |
+
1.0,1.0000001,0.008296741,0.8296742,1.0082968,3.4446914,-181.69012,-276.91116,-308.32666,0.54522634,-0.7216768,43.61008,320000
|
| 6 |
+
1.0,1.0,0.009025304,0.9025304,1.0090253,2.4588673,-106.25509,-276.1235,-308.50208,0.7244345,-0.32419902,35.097923,325000
|
| 7 |
+
1.0,1.0,0.0077135325,0.7713533,1.0077136,2.6787655,1.7600244,-275.22263,-308.09073,0.73953855,-0.760645,48.06979,330000
|
| 8 |
+
1.0,1.0,0.008454563,0.84545624,1.0084546,2.7475092,-105.449844,-278.58054,-309.9474,0.37052786,-0.5322874,38.241196,335000
|
| 9 |
+
1.0,0.99999994,0.008246486,0.8246486,1.0082464,3.120067,-100.266945,-275.2226,-309.602,0.40093112,-0.42960668,42.21204,340000
|
| 10 |
+
1.0,1.0,0.007723704,0.7723704,1.0077237,2.7239673,-101.18325,-276.57495,-308.72186,0.4877918,-0.60518676,38.10908,345000
|
| 11 |
+
1.0,1.0,0.007833427,0.7833428,1.0078335,2.8081405,-57.556915,-274.38205,-309.32922,0.7012021,-0.7899197,41.1869,350000
|
| 12 |
+
1.0,1.0,0.0075464062,0.75464064,1.0075464,2.6121807,-50.866753,-272.57544,-308.04034,0.4528672,-0.39407653,36.035812,355000
|
| 13 |
+
1.0,1.0,0.008711021,0.87110215,1.008711,2.9785614,-101.64322,-273.36935,-308.8308,0.36039454,-0.38567796,43.14878,360000
|
| 14 |
+
1.0,1.0,0.008991418,0.8991418,1.0089914,3.170436,-97.23434,-274.2341,-308.64233,0.6809511,-0.8693867,49.855453,365000
|
| 15 |
+
1.0,1.0,0.008614775,0.8614775,1.0086148,3.0229006,-16.063234,-267.24805,-308.01517,0.47216213,-0.39800018,38.18885,370000
|
| 16 |
+
1.0,1.0,0.008453641,0.8453641,1.0084536,3.4975793,-27.16941,-265.1312,-309.29816,4.2453666,-3.4748027,96.386765,375000
|
| 17 |
+
1.0,1.0,0.008816572,0.88165724,1.0088166,3.0952375,-89.88906,-267.72714,-307.62,0.56103116,-0.83132625,46.345787,380000
|
| 18 |
+
1.0,1.0,0.008921676,0.8921676,1.0089216,4.185446,-16.129288,-267.83344,-308.3797,0.658519,-0.6012849,53.02057,385000
|
| 19 |
+
1.0,0.99999994,0.008851864,0.88518643,1.0088518,2.9359376,-39.643433,-269.0025,-309.5515,0.4565323,-0.63322306,42.416374,390000
|
| 20 |
+
1.0,1.0,0.0091171935,0.91171944,1.0091172,2.9902508,-66.7269,-270.47345,-308.28265,0.3133789,-0.5125977,37.49151,395000
|
| 21 |
+
1.0,1.0,0.0079643065,0.7964306,1.0079643,3.4428918,-73.73259,-266.85696,-309.37723,0.8988309,-0.7043295,49.05326,400000
|
| 22 |
+
1.0,0.9999999,0.007886119,0.788612,1.007886,2.419428,-63.72022,-271.0032,-308.00168,0.43775457,-0.4580328,33.955868,405000
|
| 23 |
+
1.0,0.99999994,0.009078741,0.9078742,1.0090787,3.3152223,-33.234524,-271.93707,-308.04703,0.55414355,-0.64743036,42.39855,410000
|
| 24 |
+
1.0,0.99999994,0.008100722,0.81007224,1.0081006,3.543015,-17.628792,-265.05313,-308.26077,7.6353817,-8.643481,126.734146,415000
|
| 25 |
+
1.0,1.0,0.008181304,0.8181304,1.0081813,3.4564216,-40.191982,-263.79395,-308.077,0.8363586,-1.0858083,54.619514,420000
|
| 26 |
+
1.0,0.9999999,0.0079464,0.79463995,1.0079463,4.2154627,-5.482759,-270.74368,-308.87296,1.3652726,-1.1924601,72.653046,425000
|
| 27 |
+
1.0,1.0,0.008490477,0.84904766,1.0084904,3.2752922,-19.900806,-267.24738,-307.48126,0.9963584,-1.2265433,52.226692,430000
|
| 28 |
+
1.0,1.0,0.008225711,0.82257116,1.0082257,3.0927575,-29.382977,-266.71567,-308.47382,0.82282364,-0.46754977,41.39809,435000
|
| 29 |
+
1.0,1.0,0.008814504,0.8814504,1.0088145,3.1262653,-21.634598,-263.4785,-308.279,0.64281553,-0.60786945,44.1144,440000
|
| 30 |
+
1.0,0.9999999,0.009098262,0.90982616,1.0090982,3.2471406,-23.268078,-260.32022,-308.55524,0.7138075,-0.92641366,45.11567,445000
|
| 31 |
+
1.0,1.0,0.008174076,0.8174076,1.0081741,3.2823417,-31.918728,-264.49167,-308.54147,0.36804387,-0.53015107,41.314804,450000
|
| 32 |
+
1.0,1.0000001,0.008430123,0.84301233,1.0084302,2.8414676,-12.521734,-263.05722,-308.04565,0.49321267,-0.42278036,38.37408,455000
|
| 33 |
+
1.0,1.0,0.007996617,0.79966164,1.0079966,4.2213907,-15.178493,-257.82504,-307.44577,0.58802056,-0.8274279,53.648766,460000
|
| 34 |
+
1.0,0.9999999,0.009291027,0.9291027,1.0092909,3.8576562,-29.980982,-260.14468,-307.8513,0.6671751,-0.6901789,49.336143,465000
|
| 35 |
+
1.0,1.0,0.010190487,1.0190487,1.0101905,5.3030143,-33.790195,-259.3618,-307.84186,3.9271052,-4.644583,133.31926,470000
|
| 36 |
+
1.0,0.99999994,0.0088913385,0.88913393,1.0088912,2.759516,-22.699883,-260.6229,-307.7081,1.140947,-1.235324,46.245575,475000
|
| 37 |
+
1.0,1.0,0.010065379,1.0065379,1.0100654,3.79588,-18.596523,-257.60657,-307.79462,0.53756654,-0.66322017,49.01293,480000
|
| 38 |
+
1.0,1.0,0.008916997,0.89169973,1.008917,3.3668308,-12.396543,-253.7563,-307.43643,0.80684745,-1.0061558,49.43993,485000
|
| 39 |
+
1.0,1.0000001,0.008659607,0.8659607,1.0086597,3.2869918,-8.342705,-256.95377,-307.978,0.5285134,-0.70570505,41.65285,490000
|
| 40 |
+
1.0,1.0,0.008686377,0.8686377,1.0086864,2.7866414,-14.470641,-262.3191,-307.38303,0.41415468,-0.6785805,38.636494,495000
|
| 41 |
+
1.0,1.0000001,0.01015677,1.015677,1.0101569,3.101947,-12.437152,-254.71806,-309.06583,0.80873364,-0.5659415,38.87712,500000
|
| 42 |
+
1.0,1.0,0.010326498,1.0326499,1.0103265,5.087914,-6.4758415,-252.82393,-307.65274,1.1039551,-1.3740246,71.79954,505000
|
| 43 |
+
1.0,1.0,0.009073533,0.9073532,1.0090735,3.3254478,-10.679778,-257.78494,-308.61325,0.977865,-0.7173711,46.933662,510000
|
| 44 |
+
1.0,0.99999994,0.0094210245,0.94210243,1.009421,3.3178048,-8.799489,-252.21207,-309.67346,0.6801572,-0.45887184,42.902603,515000
|
| 45 |
+
1.0,0.99999994,0.009526489,0.9526489,1.0095264,3.9016912,-15.923454,-258.89044,-307.83267,0.6373737,-0.6349619,49.257244,520000
|
| 46 |
+
1.0,1.0,0.008543294,0.85432947,1.0085433,3.3495736,-3.0127976,-258.78635,-309.60968,0.9985571,-0.5816699,44.12215,525000
|
| 47 |
+
1.0,0.9999999,0.008479835,0.8479836,1.0084797,4.374055,-2.3834414,-259.83292,-306.89746,0.71525615,-0.78255314,52.708755,530000
|
| 48 |
+
1.0,1.0,0.009523101,0.9523101,1.0095232,3.1473794,-12.465159,-256.7303,-307.30618,0.6289184,-0.42370695,41.44025,535000
|
| 49 |
+
1.0,0.99999994,0.009056784,0.9056784,1.0090567,5.0916553,-13.668211,-258.8898,-307.70306,1.1565529,-1.194078,71.96095,540000
|
| 50 |
+
1.0,1.0,0.008975025,0.89750254,1.008975,3.0393894,-3.0611427,-250.32524,-308.40964,1.387765,-0.8497225,45.549088,545000
|
| 51 |
+
1.0,1.0,0.008721847,0.8721847,1.0087218,3.4251516,-10.170684,-263.94022,-309.6008,0.5910192,-0.48101568,41.645576,550000
|
| 52 |
+
1.0,1.0,0.008025066,0.8025066,1.008025,4.4145164,-6.2212877,-253.52132,-307.66052,1.4652073,-0.81934136,52.170425,555000
|
| 53 |
+
1.0,1.0,0.008100238,0.81002384,1.0081003,4.1577706,-4.347078,-254.4943,-308.83627,1.0665087,-0.8480296,52.697483,560000
|
| 54 |
+
1.0,0.99999994,0.008869037,0.88690364,1.0088689,2.93138,-5.4848995,-254.11546,-307.7971,0.92098737,-0.9755837,50.523834,565000
|
| 55 |
+
1.0,0.99999994,0.008595247,0.85952467,1.0085952,3.5953834,-3.5627196,-258.65097,-308.24323,0.5893711,-0.9080859,47.654602,570000
|
| 56 |
+
1.0,1.0000001,0.009083425,0.9083425,1.0090835,3.6636512,-9.965988,-250.88379,-308.1318,0.8959178,-2.2244518,54.25733,575000
|
| 57 |
+
1.0,1.0,0.009250335,0.92503357,1.0092503,3.891436,-5.3719835,-249.48462,-307.43576,0.55107033,-0.6562445,47.463085,580000
|
| 58 |
+
1.0,1.0,0.008368658,0.83686584,1.0083686,3.4764752,-3.1309905,-257.39532,-308.5103,1.643563,-0.81552106,42.80628,585000
|
| 59 |
+
1.0,1.0,0.009151539,0.9151539,1.0091516,3.2299173,-12.838133,-249.62373,-308.4405,0.9740074,-1.1616461,53.439884,590000
|
| 60 |
+
1.0,1.0,0.009351702,0.93517023,1.0093517,2.5728707,-8.773279,-255.62315,-308.61395,0.5249576,-0.48927724,36.920155,595000
|
| 61 |
+
1.0,1.0000001,0.009864879,0.98648787,1.009865,2.658858,-2.8194811,-249.51476,-307.447,0.36746243,-0.64136994,32.620094,600000
|
| 62 |
+
1.0,1.0000001,0.008525873,0.8525873,1.008526,3.2646272,-4.5251184,-249.31438,-308.9289,1.1814493,-0.9229969,48.301746,605000
|
| 63 |
+
1.0,1.0,0.009636126,0.9636127,1.0096362,4.4293833,-4.409541,-247.40239,-308.47736,0.81613696,-1.297333,51.435883,610000
|
| 64 |
+
1.0,1.0,0.010194886,1.0194886,1.0101949,4.3336535,-1.7642816,-243.85562,-308.47452,0.84476274,-1.310475,62.825043,615000
|
| 65 |
+
1.0,1.0,0.009248164,0.9248163,1.0092481,3.3315415,-2.7860012,-236.03496,-307.24783,0.7335463,-0.51876193,38.94253,620000
|
| 66 |
+
1.0,1.0000001,0.009072296,0.90722966,1.0090724,3.1952102,-4.4206877,-252.76323,-308.33444,0.59968454,-0.74100405,43.33814,625000
|
| 67 |
+
1.0,1.0,0.010183897,1.0183896,1.0101839,5.562764,-3.7290096,-245.48315,-307.17014,0.92904377,-0.7738714,48.86163,630000
|
| 68 |
+
1.0,0.99999994,0.008801086,0.8801086,1.008801,3.7996926,-3.2540002,-244.81157,-308.8446,0.56598777,-1.0225701,54.57209,635000
|
| 69 |
+
1.0,0.9999999,0.009801201,0.9801201,1.009801,2.6049469,-5.0259666,-255.13525,-307.1581,0.3677331,-0.84278506,33.17868,640000
|
| 70 |
+
1.0,1.0,0.008967355,0.8967355,1.0089674,2.958796,-4.086124,-254.85425,-308.9256,1.44717,-0.76133347,48.89281,645000
|
| 71 |
+
1.0,1.0,0.009939823,0.9939823,1.0099398,3.1035047,-4.604482,-243.80937,-307.79144,0.6121385,-1.500116,45.66456,650000
|
| 72 |
+
1.0,1.0,0.009191365,0.9191365,1.0091914,2.6049368,-6.5639057,-248.92174,-306.95813,0.49030876,-0.829157,36.30104,655000
|
| 73 |
+
1.0,1.0,0.009631756,0.96317565,1.0096318,9.944594,-5.3428235,-247.44678,-307.37555,3.446837,-4.9693146,157.95544,660000
|
| 74 |
+
1.0,0.9999999,0.008536801,0.8536801,1.0085367,2.5057862,-6.36908,-251.19742,-308.04843,1.3449281,-0.43434024,34.566406,665000
|
| 75 |
+
1.0,1.0,0.009419918,0.9419918,1.0094199,3.5329025,-1.35811,-239.11226,-307.78195,2.120259,-0.916797,58.930847,670000
|
| 76 |
+
1.0,1.0,0.008477688,0.8477688,1.0084777,2.6519277,-5.2959614,-250.52122,-307.88333,0.5841159,-0.38301232,33.531662,675000
|
| 77 |
+
1.0,0.99999994,0.008195851,0.8195851,1.0081958,2.6619713,0.12420201,-248.07994,-307.18442,0.44843492,-1.0610954,36.460793,680000
|
| 78 |
+
1.0,1.0,0.00884612,0.88461196,1.0088462,4.7210693,-4.407738,-246.19505,-307.7681,0.8080863,-0.48033643,47.94139,685000
|
| 79 |
+
1.0,1.0000001,0.01025916,1.025916,1.0102593,3.4668312,-5.8578825,-240.92847,-307.35205,1.3070061,-1.1277702,44.765373,690000
|
| 80 |
+
1.0,1.0,0.00916224,0.9162241,1.0091622,2.9837897,-2.926696,-245.40157,-307.8804,0.86676013,-1.1294924,44.55094,695000
|
| 81 |
+
1.0,1.0,0.009536259,0.9536259,1.0095363,2.8661785,-5.543932,-243.45445,-307.8719,0.55518365,-0.48128554,36.56855,700000
|
| 82 |
+
1.0,1.0,0.00921509,0.921509,1.0092151,2.440123,-5.0327907,-245.3908,-306.93027,0.7779575,-0.24579504,31.579025,705000
|
| 83 |
+
1.0,1.0,0.008812979,0.88129795,1.008813,5.238676,1.278112,-246.36375,-307.549,1.8078866,-1.817775,73.88407,710000
|
| 84 |
+
1.0,1.0,0.009854284,0.9854285,1.0098543,2.5699766,-4.267187,-235.84293,-307.82907,0.5441705,-0.6731831,38.490746,715000
|
| 85 |
+
1.0,1.0,0.008964989,0.896499,1.008965,3.1504152,-3.2432752,-243.40747,-308.3661,0.70773095,-0.7078953,39.844795,720000
|
| 86 |
+
1.0,1.0000001,0.00876451,0.876451,1.0087646,2.7766702,-2.2141962,-246.8872,-307.29294,0.38993728,-0.434227,33.7341,725000
|
| 87 |
+
1.0,1.0000001,0.009903256,0.99032557,1.0099034,3.589093,-6.1247873,-243.40413,-307.77313,0.9387083,-1.3462713,54.624985,730000
|
| 88 |
+
1.0,1.0,0.009551233,0.9551233,1.0095513,2.6431885,-3.235449,-238.36406,-307.49545,0.842038,-0.71996826,35.77782,735000
|
| 89 |
+
1.0,1.0,0.009458975,0.9458975,1.009459,2.7324343,-1.1407855,-237.28027,-307.52255,0.4667683,-0.41225672,33.71316,740000
|
| 90 |
+
1.0,1.0,0.009987749,0.99877495,1.0099877,4.952407,1.262779,-232.95825,-307.8991,0.7059569,-1.527515,55.418327,745000
|
| 91 |
+
1.0,1.0000001,0.009547141,0.95471406,1.0095472,3.0161066,-1.5366853,-239.37564,-307.27112,1.3902466,-1.0244315,43.57731,750000
|
| 92 |
+
1.0,1.0,0.00890668,0.8906681,1.0089067,2.9437907,-2.8316295,-242.29932,-308.97043,0.8471869,-0.5724305,38.34799,755000
|
| 93 |
+
1.0,1.0,0.009747673,0.9747673,1.0097476,3.4154365,-0.050124794,-229.42598,-306.87198,1.6249788,-1.6564052,46.733418,760000
|
| 94 |
+
1.0,1.0,0.009048451,0.9048451,1.0090485,3.7148812,-2.5049996,-235.74132,-307.04254,1.8739394,-0.5578582,42.463676,765000
|
| 95 |
+
1.0,0.99999994,0.0089579,0.8957901,1.0089579,3.436948,-3.1817245,-239.8147,-307.74954,0.8160521,-0.73104066,46.573883,770000
|
| 96 |
+
1.0,1.0,0.009433816,0.94338167,1.0094339,2.8478096,-3.2269096,-235.25198,-307.84012,0.79513824,-0.40423095,40.35383,775000
|
| 97 |
+
1.0,1.0,0.009460151,0.9460151,1.0094602,3.0416298,-0.68303764,-247.26407,-307.47238,0.5960729,-0.6934618,38.188835,780000
|
| 98 |
+
1.0,0.99999994,0.008602859,0.860286,1.0086029,2.8764222,-4.839858,-245.70596,-307.37,0.8399459,-1.1304666,41.669174,785000
|
| 99 |
+
1.0,1.0,0.010084756,1.0084755,1.0100847,3.614376,0.23395225,-234.41113,-307.33347,1.0512754,-0.70257217,45.65798,790000
|
| 100 |
+
1.0,1.0,0.009170068,0.91700685,1.00917,2.7953625,-0.33901995,-233.82935,-307.3443,0.6757382,-0.70509124,33.448433,795000
|
| 101 |
+
1.0,1.0,0.008968448,0.89684486,1.0089685,2.3449218,-5.3463917,-242.90019,-307.5466,0.39603162,-0.5807388,30.336462,800000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5c2a168e68ec062e7d90d86a7f8dabd17914f77b9543e071fd3be688b886701
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:221e7e9977376fa1cb43d5b326d985443f97eeb344821f209091b07e1774ba28
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:52aa7a50ae359243dc37c919eb080fcff01921edf0330b3d7d4b724b3847bb79
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:058dc994ad36f6bb17f21fe017b4c9f86b54522da942d4a13391207d998c17e2
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ad6519810cdcda194294f9f48e4df9a5db90826df7df03b222b30e7e110ad92
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:809515a81b9eb8f90bf49e52967946dbbec051f7ab9edbfea92a60720ffb48a3
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2c94a4861289515af2a51e8f157a4263edeb9048256ab8286af48a1b9fc16a07
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5217430f64ebe722270aaf28286270be7c9ae57892d28b7ba226e3b67f716ba
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8e7618da79030d2b5271491c3602140c34c1ed89fdd4ee0fc0769c42a68b670
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:073683a6a7f995e405d418e1e782de6b18b586ceddf5b7e1dd700997cac24cfb
|
| 3 |
+
size 218872466
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260325_133502/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/zpszsv3y
|