Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1150000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1200000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1250000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1300000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1350000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1400000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1450000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1500000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.0038587789337467568,0.014819595601737888,-0.0029632380780788927,0.008845929003434007,30.221097771915936,9.07399999999924,0.84,4360.2,-0.26,-282.34,179.48,0.546796464920044,1050000
|
| 3 |
+
0.0,0.0,-0.02385421830361252,0.025259361473578722,-0.021453336751532433,0.006385029035338985,30.45677902271803,5.717999999999627,0.94,12333.14,-0.1,-171.56,112.36,0.35362154960632325,1100000
|
| 4 |
+
0.0,0.0,-0.012742254204436436,0.04748483813892522,-0.010268683655527909,0.031803083055602775,30.795672687394212,5.347999999999594,0.92,17835.1,-0.12,-154.3,104.96,0.32850610733032226,1150000
|
| 5 |
+
0.0,0.0,-0.031367916350784196,0.047251126056869056,-0.028117197032024945,0.03755514832707488,34.23284221143241,5.179999999999683,0.92,24244.86,-0.14,-162.9,101.6,0.31889729499816893,1200000
|
| 6 |
+
0.0,0.0,-0.024181376944138338,0.04774656734022301,-0.021069660984916996,0.04462270076562636,34.438974218602155,4.503999999999696,0.94,28674.54,-0.08,-123.86,88.08,0.27795729160308835,1250000
|
| 7 |
+
0.0,0.0,-0.014701514993216236,0.05712006890533633,-0.011842252788579137,0.05129530266285756,34.5149284736229,4.3879999999997095,0.94,32753.22,-0.08,-124.12,85.76,0.2695520973205566,1300000
|
| 8 |
+
0.0,0.0,-0.03002899812015002,0.05816240318589313,-0.026774567260521086,0.0554468892850628,34.995597929929886,2.680999999999926,1.0,36625.82,0.0,-74.32,51.62,0.1730452585220337,1350000
|
| 9 |
+
0.0,0.0,-0.03139422500593572,0.047722689469622596,-0.028529422980579894,0.03727744536004617,34.26645769998402,3.580999999999807,0.96,39856.6,-0.04,-98.2,69.62,0.2287040376663208,1400000
|
| 10 |
+
0.0,0.0,-0.02291151372915357,0.03523618844942553,-0.019326665232914566,0.0487144426679734,34.86022394526794,2.855999999999907,1.0,42930.4,0.0,-83.36,55.12,0.18379430770874022,1450000
|
| 11 |
+
0.0,0.0,-0.05778155953376586,0.058333553520526514,-0.05360269994542461,0.058413165631075355,33.505108783280335,3.3529999999998323,0.96,46051.38,-0.06,-97.36,65.06,0.20875516891479493,1500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.0038587789337467568,0.014819595601737888,-0.0029632380780788927,0.008845929003434007,30.221097771915936,9.07399999999924,0.84,4360.2,-0.26,-282.34,179.48,0.546796464920044,1050000
|
| 3 |
+
0.0,0.0,-0.02385421830361252,0.025259361473578722,-0.021453336751532433,0.006385029035338985,30.45677902271803,5.717999999999627,0.94,12333.14,-0.1,-171.56,112.36,0.35362154960632325,1100000
|
| 4 |
+
0.0,0.0,-0.012742254204436436,0.04748483813892522,-0.010268683655527909,0.031803083055602775,30.795672687394212,5.347999999999594,0.92,17835.1,-0.12,-154.3,104.96,0.32850610733032226,1150000
|
| 5 |
+
0.0,0.0,-0.031367916350784196,0.047251126056869056,-0.028117197032024945,0.03755514832707488,34.23284221143241,5.179999999999683,0.92,24244.86,-0.14,-162.9,101.6,0.31889729499816893,1200000
|
| 6 |
+
0.0,0.0,-0.024181376944138338,0.04774656734022301,-0.021069660984916996,0.04462270076562636,34.438974218602155,4.503999999999696,0.94,28674.54,-0.08,-123.86,88.08,0.27795729160308835,1250000
|
| 7 |
+
0.0,0.0,-0.014701514993216236,0.05712006890533633,-0.011842252788579137,0.05129530266285756,34.5149284736229,4.3879999999997095,0.94,32753.22,-0.08,-124.12,85.76,0.2695520973205566,1300000
|
| 8 |
+
0.0,0.0,-0.03002899812015002,0.05816240318589313,-0.026774567260521086,0.0554468892850628,34.995597929929886,2.680999999999926,1.0,36625.82,0.0,-74.32,51.62,0.1730452585220337,1350000
|
| 9 |
+
0.0,0.0,-0.03139422500593572,0.047722689469622596,-0.028529422980579894,0.03727744536004617,34.26645769998402,3.580999999999807,0.96,39856.6,-0.04,-98.2,69.62,0.2287040376663208,1400000
|
| 10 |
+
0.0,0.0,-0.02291151372915357,0.03523618844942553,-0.019326665232914566,0.0487144426679734,34.86022394526794,2.855999999999907,1.0,42930.4,0.0,-83.36,55.12,0.18379430770874022,1450000
|
| 11 |
+
0.0,0.0,-0.05778155953376586,0.058333553520526514,-0.05360269994542461,0.058413165631075355,33.505108783280335,3.3529999999998323,0.96,46051.38,-0.06,-97.36,65.06,0.20875516891479493,1500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0,0.023651967,2.3651967,1.023652,0.43836632,-26.368126,-106.14491,-188.58656,0.078554474,-0.17183231,7.12453,1005000
|
| 3 |
+
1.0,0.99999994,0.022768516,2.2768517,1.0227685,0.5737972,-17.686811,-106.22243,-179.38441,0.05551976,-0.11353974,6.2016263,1010000
|
| 4 |
+
1.0,1.0,0.020188726,2.0188727,1.0201887,0.6754975,-26.391823,-110.39007,-183.42769,0.08095614,-0.1552536,9.204514,1015000
|
| 5 |
+
1.0,1.0,0.020509992,2.0509992,1.02051,1.1724981,-16.82068,-111.49275,-196.48622,0.10217324,-0.11814135,10.522205,1020000
|
| 6 |
+
1.0,1.0,0.020538926,2.0538929,1.0205389,0.78178406,-38.923584,-111.373634,-193.50706,0.0944096,-0.15122707,10.399107,1025000
|
| 7 |
+
1.0,1.0,0.021316824,2.1316824,1.0213168,0.8429219,-31.613361,-108.88555,-200.84824,0.14418007,-0.269759,9.95328,1030000
|
| 8 |
+
1.0,0.9999999,0.022282084,2.2282085,1.022282,1.1098388,-27.463186,-109.462944,-187.43167,0.37627593,-0.51224524,23.995373,1035000
|
| 9 |
+
1.0,1.0,0.022627816,2.2627816,1.0226278,1.4064362,-5.5641685,-108.59688,-193.78392,0.6861374,-0.7192694,17.338226,1040000
|
| 10 |
+
1.0,1.0,0.022442397,2.2442396,1.0224423,1.0285304,-32.943203,-107.53513,-203.62256,0.15134369,-0.09798091,9.335012,1045000
|
| 11 |
+
1.0,0.99999994,0.025357526,2.5357528,1.0253575,1.5022174,-7.8266397,-104.56728,-184.62178,0.2267323,-0.180875,17.764101,1050000
|
| 12 |
+
1.0,0.99999994,0.025738478,2.5738478,1.0257385,1.831831,-13.224666,-100.8055,-183.92148,0.8890711,-0.8475282,33.739456,1055000
|
| 13 |
+
1.0,1.0000001,0.02572991,2.572991,1.02573,1.0990932,-6.117949,-97.88636,-195.34436,0.112531655,-0.2051138,11.291361,1060000
|
| 14 |
+
1.0,0.9999999,0.024527501,2.4527504,1.0245274,1.2782599,-9.886341,-97.40848,-196.7845,0.16389073,-0.15916944,14.116468,1065000
|
| 15 |
+
1.0,1.0,0.024961442,2.4961445,1.0249615,1.3742927,-6.7538733,-95.42881,-203.2796,0.27720144,-0.18057595,17.15875,1070000
|
| 16 |
+
1.0,0.99999994,0.025860969,2.586097,1.0258609,1.4446481,-16.03243,-99.74546,-200.15889,0.15135132,-0.17915747,14.006632,1075000
|
| 17 |
+
1.0,1.0,0.02545555,2.545555,1.0254556,1.1775972,-10.334783,-100.58115,-193.65416,0.19012639,-0.2356601,13.434515,1080000
|
| 18 |
+
1.0,1.0,0.025178447,2.517845,1.0251784,1.1239891,-12.125945,-100.12705,-195.60182,0.20398624,-0.12641856,11.663926,1085000
|
| 19 |
+
1.0,1.0,0.025841387,2.5841386,1.0258414,1.2125174,-18.085783,-97.45181,-193.2321,0.20604005,-0.09889553,11.785121,1090000
|
| 20 |
+
1.0,1.0,0.025831297,2.5831296,1.0258313,1.2539396,-19.239056,-99.06719,-199.6735,0.1752054,-0.13194342,13.974208,1095000
|
| 21 |
+
1.0,1.0,0.024493206,2.4493208,1.0244932,1.3166525,-3.852267,-93.09307,-197.47676,0.15908729,-0.28056324,16.203259,1100000
|
| 22 |
+
1.0,1.0,0.02603377,2.6033773,1.0260338,0.9023053,3.6312983,-95.62066,-186.03728,0.15599889,-0.14517993,10.489866,1105000
|
| 23 |
+
1.0,0.9999999,0.026317466,2.6317468,1.0263174,1.3880774,-0.94908804,-95.723076,-176.0935,0.41654253,-0.21097668,19.091097,1110000
|
| 24 |
+
1.0,0.9999496,0.025811639,2.581164,1.0257612,0.97436064,0.83790016,-90.8128,-164.93365,0.20369118,-0.18897378,11.778637,1115000
|
| 25 |
+
1.0,1.0,0.026311452,2.6311452,1.0263114,1.4754766,-1.0317684,-93.65905,-181.33908,0.20092544,-0.18979979,14.177969,1120000
|
| 26 |
+
1.0,0.99999994,0.026082888,2.6082888,1.0260829,1.1526183,0.82592106,-96.687065,-184.10838,0.16958016,-0.17807132,12.121864,1125000
|
| 27 |
+
1.0,1.0000001,0.025895495,2.5895495,1.0258956,1.0541912,-2.087263,-95.60661,-184.83557,0.24908677,-0.15258369,10.519295,1130000
|
| 28 |
+
1.0,0.99996984,0.027400322,2.7400324,1.0273702,1.1657863,2.7022593,-94.255775,-173.374,0.2373641,-0.4082457,15.683628,1135000
|
| 29 |
+
1.0,1.0,0.026964247,2.696425,1.0269642,1.8674748,-10.604765,-89.22976,-185.7776,0.24491817,-0.21801142,18.551052,1140000
|
| 30 |
+
1.0,1.0,0.028477134,2.8477135,1.0284772,1.1673087,-7.858329,-94.504295,-198.64137,0.3296125,-0.14319858,16.31474,1145000
|
| 31 |
+
1.0,0.99999994,0.025569879,2.5569878,1.0255698,0.91185474,-7.748625,-90.916595,-192.67741,0.21051905,-0.09050098,10.726854,1150000
|
| 32 |
+
1.0,1.0,0.025300058,2.530006,1.0253,1.0118703,-6.941567,-91.71848,-187.9503,0.32832915,-0.18532553,16.299252,1155000
|
| 33 |
+
1.0,0.9999999,0.0266676,2.6667602,1.0266675,1.2558072,-3.2313526,-95.048004,-194.65744,0.6712628,-0.60390747,22.845083,1160000
|
| 34 |
+
1.0,1.0,0.025637425,2.5637426,1.0256374,1.1381973,-2.3181424,-90.096725,-175.54868,0.19147371,-0.23931241,13.912151,1165000
|
| 35 |
+
1.0,1.0,0.027239127,2.7239127,1.0272391,1.7036841,-5.108044,-89.66248,-197.39926,0.39002725,-0.4564362,20.39904,1170000
|
| 36 |
+
1.0,1.0,0.027042244,2.7042246,1.0270423,1.3906244,-14.305172,-93.37961,-195.8596,0.48770887,-0.3121635,20.810692,1175000
|
| 37 |
+
1.0,0.99995565,0.026161108,2.6161108,1.0261167,1.1701674,2.0870216,-92.65749,-198.36607,0.3142498,-0.347053,14.459129,1180000
|
| 38 |
+
1.0,1.0000001,0.027041547,2.7041547,1.0270417,1.0547429,-8.039805,-87.88315,-170.23396,0.35264683,-0.2541278,17.238573,1185000
|
| 39 |
+
1.0,1.0,0.02514603,2.514603,1.025146,1.2256746,-5.5852065,-86.867676,-202.57928,0.3965174,-0.39228904,21.100105,1190000
|
| 40 |
+
1.0,1.0,0.026837619,2.683762,1.0268376,1.1914396,-5.43315,-90.01537,-198.50882,0.28604725,-0.3132456,17.499826,1195000
|
| 41 |
+
1.0,1.0,0.026201282,2.6201282,1.0262012,1.0259726,-1.0378729,-87.65226,-201.32045,0.13108411,-0.26076183,14.833001,1200000
|
| 42 |
+
1.0,0.99987745,0.02664186,2.664186,1.0265193,1.4344549,4.7467732,-85.95977,-180.33926,0.2300108,-0.29651526,20.044773,1205000
|
| 43 |
+
1.0,1.0,0.026362719,2.636272,1.0263628,1.020406,1.4722557,-89.92592,-181.57121,0.24565156,-0.21259093,14.004459,1210000
|
| 44 |
+
1.0,1.0,0.027305618,2.730562,1.0273056,1.7586371,-3.2519414,-88.84867,-194.57271,0.5218425,-0.49831912,23.807926,1215000
|
| 45 |
+
1.0,0.99999994,0.025851894,2.5851893,1.0258518,1.0645403,-2.888834,-87.71795,-195.34454,0.12058848,-0.19461676,11.76993,1220000
|
| 46 |
+
1.0,0.9999999,0.026371134,2.6371136,1.026371,1.019508,-3.601331,-85.40132,-186.98131,0.23087922,-0.10125613,13.151688,1225000
|
| 47 |
+
1.0,1.0,0.02784416,2.7844162,1.0278442,1.0235027,2.0173903,-89.67007,-178.58644,0.22521603,-0.16879313,12.546202,1230000
|
| 48 |
+
1.0,1.0,0.02607903,2.607903,1.026079,1.5001549,0.7757906,-88.193405,-181.31337,0.28608543,-0.29589313,17.49635,1235000
|
| 49 |
+
1.0,0.99996716,0.027934462,2.793446,1.0279016,1.3378435,2.4544842,-88.832756,-198.56067,0.58410454,-0.38215622,21.314653,1240000
|
| 50 |
+
1.0,1.0,0.027604254,2.7604256,1.0276042,1.9128859,0.4146422,-87.867584,-193.12108,0.38850608,-0.37053928,21.276764,1245000
|
| 51 |
+
1.0,1.0,0.02399158,2.399158,1.0239916,1.6600342,2.4435706,-82.71752,-197.63145,0.31425014,-0.31023052,20.465164,1250000
|
| 52 |
+
1.0,1.0,0.0267747,2.6774702,1.0267746,1.4438552,0.5149206,-88.67742,-191.54161,0.18132252,-0.16323915,14.662432,1255000
|
| 53 |
+
1.0,1.0,0.028046098,2.8046098,1.0280461,1.272148,1.6836951,-86.273315,-187.61697,0.20096105,-0.21390906,16.037645,1260000
|
| 54 |
+
1.0,1.0000001,0.027906075,2.7906077,1.0279062,1.5720943,-11.30769,-85.98105,-202.31781,0.35206765,-0.18847616,22.404488,1265000
|
| 55 |
+
1.0,0.99999994,0.027277492,2.7277493,1.0272775,0.9166452,-2.0318558,-85.726555,-168.1261,0.15281641,-0.21322533,11.507335,1270000
|
| 56 |
+
1.0,1.0,0.0261025,2.6102502,1.0261025,0.89469016,-3.6923351,-83.99993,-203.0235,0.19499275,-0.27774203,13.035761,1275000
|
| 57 |
+
1.0,1.0,0.02773192,2.7731924,1.0277319,1.1452267,0.25071502,-86.07572,-193.46059,0.19262584,-0.20233294,13.474594,1280000
|
| 58 |
+
1.0,1.0,0.026960082,2.6960082,1.0269601,2.5902753,4.20969,-82.55552,-173.17758,0.32678413,-0.33538252,23.11806,1285000
|
| 59 |
+
1.0,1.0,0.02703211,2.7032113,1.0270321,1.5670751,4.9415255,-79.747635,-198.13269,0.28995144,-0.3763908,19.937737,1290000
|
| 60 |
+
1.0,0.9999528,0.02659364,2.6593642,1.0265465,1.8049263,1.4144183,-83.63558,-183.70973,0.38617542,-0.46000865,31.155731,1295000
|
| 61 |
+
1.0,0.99999994,0.024900854,2.4900851,1.0249008,1.1072472,0.4431514,-82.3944,-176.77689,0.20549752,-0.26869226,16.557106,1300000
|
| 62 |
+
1.0,1.0,0.029001907,2.9001906,1.029002,1.3813347,-5.092573,-85.70498,-181.97186,0.4100741,-0.31643215,18.590206,1305000
|
| 63 |
+
1.0,1.0,0.029786937,2.9786937,1.029787,1.3746914,2.562056,-83.11715,-198.23666,0.16061918,-0.33767813,15.6843195,1310000
|
| 64 |
+
1.0,1.0,0.02554312,2.5543122,1.0255431,1.4382414,-3.0787768,-81.77313,-172.96217,0.19659612,-0.4278549,16.053299,1315000
|
| 65 |
+
1.0,1.0,0.028418373,2.8418372,1.0284184,1.6235787,-4.3738523,-82.8175,-172.52763,0.45399037,-0.46266133,28.023891,1320000
|
| 66 |
+
1.0,1.0000001,0.028948773,2.8948772,1.0289489,2.1350954,0.55748165,-84.60968,-190.25752,0.27681082,-0.19816737,18.809278,1325000
|
| 67 |
+
1.0,1.0,0.028060332,2.8060334,1.0280603,1.3950396,-2.884531,-82.01004,-164.92157,0.28448516,-0.21003535,19.639248,1330000
|
| 68 |
+
1.0,1.0000001,0.027015831,2.7015831,1.0270159,1.1863136,-6.035005,-80.61007,-202.72345,0.27774495,-0.25557846,15.055702,1335000
|
| 69 |
+
1.0,1.0,0.02937891,2.937891,1.0293789,1.0242108,-5.1361556,-80.82958,-178.50919,0.22407898,-0.41796985,16.029417,1340000
|
| 70 |
+
1.0,1.0,0.027782157,2.778216,1.0277822,0.9705187,-4.528643,-85.869545,-197.26315,0.25803316,-0.4924352,13.381568,1345000
|
| 71 |
+
1.0,1.0,0.027045915,2.7045915,1.027046,1.3532006,3.9235864,-79.8156,-188.73735,0.53437376,-0.2060205,18.244204,1350000
|
| 72 |
+
1.0,1.0,0.028092153,2.8092153,1.0280921,1.7306057,1.7731265,-81.19765,-175.88393,0.57109237,-0.24174672,23.358894,1355000
|
| 73 |
+
1.0,0.9999999,0.027472075,2.7472076,1.0274719,1.3518519,-0.7343054,-78.74987,-201.99739,0.17963146,-0.17288244,14.064979,1360000
|
| 74 |
+
1.0,1.0,0.02874221,2.8742213,1.0287422,1.071885,-3.5617146,-83.86052,-179.32172,0.13394174,-0.120032564,12.348149,1365000
|
| 75 |
+
1.0,1.0,0.02731184,2.731184,1.0273118,1.2776009,-0.7156879,-79.15613,-184.5462,0.16599311,-0.39764258,18.121666,1370000
|
| 76 |
+
1.0,1.0,0.028226485,2.8226485,1.0282265,1.337922,1.6439612,-79.404015,-203.05122,0.4942332,-0.35198438,20.240606,1375000
|
| 77 |
+
1.0,1.0,0.026114818,2.6114817,1.0261148,2.1087682,1.3346101,-80.58927,-166.66487,0.37479553,-0.14706933,15.014568,1380000
|
| 78 |
+
1.0,1.0,0.027063508,2.7063508,1.0270635,1.6871995,-1.8540345,-79.557045,-170.78682,0.9646955,-0.67752767,29.080046,1385000
|
| 79 |
+
1.0,1.0,0.029987238,2.998724,1.0299872,1.1114969,5.5271654,-83.27405,-183.4798,0.2167314,-0.18655077,13.363647,1390000
|
| 80 |
+
1.0,1.0,0.029171452,2.9171453,1.0291715,1.2276795,1.3710434,-82.05205,-170.38437,0.19235045,-0.25440884,15.03238,1395000
|
| 81 |
+
1.0,1.0,0.026374292,2.6374292,1.0263743,1.821022,-2.2898202,-77.01446,-162.7994,0.7237098,-0.74887407,26.379486,1400000
|
| 82 |
+
1.0,1.0,0.027619205,2.7619205,1.0276192,1.260196,-1.2097963,-80.08569,-181.87595,0.29714164,-0.3165536,18.772928,1405000
|
| 83 |
+
1.0,0.9999999,0.028622556,2.8622556,1.0286224,1.2201799,-2.0509253,-79.79119,-161.27295,0.14320761,-0.42216384,15.477751,1410000
|
| 84 |
+
1.0,0.9999999,0.026010161,2.601016,1.02601,1.3833599,-1.0891365,-82.62893,-170.42793,0.28998008,-0.74788594,17.568554,1415000
|
| 85 |
+
1.0,0.99998605,0.030049033,3.0049033,1.0300351,1.0171834,0.12989731,-79.30222,-170.2214,0.20998721,-0.21858339,14.458116,1420000
|
| 86 |
+
1.0,0.99999994,0.026165271,2.6165273,1.0261652,2.9441402,0.7366878,-77.384125,-202.59744,0.27796036,-0.28606215,28.628025,1425000
|
| 87 |
+
1.0,1.0,0.028756216,2.8756216,1.0287563,1.3111724,-2.8512492,-75.4912,-171.46056,0.2941572,-0.58879614,22.205349,1430000
|
| 88 |
+
1.0,0.9999999,0.030413568,3.041357,1.0304134,1.0679556,-0.5503577,-79.29983,-201.69894,0.23061213,-0.21627475,12.628849,1435000
|
| 89 |
+
1.0,0.99991685,0.028485868,2.848587,1.0284027,1.2437693,3.026593,-73.38411,-186.92796,0.24652752,-0.30339804,19.372904,1440000
|
| 90 |
+
1.0,1.0,0.02801417,2.8014169,1.0280142,1.3528433,-1.3937386,-80.48362,-166.03123,0.3062772,-0.3065651,16.92468,1445000
|
| 91 |
+
1.0,1.0,0.026732644,2.6732645,1.0267327,1.6842533,-0.6096046,-75.99794,-168.01506,0.4295409,-0.23703238,19.401783,1450000
|
| 92 |
+
1.0,1.0,0.028583195,2.8583198,1.0285832,1.3639402,-0.63113964,-77.72902,-177.15224,0.35535163,-0.180796,15.398751,1455000
|
| 93 |
+
1.0,1.0000001,0.026785258,2.6785257,1.0267854,2.699776,-1.8609384,-74.01296,-159.10812,0.58312464,-0.5235004,42.325848,1460000
|
| 94 |
+
1.0,1.0,0.02957328,2.9573278,1.0295733,1.1611458,-1.7448711,-76.606834,-162.88533,0.4608424,-0.3316999,16.378223,1465000
|
| 95 |
+
1.0,0.99999994,0.029587492,2.9587495,1.0295874,1.640572,-2.9813573,-74.34541,-144.37926,0.27586788,-0.45188528,20.377258,1470000
|
| 96 |
+
1.0,1.0,0.028601984,2.8601985,1.028602,1.3084935,0.03812857,-73.07995,-176.62192,0.23652133,-0.2940235,13.773493,1475000
|
| 97 |
+
1.0,1.0,0.030692618,3.069262,1.0306926,1.7254685,1.1169322,-74.15663,-155.55486,0.61705947,-0.5115822,27.781586,1480000
|
| 98 |
+
1.0,0.99999994,0.028925378,2.8925376,1.0289253,0.95634586,-5.449058,-73.91454,-197.68529,0.11393053,-0.27527383,13.641064,1485000
|
| 99 |
+
1.0,1.0,0.02843166,2.8431659,1.0284317,2.798063,-1.800198,-75.0144,-167.7738,0.71643215,-0.47580418,39.087997,1490000
|
| 100 |
+
1.0,0.9999999,0.026748627,2.6748629,1.0267485,2.5946472,0.74695534,-72.28324,-168.76535,0.76172864,-0.6570817,33.160202,1495000
|
| 101 |
+
1.0,1.0000001,0.029818503,2.9818506,1.0298187,1.1125789,2.4921021,-69.6694,-165.75235,0.1526338,-0.1587772,12.939063,1500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0,0.023651967,2.3651967,1.023652,0.43836632,-26.368126,-106.14491,-188.58656,0.078554474,-0.17183231,7.12453,1005000
|
| 3 |
+
1.0,0.99999994,0.022768516,2.2768517,1.0227685,0.5737972,-17.686811,-106.22243,-179.38441,0.05551976,-0.11353974,6.2016263,1010000
|
| 4 |
+
1.0,1.0,0.020188726,2.0188727,1.0201887,0.6754975,-26.391823,-110.39007,-183.42769,0.08095614,-0.1552536,9.204514,1015000
|
| 5 |
+
1.0,1.0,0.020509992,2.0509992,1.02051,1.1724981,-16.82068,-111.49275,-196.48622,0.10217324,-0.11814135,10.522205,1020000
|
| 6 |
+
1.0,1.0,0.020538926,2.0538929,1.0205389,0.78178406,-38.923584,-111.373634,-193.50706,0.0944096,-0.15122707,10.399107,1025000
|
| 7 |
+
1.0,1.0,0.021316824,2.1316824,1.0213168,0.8429219,-31.613361,-108.88555,-200.84824,0.14418007,-0.269759,9.95328,1030000
|
| 8 |
+
1.0,0.9999999,0.022282084,2.2282085,1.022282,1.1098388,-27.463186,-109.462944,-187.43167,0.37627593,-0.51224524,23.995373,1035000
|
| 9 |
+
1.0,1.0,0.022627816,2.2627816,1.0226278,1.4064362,-5.5641685,-108.59688,-193.78392,0.6861374,-0.7192694,17.338226,1040000
|
| 10 |
+
1.0,1.0,0.022442397,2.2442396,1.0224423,1.0285304,-32.943203,-107.53513,-203.62256,0.15134369,-0.09798091,9.335012,1045000
|
| 11 |
+
1.0,0.99999994,0.025357526,2.5357528,1.0253575,1.5022174,-7.8266397,-104.56728,-184.62178,0.2267323,-0.180875,17.764101,1050000
|
| 12 |
+
1.0,0.99999994,0.025738478,2.5738478,1.0257385,1.831831,-13.224666,-100.8055,-183.92148,0.8890711,-0.8475282,33.739456,1055000
|
| 13 |
+
1.0,1.0000001,0.02572991,2.572991,1.02573,1.0990932,-6.117949,-97.88636,-195.34436,0.112531655,-0.2051138,11.291361,1060000
|
| 14 |
+
1.0,0.9999999,0.024527501,2.4527504,1.0245274,1.2782599,-9.886341,-97.40848,-196.7845,0.16389073,-0.15916944,14.116468,1065000
|
| 15 |
+
1.0,1.0,0.024961442,2.4961445,1.0249615,1.3742927,-6.7538733,-95.42881,-203.2796,0.27720144,-0.18057595,17.15875,1070000
|
| 16 |
+
1.0,0.99999994,0.025860969,2.586097,1.0258609,1.4446481,-16.03243,-99.74546,-200.15889,0.15135132,-0.17915747,14.006632,1075000
|
| 17 |
+
1.0,1.0,0.02545555,2.545555,1.0254556,1.1775972,-10.334783,-100.58115,-193.65416,0.19012639,-0.2356601,13.434515,1080000
|
| 18 |
+
1.0,1.0,0.025178447,2.517845,1.0251784,1.1239891,-12.125945,-100.12705,-195.60182,0.20398624,-0.12641856,11.663926,1085000
|
| 19 |
+
1.0,1.0,0.025841387,2.5841386,1.0258414,1.2125174,-18.085783,-97.45181,-193.2321,0.20604005,-0.09889553,11.785121,1090000
|
| 20 |
+
1.0,1.0,0.025831297,2.5831296,1.0258313,1.2539396,-19.239056,-99.06719,-199.6735,0.1752054,-0.13194342,13.974208,1095000
|
| 21 |
+
1.0,1.0,0.024493206,2.4493208,1.0244932,1.3166525,-3.852267,-93.09307,-197.47676,0.15908729,-0.28056324,16.203259,1100000
|
| 22 |
+
1.0,1.0,0.02603377,2.6033773,1.0260338,0.9023053,3.6312983,-95.62066,-186.03728,0.15599889,-0.14517993,10.489866,1105000
|
| 23 |
+
1.0,0.9999999,0.026317466,2.6317468,1.0263174,1.3880774,-0.94908804,-95.723076,-176.0935,0.41654253,-0.21097668,19.091097,1110000
|
| 24 |
+
1.0,0.9999496,0.025811639,2.581164,1.0257612,0.97436064,0.83790016,-90.8128,-164.93365,0.20369118,-0.18897378,11.778637,1115000
|
| 25 |
+
1.0,1.0,0.026311452,2.6311452,1.0263114,1.4754766,-1.0317684,-93.65905,-181.33908,0.20092544,-0.18979979,14.177969,1120000
|
| 26 |
+
1.0,0.99999994,0.026082888,2.6082888,1.0260829,1.1526183,0.82592106,-96.687065,-184.10838,0.16958016,-0.17807132,12.121864,1125000
|
| 27 |
+
1.0,1.0000001,0.025895495,2.5895495,1.0258956,1.0541912,-2.087263,-95.60661,-184.83557,0.24908677,-0.15258369,10.519295,1130000
|
| 28 |
+
1.0,0.99996984,0.027400322,2.7400324,1.0273702,1.1657863,2.7022593,-94.255775,-173.374,0.2373641,-0.4082457,15.683628,1135000
|
| 29 |
+
1.0,1.0,0.026964247,2.696425,1.0269642,1.8674748,-10.604765,-89.22976,-185.7776,0.24491817,-0.21801142,18.551052,1140000
|
| 30 |
+
1.0,1.0,0.028477134,2.8477135,1.0284772,1.1673087,-7.858329,-94.504295,-198.64137,0.3296125,-0.14319858,16.31474,1145000
|
| 31 |
+
1.0,0.99999994,0.025569879,2.5569878,1.0255698,0.91185474,-7.748625,-90.916595,-192.67741,0.21051905,-0.09050098,10.726854,1150000
|
| 32 |
+
1.0,1.0,0.025300058,2.530006,1.0253,1.0118703,-6.941567,-91.71848,-187.9503,0.32832915,-0.18532553,16.299252,1155000
|
| 33 |
+
1.0,0.9999999,0.0266676,2.6667602,1.0266675,1.2558072,-3.2313526,-95.048004,-194.65744,0.6712628,-0.60390747,22.845083,1160000
|
| 34 |
+
1.0,1.0,0.025637425,2.5637426,1.0256374,1.1381973,-2.3181424,-90.096725,-175.54868,0.19147371,-0.23931241,13.912151,1165000
|
| 35 |
+
1.0,1.0,0.027239127,2.7239127,1.0272391,1.7036841,-5.108044,-89.66248,-197.39926,0.39002725,-0.4564362,20.39904,1170000
|
| 36 |
+
1.0,1.0,0.027042244,2.7042246,1.0270423,1.3906244,-14.305172,-93.37961,-195.8596,0.48770887,-0.3121635,20.810692,1175000
|
| 37 |
+
1.0,0.99995565,0.026161108,2.6161108,1.0261167,1.1701674,2.0870216,-92.65749,-198.36607,0.3142498,-0.347053,14.459129,1180000
|
| 38 |
+
1.0,1.0000001,0.027041547,2.7041547,1.0270417,1.0547429,-8.039805,-87.88315,-170.23396,0.35264683,-0.2541278,17.238573,1185000
|
| 39 |
+
1.0,1.0,0.02514603,2.514603,1.025146,1.2256746,-5.5852065,-86.867676,-202.57928,0.3965174,-0.39228904,21.100105,1190000
|
| 40 |
+
1.0,1.0,0.026837619,2.683762,1.0268376,1.1914396,-5.43315,-90.01537,-198.50882,0.28604725,-0.3132456,17.499826,1195000
|
| 41 |
+
1.0,1.0,0.026201282,2.6201282,1.0262012,1.0259726,-1.0378729,-87.65226,-201.32045,0.13108411,-0.26076183,14.833001,1200000
|
| 42 |
+
1.0,0.99987745,0.02664186,2.664186,1.0265193,1.4344549,4.7467732,-85.95977,-180.33926,0.2300108,-0.29651526,20.044773,1205000
|
| 43 |
+
1.0,1.0,0.026362719,2.636272,1.0263628,1.020406,1.4722557,-89.92592,-181.57121,0.24565156,-0.21259093,14.004459,1210000
|
| 44 |
+
1.0,1.0,0.027305618,2.730562,1.0273056,1.7586371,-3.2519414,-88.84867,-194.57271,0.5218425,-0.49831912,23.807926,1215000
|
| 45 |
+
1.0,0.99999994,0.025851894,2.5851893,1.0258518,1.0645403,-2.888834,-87.71795,-195.34454,0.12058848,-0.19461676,11.76993,1220000
|
| 46 |
+
1.0,0.9999999,0.026371134,2.6371136,1.026371,1.019508,-3.601331,-85.40132,-186.98131,0.23087922,-0.10125613,13.151688,1225000
|
| 47 |
+
1.0,1.0,0.02784416,2.7844162,1.0278442,1.0235027,2.0173903,-89.67007,-178.58644,0.22521603,-0.16879313,12.546202,1230000
|
| 48 |
+
1.0,1.0,0.02607903,2.607903,1.026079,1.5001549,0.7757906,-88.193405,-181.31337,0.28608543,-0.29589313,17.49635,1235000
|
| 49 |
+
1.0,0.99996716,0.027934462,2.793446,1.0279016,1.3378435,2.4544842,-88.832756,-198.56067,0.58410454,-0.38215622,21.314653,1240000
|
| 50 |
+
1.0,1.0,0.027604254,2.7604256,1.0276042,1.9128859,0.4146422,-87.867584,-193.12108,0.38850608,-0.37053928,21.276764,1245000
|
| 51 |
+
1.0,1.0,0.02399158,2.399158,1.0239916,1.6600342,2.4435706,-82.71752,-197.63145,0.31425014,-0.31023052,20.465164,1250000
|
| 52 |
+
1.0,1.0,0.0267747,2.6774702,1.0267746,1.4438552,0.5149206,-88.67742,-191.54161,0.18132252,-0.16323915,14.662432,1255000
|
| 53 |
+
1.0,1.0,0.028046098,2.8046098,1.0280461,1.272148,1.6836951,-86.273315,-187.61697,0.20096105,-0.21390906,16.037645,1260000
|
| 54 |
+
1.0,1.0000001,0.027906075,2.7906077,1.0279062,1.5720943,-11.30769,-85.98105,-202.31781,0.35206765,-0.18847616,22.404488,1265000
|
| 55 |
+
1.0,0.99999994,0.027277492,2.7277493,1.0272775,0.9166452,-2.0318558,-85.726555,-168.1261,0.15281641,-0.21322533,11.507335,1270000
|
| 56 |
+
1.0,1.0,0.0261025,2.6102502,1.0261025,0.89469016,-3.6923351,-83.99993,-203.0235,0.19499275,-0.27774203,13.035761,1275000
|
| 57 |
+
1.0,1.0,0.02773192,2.7731924,1.0277319,1.1452267,0.25071502,-86.07572,-193.46059,0.19262584,-0.20233294,13.474594,1280000
|
| 58 |
+
1.0,1.0,0.026960082,2.6960082,1.0269601,2.5902753,4.20969,-82.55552,-173.17758,0.32678413,-0.33538252,23.11806,1285000
|
| 59 |
+
1.0,1.0,0.02703211,2.7032113,1.0270321,1.5670751,4.9415255,-79.747635,-198.13269,0.28995144,-0.3763908,19.937737,1290000
|
| 60 |
+
1.0,0.9999528,0.02659364,2.6593642,1.0265465,1.8049263,1.4144183,-83.63558,-183.70973,0.38617542,-0.46000865,31.155731,1295000
|
| 61 |
+
1.0,0.99999994,0.024900854,2.4900851,1.0249008,1.1072472,0.4431514,-82.3944,-176.77689,0.20549752,-0.26869226,16.557106,1300000
|
| 62 |
+
1.0,1.0,0.029001907,2.9001906,1.029002,1.3813347,-5.092573,-85.70498,-181.97186,0.4100741,-0.31643215,18.590206,1305000
|
| 63 |
+
1.0,1.0,0.029786937,2.9786937,1.029787,1.3746914,2.562056,-83.11715,-198.23666,0.16061918,-0.33767813,15.6843195,1310000
|
| 64 |
+
1.0,1.0,0.02554312,2.5543122,1.0255431,1.4382414,-3.0787768,-81.77313,-172.96217,0.19659612,-0.4278549,16.053299,1315000
|
| 65 |
+
1.0,1.0,0.028418373,2.8418372,1.0284184,1.6235787,-4.3738523,-82.8175,-172.52763,0.45399037,-0.46266133,28.023891,1320000
|
| 66 |
+
1.0,1.0000001,0.028948773,2.8948772,1.0289489,2.1350954,0.55748165,-84.60968,-190.25752,0.27681082,-0.19816737,18.809278,1325000
|
| 67 |
+
1.0,1.0,0.028060332,2.8060334,1.0280603,1.3950396,-2.884531,-82.01004,-164.92157,0.28448516,-0.21003535,19.639248,1330000
|
| 68 |
+
1.0,1.0000001,0.027015831,2.7015831,1.0270159,1.1863136,-6.035005,-80.61007,-202.72345,0.27774495,-0.25557846,15.055702,1335000
|
| 69 |
+
1.0,1.0,0.02937891,2.937891,1.0293789,1.0242108,-5.1361556,-80.82958,-178.50919,0.22407898,-0.41796985,16.029417,1340000
|
| 70 |
+
1.0,1.0,0.027782157,2.778216,1.0277822,0.9705187,-4.528643,-85.869545,-197.26315,0.25803316,-0.4924352,13.381568,1345000
|
| 71 |
+
1.0,1.0,0.027045915,2.7045915,1.027046,1.3532006,3.9235864,-79.8156,-188.73735,0.53437376,-0.2060205,18.244204,1350000
|
| 72 |
+
1.0,1.0,0.028092153,2.8092153,1.0280921,1.7306057,1.7731265,-81.19765,-175.88393,0.57109237,-0.24174672,23.358894,1355000
|
| 73 |
+
1.0,0.9999999,0.027472075,2.7472076,1.0274719,1.3518519,-0.7343054,-78.74987,-201.99739,0.17963146,-0.17288244,14.064979,1360000
|
| 74 |
+
1.0,1.0,0.02874221,2.8742213,1.0287422,1.071885,-3.5617146,-83.86052,-179.32172,0.13394174,-0.120032564,12.348149,1365000
|
| 75 |
+
1.0,1.0,0.02731184,2.731184,1.0273118,1.2776009,-0.7156879,-79.15613,-184.5462,0.16599311,-0.39764258,18.121666,1370000
|
| 76 |
+
1.0,1.0,0.028226485,2.8226485,1.0282265,1.337922,1.6439612,-79.404015,-203.05122,0.4942332,-0.35198438,20.240606,1375000
|
| 77 |
+
1.0,1.0,0.026114818,2.6114817,1.0261148,2.1087682,1.3346101,-80.58927,-166.66487,0.37479553,-0.14706933,15.014568,1380000
|
| 78 |
+
1.0,1.0,0.027063508,2.7063508,1.0270635,1.6871995,-1.8540345,-79.557045,-170.78682,0.9646955,-0.67752767,29.080046,1385000
|
| 79 |
+
1.0,1.0,0.029987238,2.998724,1.0299872,1.1114969,5.5271654,-83.27405,-183.4798,0.2167314,-0.18655077,13.363647,1390000
|
| 80 |
+
1.0,1.0,0.029171452,2.9171453,1.0291715,1.2276795,1.3710434,-82.05205,-170.38437,0.19235045,-0.25440884,15.03238,1395000
|
| 81 |
+
1.0,1.0,0.026374292,2.6374292,1.0263743,1.821022,-2.2898202,-77.01446,-162.7994,0.7237098,-0.74887407,26.379486,1400000
|
| 82 |
+
1.0,1.0,0.027619205,2.7619205,1.0276192,1.260196,-1.2097963,-80.08569,-181.87595,0.29714164,-0.3165536,18.772928,1405000
|
| 83 |
+
1.0,0.9999999,0.028622556,2.8622556,1.0286224,1.2201799,-2.0509253,-79.79119,-161.27295,0.14320761,-0.42216384,15.477751,1410000
|
| 84 |
+
1.0,0.9999999,0.026010161,2.601016,1.02601,1.3833599,-1.0891365,-82.62893,-170.42793,0.28998008,-0.74788594,17.568554,1415000
|
| 85 |
+
1.0,0.99998605,0.030049033,3.0049033,1.0300351,1.0171834,0.12989731,-79.30222,-170.2214,0.20998721,-0.21858339,14.458116,1420000
|
| 86 |
+
1.0,0.99999994,0.026165271,2.6165273,1.0261652,2.9441402,0.7366878,-77.384125,-202.59744,0.27796036,-0.28606215,28.628025,1425000
|
| 87 |
+
1.0,1.0,0.028756216,2.8756216,1.0287563,1.3111724,-2.8512492,-75.4912,-171.46056,0.2941572,-0.58879614,22.205349,1430000
|
| 88 |
+
1.0,0.9999999,0.030413568,3.041357,1.0304134,1.0679556,-0.5503577,-79.29983,-201.69894,0.23061213,-0.21627475,12.628849,1435000
|
| 89 |
+
1.0,0.99991685,0.028485868,2.848587,1.0284027,1.2437693,3.026593,-73.38411,-186.92796,0.24652752,-0.30339804,19.372904,1440000
|
| 90 |
+
1.0,1.0,0.02801417,2.8014169,1.0280142,1.3528433,-1.3937386,-80.48362,-166.03123,0.3062772,-0.3065651,16.92468,1445000
|
| 91 |
+
1.0,1.0,0.026732644,2.6732645,1.0267327,1.6842533,-0.6096046,-75.99794,-168.01506,0.4295409,-0.23703238,19.401783,1450000
|
| 92 |
+
1.0,1.0,0.028583195,2.8583198,1.0285832,1.3639402,-0.63113964,-77.72902,-177.15224,0.35535163,-0.180796,15.398751,1455000
|
| 93 |
+
1.0,1.0000001,0.026785258,2.6785257,1.0267854,2.699776,-1.8609384,-74.01296,-159.10812,0.58312464,-0.5235004,42.325848,1460000
|
| 94 |
+
1.0,1.0,0.02957328,2.9573278,1.0295733,1.1611458,-1.7448711,-76.606834,-162.88533,0.4608424,-0.3316999,16.378223,1465000
|
| 95 |
+
1.0,0.99999994,0.029587492,2.9587495,1.0295874,1.640572,-2.9813573,-74.34541,-144.37926,0.27586788,-0.45188528,20.377258,1470000
|
| 96 |
+
1.0,1.0,0.028601984,2.8601985,1.028602,1.3084935,0.03812857,-73.07995,-176.62192,0.23652133,-0.2940235,13.773493,1475000
|
| 97 |
+
1.0,1.0,0.030692618,3.069262,1.0306926,1.7254685,1.1169322,-74.15663,-155.55486,0.61705947,-0.5115822,27.781586,1480000
|
| 98 |
+
1.0,0.99999994,0.028925378,2.8925376,1.0289253,0.95634586,-5.449058,-73.91454,-197.68529,0.11393053,-0.27527383,13.641064,1485000
|
| 99 |
+
1.0,1.0,0.02843166,2.8431659,1.0284317,2.798063,-1.800198,-75.0144,-167.7738,0.71643215,-0.47580418,39.087997,1490000
|
| 100 |
+
1.0,0.9999999,0.026748627,2.6748629,1.0267485,2.5946472,0.74695534,-72.28324,-168.76535,0.76172864,-0.6570817,33.160202,1495000
|
| 101 |
+
1.0,1.0000001,0.029818503,2.9818506,1.0298187,1.1125789,2.4921021,-69.6694,-165.75235,0.1526338,-0.1587772,12.939063,1500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d312d1d72b29dfca7f1209c75fd7442f76b62daea4f72884cf92bbea982d39de
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ec8ee0fe64944a2bd02a66b3293eac27e8ffb3fe8aec9cfe2f60e1db1625b81
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c031dedb9e7e33047b72b37815ef25675019c317ccec11bf953552f83537cfe
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93af12f74d4779dc5fabf81fc3337e82e77b40a62a2fa007b2dbd4074c6d6708
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c3323bcf27a8ff420dd0f0a80a2be2d04a07f1dd34a39678857b66d16e9b80d
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f8091b88c48d8201aa6d4afde3eec402368aaa8721e9048de9aa9e56b3b610f
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1e722bdc464b903a8bdb39be9c68189ffc0961127ae3d1923c0e910959f505e
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:356de7b68834fd0138c84e4859c8dceca88d7b6b5c9914af652d8f6f58521e76
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:586f52ab15798a50d25534ae141e46fdf14a446d6d8b9fdfe780ef5e7760db26
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/params_1500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:537cac2fe632d9bae45006157bea5c62fb2439cc8a7b19036e592bf84dc0a19c
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_205107/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/8urqpbo1
|