Tiredsheep commited on
Commit
1feff50
·
verified ·
1 Parent(s): 99a89da

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_150000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_200000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_250000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_300000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_350000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_400000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_450000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_500000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_550000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_600000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.008887333895063989,0.0019341213080858548,-0.008052675362670438,-0.0002973189080094523,32.20695315488001,8.647999999999172,0.8,3965.12,-0.26,-237.04,170.96,0.5355212593078613,150000
3
+ 0.0,0.0,-0.05873787161841812,0.03201241565932577,-0.05573603588185595,0.031988977005410604,34.290362693260406,7.369999999999401,0.84,12542.72,-0.26,-219.66,145.4,0.4454111385345459,200000
4
+ 0.0,0.0,-0.055926408545736675,0.045001778167284456,-0.05176161373550871,0.047913184433674295,35.68516637892293,3.4959999999998996,1.0,18072.98,0.0,-98.96,67.92,0.228868088722229,250000
5
+ 0.0,0.0,-0.06065155260536109,0.06000837654657149,-0.058297217247142014,0.038561353882192104,35.08742098642286,4.596999999999696,0.94,22259.98,-0.1,-140.6,89.94,0.2813494348526001,300000
6
+ 0.0,0.0,-0.05732338329909022,0.05218115564308199,-0.0542452936143115,0.057050443841860254,35.80527576140374,3.2809999999999153,1.0,26064.84,0.0,-96.46,63.62,0.21064093112945556,350000
7
+ 0.0,0.0,-0.0546704120611837,0.06760811128829024,-0.051571921869737615,0.05228165275377025,35.344781027351864,3.6559999999998003,0.96,29479.04,-0.04,-97.68,71.12,0.23343121528625488,400000
8
+ 0.0,0.0,-0.07038598392604734,0.06507287975281188,-0.06586337059885594,0.05671475185107329,35.78090820581776,3.039999999999952,1.0,32786.32,0.0,-83.42,58.8,0.1938487148284912,450000
9
+ 0.0,0.0,-0.06901409437138908,0.06723214817283439,-0.06454410710567676,0.06926228296505094,35.776869958166095,2.7069999999999323,1.0,35863.78,0.0,-78.34,52.14,0.17715529918670656,500000
10
+ 0.0,0.0,-0.06527669247978675,0.060693802837339904,-0.06066296473648594,0.0664032939404194,35.541443398510005,2.6979999999999382,1.0,38550.36,0.0,-76.06,51.96,0.17429033756256104,550000
11
+ 0.0,0.0,-0.06444719325873606,0.06714983720367658,-0.060744645468875424,0.057568265381749015,33.99262179142071,3.6879999999997866,0.94,41997.32,-0.08,-101.88,71.76,0.2275490427017212,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.008887333895063989,0.0019341213080858548,-0.008052675362670438,-0.0002973189080094523,32.20695315488001,8.647999999999172,0.8,3965.12,-0.26,-237.04,170.96,0.5355212593078613,150000
3
+ 0.0,0.0,-0.05873787161841812,0.03201241565932577,-0.05573603588185595,0.031988977005410604,34.290362693260406,7.369999999999401,0.84,12542.72,-0.26,-219.66,145.4,0.4454111385345459,200000
4
+ 0.0,0.0,-0.055926408545736675,0.045001778167284456,-0.05176161373550871,0.047913184433674295,35.68516637892293,3.4959999999998996,1.0,18072.98,0.0,-98.96,67.92,0.228868088722229,250000
5
+ 0.0,0.0,-0.06065155260536109,0.06000837654657149,-0.058297217247142014,0.038561353882192104,35.08742098642286,4.596999999999696,0.94,22259.98,-0.1,-140.6,89.94,0.2813494348526001,300000
6
+ 0.0,0.0,-0.05732338329909022,0.05218115564308199,-0.0542452936143115,0.057050443841860254,35.80527576140374,3.2809999999999153,1.0,26064.84,0.0,-96.46,63.62,0.21064093112945556,350000
7
+ 0.0,0.0,-0.0546704120611837,0.06760811128829024,-0.051571921869737615,0.05228165275377025,35.344781027351864,3.6559999999998003,0.96,29479.04,-0.04,-97.68,71.12,0.23343121528625488,400000
8
+ 0.0,0.0,-0.07038598392604734,0.06507287975281188,-0.06586337059885594,0.05671475185107329,35.78090820581776,3.039999999999952,1.0,32786.32,0.0,-83.42,58.8,0.1938487148284912,450000
9
+ 0.0,0.0,-0.06901409437138908,0.06723214817283439,-0.06454410710567676,0.06926228296505094,35.776869958166095,2.7069999999999323,1.0,35863.78,0.0,-78.34,52.14,0.17715529918670656,500000
10
+ 0.0,0.0,-0.06527669247978675,0.060693802837339904,-0.06066296473648594,0.0664032939404194,35.541443398510005,2.6979999999999382,1.0,38550.36,0.0,-76.06,51.96,0.17429033756256104,550000
11
+ 0.0,0.0,-0.06444719325873606,0.06714983720367658,-0.060744645468875424,0.057568265381749015,33.99262179142071,3.6879999999997866,0.94,41997.32,-0.08,-101.88,71.76,0.2275490427017212,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 1.0,1.0,0.032774344,3.2774343,1.0327743,1.0932425,-23.77521,-91.97807,-147.01707,0.1600882,-0.15353456,15.720018,105000
3
+ 1.0,1.0000001,0.031835515,3.1835513,1.0318357,1.4218435,-18.075861,-93.09893,-161.27055,0.2842212,-0.28069493,21.895842,110000
4
+ 1.0,0.99999994,0.027711786,2.7711787,1.0277117,1.5592369,-24.273634,-95.705574,-157.6764,0.6112,-0.68368834,30.667006,115000
5
+ 1.0,1.0000001,0.0275824,2.7582397,1.0275825,1.3217583,-15.737227,-97.25216,-159.7271,0.19395939,-0.19663891,20.816746,120000
6
+ 1.0,1.0,0.025870271,2.587027,1.0258703,1.1924757,-36.987053,-98.1174,-165.33034,0.2159443,-0.23467453,17.054049,125000
7
+ 1.0,1.0,0.025660686,2.5660686,1.0256606,1.5210073,-21.56017,-98.27798,-171.34308,0.23008533,-0.23990558,23.608383,130000
8
+ 1.0,1.0,0.027204666,2.7204669,1.0272046,6.3665085,-21.163803,-100.12323,-157.3892,1.2037358,-0.97086346,66.20146,135000
9
+ 1.0,0.99999994,0.02757203,2.757203,1.0275719,1.9145364,-32.27921,-99.10265,-163.48196,0.30442533,-0.3145899,31.85463,140000
10
+ 1.0,1.0000001,0.028245334,2.8245335,1.0282454,1.5821365,-31.48007,-97.05345,-188.46776,0.18967888,-0.13200487,18.562883,145000
11
+ 1.0,1.0,0.029247006,2.9247007,1.029247,2.5130506,-25.22242,-94.6451,-171.09814,0.5469305,-0.6774365,46.151115,150000
12
+ 1.0,0.9999999,0.031125467,3.112547,1.0311253,1.6968602,-22.493814,-93.9178,-168.32181,0.39000577,-0.37254533,23.996946,155000
13
+ 1.0,1.0,0.028160103,2.8160105,1.0281601,2.639326,-3.828883,-90.73015,-171.63512,0.9921873,-0.86885947,52.379066,160000
14
+ 1.0,1.0,0.027181972,2.7181973,1.027182,1.4002876,-17.270971,-93.44409,-174.58575,0.15795536,-0.16163401,17.743622,165000
15
+ 1.0,1.0,0.026805688,2.6805687,1.0268056,1.6040888,-7.6107574,-92.32056,-177.5878,0.27002743,-0.30091658,20.312656,170000
16
+ 1.0,1.0,0.029856231,2.985623,1.0298562,2.202814,-21.11451,-95.58227,-185.62738,1.717517,-1.6330662,41.226604,175000
17
+ 1.0,1.0,0.028749857,2.8749857,1.0287498,1.7678899,-9.644874,-95.388664,-180.31941,0.20257859,-0.26442268,21.652401,180000
18
+ 1.0,1.0,0.028368756,2.836876,1.0283687,1.8996629,-3.1878076,-95.06043,-188.65915,0.28772888,-0.5123288,29.4916,185000
19
+ 1.0,0.99999994,0.02828301,2.828301,1.028283,1.4262173,-7.318556,-94.20504,-184.68166,0.14343011,-0.1606307,17.382645,190000
20
+ 1.0,1.0,0.028992739,2.8992739,1.0289928,1.6380312,-3.1305532,-93.45379,-184.92604,0.20466472,-0.19004013,21.041492,195000
21
+ 1.0,1.0,0.028351761,2.835176,1.0283518,2.2002785,-7.10841,-91.16237,-170.61526,0.26162374,-0.26867864,28.279707,200000
22
+ 1.0,0.9999999,0.028182479,2.818248,1.0281824,1.6027899,-6.781366,-93.065025,-185.27458,0.20146504,-0.20117216,24.18475,205000
23
+ 1.0,1.0,0.02897347,2.8973467,1.0289735,1.2823778,-3.7525268,-90.68994,-168.50206,0.13532227,-0.1092464,14.987029,210000
24
+ 1.0,1.0000001,0.028144255,2.8144255,1.0281444,1.5923005,1.3301108,-90.385475,-180.58116,0.1855624,-0.17930008,20.40823,215000
25
+ 1.0,0.9999616,0.028958028,2.895803,1.0289197,1.5928963,3.9776516,-89.653175,-163.06285,0.79556763,-0.88867295,27.529282,220000
26
+ 1.0,0.99999994,0.030537017,3.0537016,1.030537,2.2458725,-11.937216,-91.877106,-182.11176,0.3400941,-0.26796144,22.769707,225000
27
+ 1.0,1.0,0.030574225,3.0574224,1.0305742,1.5653282,-15.153382,-91.25504,-182.55283,0.29095858,-0.43341208,22.444723,230000
28
+ 1.0,1.0,0.02885652,2.885652,1.0288565,1.7685711,1.313568,-89.124054,-166.1746,0.20126915,-0.22533625,21.64465,235000
29
+ 1.0,1.0,0.0298104,2.9810402,1.0298104,1.7850014,-10.748077,-86.302025,-183.13586,0.20106946,-0.20874545,21.781883,240000
30
+ 1.0,1.0,0.030701958,3.0701957,1.030702,2.452132,-9.966492,-88.22473,-181.0386,0.5202119,-0.50465596,28.07013,245000
31
+ 1.0,1.0,0.02927308,2.9273078,1.029273,1.7923872,-4.667734,-88.046524,-165.67738,0.359545,-0.25625303,22.23195,250000
32
+ 1.0,1.0,0.02831237,2.831237,1.0283123,1.2162807,-4.072564,-87.34977,-175.6577,0.15797326,-0.13864116,15.318936,255000
33
+ 1.0,1.0,0.030370828,3.037083,1.0303708,2.9208515,-2.546937,-86.439896,-179.68413,0.87395734,-0.7738875,33.678455,260000
34
+ 1.0,1.0000001,0.029941281,2.9941282,1.0299414,1.7246269,-2.4551518,-85.56594,-160.59956,0.6956084,-0.62144357,28.021894,265000
35
+ 1.0,1.0,0.032908496,3.2908494,1.0329084,3.301616,-2.2319899,-83.71052,-173.81097,0.8048148,-0.7716172,37.324787,270000
36
+ 1.0,0.99999994,0.03163052,3.1630518,1.0316305,1.8411057,-0.029120117,-87.06445,-179.74669,0.21129604,-0.35592896,20.845585,275000
37
+ 1.0,1.0,0.030466061,3.046606,1.0304661,2.3689067,-0.7425792,-85.69172,-173.48724,0.9737913,-0.8775818,39.29247,280000
38
+ 1.0,1.0,0.03192516,3.1925163,1.0319252,1.5327636,-3.656193,-83.96082,-185.29085,0.38624167,-0.23929961,20.844732,285000
39
+ 1.0,1.0,0.029626096,2.9626098,1.0296261,1.2865337,-8.097196,-82.02044,-185.11414,0.36774322,-0.43225116,20.445904,290000
40
+ 1.0,1.0,0.03017468,3.017468,1.0301747,1.1757487,-6.481999,-83.2958,-180.15736,0.17762174,-0.22414416,16.12037,295000
41
+ 1.0,1.0,0.03044125,3.044125,1.0304413,1.1878039,-6.5765266,-85.51775,-180.50961,0.12965338,-0.11892362,14.993297,300000
42
+ 1.0,1.0,0.030085644,3.0085645,1.0300857,1.2726935,0.12017433,-83.35165,-153.67169,0.14564992,-0.21433535,19.264969,305000
43
+ 1.0,1.0,0.029670909,2.967091,1.029671,1.8538548,-6.4937396,-84.59881,-167.03911,0.4017379,-0.35887247,25.394983,310000
44
+ 1.0,1.0,0.032123793,3.2123795,1.0321238,4.9606767,-6.2638125,-83.800285,-169.68092,0.33971527,-0.35840556,36.788055,315000
45
+ 1.0,1.0,0.029921956,2.9921956,1.029922,1.4314578,-2.114652,-80.57882,-167.37814,0.32194293,-0.3055415,18.554905,320000
46
+ 1.0,0.99999994,0.03079728,3.0797281,1.0307972,1.472742,-0.2836917,-81.44424,-156.57545,0.23684002,-0.34831017,17.76606,325000
47
+ 1.0,1.0,0.03252253,3.252253,1.0325226,2.1069863,-0.9545042,-82.36473,-172.43729,0.30504507,-0.2901919,21.94638,330000
48
+ 1.0,0.99999994,0.030152382,3.0152383,1.0301523,1.1832618,0.017013595,-82.11964,-172.74567,0.2357518,-0.12053896,15.507708,335000
49
+ 1.0,0.99992543,0.029715475,2.9715476,1.0296409,2.209481,2.9708118,-83.289635,-179.09962,0.52299505,-0.30461514,28.133324,340000
50
+ 1.0,1.0,0.031533606,3.1533608,1.0315336,1.2599803,-2.1205344,-81.24496,-177.42004,0.25015074,-0.32222024,19.888603,345000
51
+ 1.0,1.0,0.028018348,2.8018348,1.0280184,1.5544826,-2.3414254,-76.51045,-173.06053,0.24250296,-0.20328434,19.6653,350000
52
+ 1.0,1.0,0.031052392,3.1052394,1.0310524,1.4340402,-3.4488013,-84.92341,-164.02466,0.2571986,-0.18058455,18.308693,355000
53
+ 1.0,0.9999999,0.032303534,3.2303536,1.0323035,1.283858,1.3345565,-80.40675,-165.91072,0.25437114,-0.23836634,18.12211,360000
54
+ 1.0,1.0000001,0.032051712,3.205171,1.0320518,1.1459788,-2.703693,-80.95571,-182.12097,0.5075672,-0.45890436,17.400234,365000
55
+ 1.0,1.0,0.029962808,2.996281,1.0299628,1.0037999,-5.1022115,-81.9513,-165.93463,0.14836016,-0.13742039,13.488472,370000
56
+ 1.0,1.0,0.027147165,2.7147164,1.0271472,1.4494708,-3.6189775,-79.6572,-174.41208,0.26713037,-0.15894201,15.689156,375000
57
+ 1.0,1.0,0.030181205,3.0181208,1.0301812,1.2448612,-5.6140704,-81.461205,-167.88966,0.3864386,-0.36070836,21.89621,380000
58
+ 1.0,0.9999999,0.029202467,2.9202466,1.0292023,1.2190682,-0.7791507,-80.30688,-155.54109,0.19845238,-0.14565477,15.502027,385000
59
+ 1.0,1.0000001,0.02855375,2.8553753,1.0285538,1.6088613,-1.3206321,-79.07693,-175.06966,1.6938184,-1.7251164,34.098106,390000
60
+ 1.0,0.99999315,0.030457085,3.0457087,1.0304502,2.071902,1.2714635,-81.035484,-179.06296,1.0956709,-1.4804114,38.674454,395000
61
+ 1.0,1.0,0.028935758,2.8935757,1.0289358,1.2305905,-3.6661725,-80.41815,-161.63199,0.1343096,-0.25638235,15.827568,400000
62
+ 1.0,0.99999994,0.03178581,3.1785812,1.0317857,1.5115639,-1.3100661,-84.28002,-172.9628,0.23508501,-0.26350704,18.904182,405000
63
+ 1.0,1.0,0.03104471,3.1044712,1.0310447,1.6429285,-0.2376203,-78.08773,-162.77092,0.38271052,-0.34505835,25.191202,410000
64
+ 1.0,0.99999994,0.028552089,2.8552089,1.028552,1.5683923,-2.3638132,-77.38912,-154.27553,0.29901552,-0.3427899,22.770252,415000
65
+ 1.0,1.0,0.030336384,3.0336387,1.0303364,1.186932,-4.192255,-78.29003,-163.10117,0.14497678,-0.21412687,14.570672,420000
66
+ 1.0,1.0,0.03275743,3.275743,1.0327574,1.6903981,-0.64183027,-79.4017,-166.51668,0.31774548,-0.3509749,24.120447,425000
67
+ 1.0,1.0,0.031195242,3.119524,1.0311953,1.8878803,-3.041251,-75.570885,-161.28532,0.47474518,-0.48824558,24.291481,430000
68
+ 1.0,1.0000001,0.03182739,3.182739,1.0318274,1.7655785,-2.2475045,-78.10741,-175.83176,0.355838,-0.2608187,25.254631,435000
69
+ 1.0,1.0000001,0.03218074,3.2180738,1.0321809,3.2502835,-0.07287747,-79.2376,-157.40236,0.3316678,-0.6209378,30.323048,440000
70
+ 1.0,0.9999999,0.03159128,3.1591282,1.0315912,1.1219404,-4.2508893,-82.53801,-168.20102,0.14740884,-0.21787308,15.014231,445000
71
+ 1.0,1.0000001,0.028630637,2.8630636,1.0286307,1.0140047,1.9789938,-77.48628,-163.15143,0.17781867,-0.2522599,14.209028,450000
72
+ 1.0,1.0,0.029725479,2.972548,1.0297254,1.1093912,-0.7031282,-78.38739,-159.40454,0.20706387,-0.22369246,14.351609,455000
73
+ 1.0,1.0000001,0.029396735,2.9396734,1.0293969,1.866346,-3.4077923,-76.25256,-170.37366,0.2955889,-0.3872293,24.962719,460000
74
+ 1.0,0.99998915,0.030594924,3.0594923,1.0305841,1.7025871,-0.7289362,-77.053116,-168.2727,0.5564788,-0.49631712,21.359306,465000
75
+ 1.0,1.0,0.030428695,3.0428696,1.0304286,2.2409487,-5.519577,-75.84811,-136.6638,0.80923593,-0.8168167,32.850643,470000
76
+ 1.0,1.0,0.029387087,2.9387088,1.0293871,1.9280081,0.50478107,-73.82256,-164.7535,0.5339467,-0.52293265,24.846146,475000
77
+ 1.0,1.0,0.029863387,2.9863389,1.0298634,1.2707541,2.1815271,-75.812126,-147.56506,0.27843952,-0.2240629,15.925829,480000
78
+ 1.0,0.9999999,0.030370776,3.0370774,1.0303707,1.2416432,-4.084595,-74.16615,-156.67795,0.25534427,-0.36216944,16.368612,485000
79
+ 1.0,1.0,0.03250511,3.2505112,1.0325052,1.0163826,-2.1402812,-78.342735,-162.85678,0.15619574,-0.28395817,17.586185,490000
80
+ 1.0,1.0,0.031071544,3.1071544,1.0310715,1.3813454,-3.1357214,-79.38387,-148.08937,0.3588021,-0.51829755,20.758862,495000
81
+ 1.0,1.0000001,0.029300671,2.9300673,1.0293008,1.9654938,-3.426087,-76.44865,-141.74524,0.39007488,-0.32283652,24.048874,500000
82
+ 1.0,1.0,0.029589316,2.9589314,1.0295893,1.0607764,-2.2628438,-78.07964,-167.50966,0.32241982,-0.28564164,17.326225,505000
83
+ 1.0,0.9999999,0.032006755,3.2006757,1.0320066,1.2547177,-6.3551965,-77.872375,-153.03954,0.21408743,-0.19598311,16.03841,510000
84
+ 1.0,1.0,0.032282826,3.228283,1.0322828,2.2499013,-1.8912278,-76.29686,-151.44978,0.7725436,-0.3772579,33.548485,515000
85
+ 1.0,1.0,0.034067355,3.4067354,1.0340674,1.0663801,-1.6230657,-73.52699,-162.0798,0.21637778,-0.15455642,12.593742,520000
86
+ 1.0,1.0,0.029797029,2.979703,1.0297971,1.1965449,-1.6316009,-72.29594,-170.65988,0.15868407,-0.18614109,14.889644,525000
87
+ 1.0,0.99999994,0.030478194,3.0478194,1.0304781,1.5555328,-0.8570956,-73.245094,-147.65683,0.23839161,-0.33103323,19.716301,530000
88
+ 1.0,1.0,0.033316404,3.3316402,1.0333164,1.108349,-2.705311,-76.68551,-167.55818,0.20680618,-0.16494934,15.094501,535000
89
+ 1.0,1.0,0.029558675,2.9558678,1.0295587,1.2780452,-1.1530197,-70.263245,-155.72827,0.34698632,-0.26147532,20.478857,540000
90
+ 1.0,0.99999994,0.031751644,3.1751645,1.0317516,1.2835222,2.1195028,-75.80636,-154.40569,0.42015386,-0.27758902,16.997849,545000
91
+ 1.0,1.0000001,0.031809196,3.1809196,1.0318093,1.1487522,-6.196899,-73.57082,-154.92665,0.23775113,-0.41025722,16.49393,550000
92
+ 1.0,1.0,0.03182818,3.182818,1.0318282,1.0283337,0.16966526,-75.164154,-158.75043,0.21207249,-0.11738857,14.196728,555000
93
+ 1.0,1.0,0.030552652,3.0552654,1.0305526,0.8810099,-2.5212777,-72.41766,-143.59276,0.34712806,-0.34174347,13.278177,560000
94
+ 1.0,0.99999994,0.033734906,3.3734908,1.0337348,1.2163817,-2.130519,-73.90445,-163.6609,0.17010489,-0.119622305,15.138552,565000
95
+ 1.0,1.0,0.03219202,3.2192025,1.032192,1.5027753,1.4317808,-70.96926,-138.76143,0.9190578,-1.0211698,24.70922,570000
96
+ 1.0,1.0000001,0.030795928,3.0795927,1.030796,1.5908698,0.44193769,-71.51781,-157.17508,0.21955636,-0.289798,18.414686,575000
97
+ 1.0,0.99999994,0.032965273,3.2965274,1.0329652,1.4800255,0.6564129,-70.69915,-146.5932,0.2907906,-0.34182978,18.404882,580000
98
+ 1.0,0.9999999,0.03218526,3.218526,1.0321852,1.1645294,-1.968122,-71.18796,-156.5364,0.33026892,-0.28354946,20.493284,585000
99
+ 1.0,1.0,0.031810973,3.1810975,1.031811,1.052676,-1.712674,-72.42431,-151.20766,0.21674103,-0.2761722,14.7893,590000
100
+ 1.0,1.0,0.030376822,3.0376823,1.0303768,3.6318028,-0.39172602,-68.219826,-159.69699,0.56909096,-0.36228615,30.106056,595000
101
+ 1.0,0.99999994,0.031967625,3.1967626,1.0319675,1.3909878,-3.538613,-68.04067,-161.39017,0.5810254,-0.6094781,24.089241,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 1.0,1.0,0.032774344,3.2774343,1.0327743,1.0932425,-23.77521,-91.97807,-147.01707,0.1600882,-0.15353456,15.720018,105000
3
+ 1.0,1.0000001,0.031835515,3.1835513,1.0318357,1.4218435,-18.075861,-93.09893,-161.27055,0.2842212,-0.28069493,21.895842,110000
4
+ 1.0,0.99999994,0.027711786,2.7711787,1.0277117,1.5592369,-24.273634,-95.705574,-157.6764,0.6112,-0.68368834,30.667006,115000
5
+ 1.0,1.0000001,0.0275824,2.7582397,1.0275825,1.3217583,-15.737227,-97.25216,-159.7271,0.19395939,-0.19663891,20.816746,120000
6
+ 1.0,1.0,0.025870271,2.587027,1.0258703,1.1924757,-36.987053,-98.1174,-165.33034,0.2159443,-0.23467453,17.054049,125000
7
+ 1.0,1.0,0.025660686,2.5660686,1.0256606,1.5210073,-21.56017,-98.27798,-171.34308,0.23008533,-0.23990558,23.608383,130000
8
+ 1.0,1.0,0.027204666,2.7204669,1.0272046,6.3665085,-21.163803,-100.12323,-157.3892,1.2037358,-0.97086346,66.20146,135000
9
+ 1.0,0.99999994,0.02757203,2.757203,1.0275719,1.9145364,-32.27921,-99.10265,-163.48196,0.30442533,-0.3145899,31.85463,140000
10
+ 1.0,1.0000001,0.028245334,2.8245335,1.0282454,1.5821365,-31.48007,-97.05345,-188.46776,0.18967888,-0.13200487,18.562883,145000
11
+ 1.0,1.0,0.029247006,2.9247007,1.029247,2.5130506,-25.22242,-94.6451,-171.09814,0.5469305,-0.6774365,46.151115,150000
12
+ 1.0,0.9999999,0.031125467,3.112547,1.0311253,1.6968602,-22.493814,-93.9178,-168.32181,0.39000577,-0.37254533,23.996946,155000
13
+ 1.0,1.0,0.028160103,2.8160105,1.0281601,2.639326,-3.828883,-90.73015,-171.63512,0.9921873,-0.86885947,52.379066,160000
14
+ 1.0,1.0,0.027181972,2.7181973,1.027182,1.4002876,-17.270971,-93.44409,-174.58575,0.15795536,-0.16163401,17.743622,165000
15
+ 1.0,1.0,0.026805688,2.6805687,1.0268056,1.6040888,-7.6107574,-92.32056,-177.5878,0.27002743,-0.30091658,20.312656,170000
16
+ 1.0,1.0,0.029856231,2.985623,1.0298562,2.202814,-21.11451,-95.58227,-185.62738,1.717517,-1.6330662,41.226604,175000
17
+ 1.0,1.0,0.028749857,2.8749857,1.0287498,1.7678899,-9.644874,-95.388664,-180.31941,0.20257859,-0.26442268,21.652401,180000
18
+ 1.0,1.0,0.028368756,2.836876,1.0283687,1.8996629,-3.1878076,-95.06043,-188.65915,0.28772888,-0.5123288,29.4916,185000
19
+ 1.0,0.99999994,0.02828301,2.828301,1.028283,1.4262173,-7.318556,-94.20504,-184.68166,0.14343011,-0.1606307,17.382645,190000
20
+ 1.0,1.0,0.028992739,2.8992739,1.0289928,1.6380312,-3.1305532,-93.45379,-184.92604,0.20466472,-0.19004013,21.041492,195000
21
+ 1.0,1.0,0.028351761,2.835176,1.0283518,2.2002785,-7.10841,-91.16237,-170.61526,0.26162374,-0.26867864,28.279707,200000
22
+ 1.0,0.9999999,0.028182479,2.818248,1.0281824,1.6027899,-6.781366,-93.065025,-185.27458,0.20146504,-0.20117216,24.18475,205000
23
+ 1.0,1.0,0.02897347,2.8973467,1.0289735,1.2823778,-3.7525268,-90.68994,-168.50206,0.13532227,-0.1092464,14.987029,210000
24
+ 1.0,1.0000001,0.028144255,2.8144255,1.0281444,1.5923005,1.3301108,-90.385475,-180.58116,0.1855624,-0.17930008,20.40823,215000
25
+ 1.0,0.9999616,0.028958028,2.895803,1.0289197,1.5928963,3.9776516,-89.653175,-163.06285,0.79556763,-0.88867295,27.529282,220000
26
+ 1.0,0.99999994,0.030537017,3.0537016,1.030537,2.2458725,-11.937216,-91.877106,-182.11176,0.3400941,-0.26796144,22.769707,225000
27
+ 1.0,1.0,0.030574225,3.0574224,1.0305742,1.5653282,-15.153382,-91.25504,-182.55283,0.29095858,-0.43341208,22.444723,230000
28
+ 1.0,1.0,0.02885652,2.885652,1.0288565,1.7685711,1.313568,-89.124054,-166.1746,0.20126915,-0.22533625,21.64465,235000
29
+ 1.0,1.0,0.0298104,2.9810402,1.0298104,1.7850014,-10.748077,-86.302025,-183.13586,0.20106946,-0.20874545,21.781883,240000
30
+ 1.0,1.0,0.030701958,3.0701957,1.030702,2.452132,-9.966492,-88.22473,-181.0386,0.5202119,-0.50465596,28.07013,245000
31
+ 1.0,1.0,0.02927308,2.9273078,1.029273,1.7923872,-4.667734,-88.046524,-165.67738,0.359545,-0.25625303,22.23195,250000
32
+ 1.0,1.0,0.02831237,2.831237,1.0283123,1.2162807,-4.072564,-87.34977,-175.6577,0.15797326,-0.13864116,15.318936,255000
33
+ 1.0,1.0,0.030370828,3.037083,1.0303708,2.9208515,-2.546937,-86.439896,-179.68413,0.87395734,-0.7738875,33.678455,260000
34
+ 1.0,1.0000001,0.029941281,2.9941282,1.0299414,1.7246269,-2.4551518,-85.56594,-160.59956,0.6956084,-0.62144357,28.021894,265000
35
+ 1.0,1.0,0.032908496,3.2908494,1.0329084,3.301616,-2.2319899,-83.71052,-173.81097,0.8048148,-0.7716172,37.324787,270000
36
+ 1.0,0.99999994,0.03163052,3.1630518,1.0316305,1.8411057,-0.029120117,-87.06445,-179.74669,0.21129604,-0.35592896,20.845585,275000
37
+ 1.0,1.0,0.030466061,3.046606,1.0304661,2.3689067,-0.7425792,-85.69172,-173.48724,0.9737913,-0.8775818,39.29247,280000
38
+ 1.0,1.0,0.03192516,3.1925163,1.0319252,1.5327636,-3.656193,-83.96082,-185.29085,0.38624167,-0.23929961,20.844732,285000
39
+ 1.0,1.0,0.029626096,2.9626098,1.0296261,1.2865337,-8.097196,-82.02044,-185.11414,0.36774322,-0.43225116,20.445904,290000
40
+ 1.0,1.0,0.03017468,3.017468,1.0301747,1.1757487,-6.481999,-83.2958,-180.15736,0.17762174,-0.22414416,16.12037,295000
41
+ 1.0,1.0,0.03044125,3.044125,1.0304413,1.1878039,-6.5765266,-85.51775,-180.50961,0.12965338,-0.11892362,14.993297,300000
42
+ 1.0,1.0,0.030085644,3.0085645,1.0300857,1.2726935,0.12017433,-83.35165,-153.67169,0.14564992,-0.21433535,19.264969,305000
43
+ 1.0,1.0,0.029670909,2.967091,1.029671,1.8538548,-6.4937396,-84.59881,-167.03911,0.4017379,-0.35887247,25.394983,310000
44
+ 1.0,1.0,0.032123793,3.2123795,1.0321238,4.9606767,-6.2638125,-83.800285,-169.68092,0.33971527,-0.35840556,36.788055,315000
45
+ 1.0,1.0,0.029921956,2.9921956,1.029922,1.4314578,-2.114652,-80.57882,-167.37814,0.32194293,-0.3055415,18.554905,320000
46
+ 1.0,0.99999994,0.03079728,3.0797281,1.0307972,1.472742,-0.2836917,-81.44424,-156.57545,0.23684002,-0.34831017,17.76606,325000
47
+ 1.0,1.0,0.03252253,3.252253,1.0325226,2.1069863,-0.9545042,-82.36473,-172.43729,0.30504507,-0.2901919,21.94638,330000
48
+ 1.0,0.99999994,0.030152382,3.0152383,1.0301523,1.1832618,0.017013595,-82.11964,-172.74567,0.2357518,-0.12053896,15.507708,335000
49
+ 1.0,0.99992543,0.029715475,2.9715476,1.0296409,2.209481,2.9708118,-83.289635,-179.09962,0.52299505,-0.30461514,28.133324,340000
50
+ 1.0,1.0,0.031533606,3.1533608,1.0315336,1.2599803,-2.1205344,-81.24496,-177.42004,0.25015074,-0.32222024,19.888603,345000
51
+ 1.0,1.0,0.028018348,2.8018348,1.0280184,1.5544826,-2.3414254,-76.51045,-173.06053,0.24250296,-0.20328434,19.6653,350000
52
+ 1.0,1.0,0.031052392,3.1052394,1.0310524,1.4340402,-3.4488013,-84.92341,-164.02466,0.2571986,-0.18058455,18.308693,355000
53
+ 1.0,0.9999999,0.032303534,3.2303536,1.0323035,1.283858,1.3345565,-80.40675,-165.91072,0.25437114,-0.23836634,18.12211,360000
54
+ 1.0,1.0000001,0.032051712,3.205171,1.0320518,1.1459788,-2.703693,-80.95571,-182.12097,0.5075672,-0.45890436,17.400234,365000
55
+ 1.0,1.0,0.029962808,2.996281,1.0299628,1.0037999,-5.1022115,-81.9513,-165.93463,0.14836016,-0.13742039,13.488472,370000
56
+ 1.0,1.0,0.027147165,2.7147164,1.0271472,1.4494708,-3.6189775,-79.6572,-174.41208,0.26713037,-0.15894201,15.689156,375000
57
+ 1.0,1.0,0.030181205,3.0181208,1.0301812,1.2448612,-5.6140704,-81.461205,-167.88966,0.3864386,-0.36070836,21.89621,380000
58
+ 1.0,0.9999999,0.029202467,2.9202466,1.0292023,1.2190682,-0.7791507,-80.30688,-155.54109,0.19845238,-0.14565477,15.502027,385000
59
+ 1.0,1.0000001,0.02855375,2.8553753,1.0285538,1.6088613,-1.3206321,-79.07693,-175.06966,1.6938184,-1.7251164,34.098106,390000
60
+ 1.0,0.99999315,0.030457085,3.0457087,1.0304502,2.071902,1.2714635,-81.035484,-179.06296,1.0956709,-1.4804114,38.674454,395000
61
+ 1.0,1.0,0.028935758,2.8935757,1.0289358,1.2305905,-3.6661725,-80.41815,-161.63199,0.1343096,-0.25638235,15.827568,400000
62
+ 1.0,0.99999994,0.03178581,3.1785812,1.0317857,1.5115639,-1.3100661,-84.28002,-172.9628,0.23508501,-0.26350704,18.904182,405000
63
+ 1.0,1.0,0.03104471,3.1044712,1.0310447,1.6429285,-0.2376203,-78.08773,-162.77092,0.38271052,-0.34505835,25.191202,410000
64
+ 1.0,0.99999994,0.028552089,2.8552089,1.028552,1.5683923,-2.3638132,-77.38912,-154.27553,0.29901552,-0.3427899,22.770252,415000
65
+ 1.0,1.0,0.030336384,3.0336387,1.0303364,1.186932,-4.192255,-78.29003,-163.10117,0.14497678,-0.21412687,14.570672,420000
66
+ 1.0,1.0,0.03275743,3.275743,1.0327574,1.6903981,-0.64183027,-79.4017,-166.51668,0.31774548,-0.3509749,24.120447,425000
67
+ 1.0,1.0,0.031195242,3.119524,1.0311953,1.8878803,-3.041251,-75.570885,-161.28532,0.47474518,-0.48824558,24.291481,430000
68
+ 1.0,1.0000001,0.03182739,3.182739,1.0318274,1.7655785,-2.2475045,-78.10741,-175.83176,0.355838,-0.2608187,25.254631,435000
69
+ 1.0,1.0000001,0.03218074,3.2180738,1.0321809,3.2502835,-0.07287747,-79.2376,-157.40236,0.3316678,-0.6209378,30.323048,440000
70
+ 1.0,0.9999999,0.03159128,3.1591282,1.0315912,1.1219404,-4.2508893,-82.53801,-168.20102,0.14740884,-0.21787308,15.014231,445000
71
+ 1.0,1.0000001,0.028630637,2.8630636,1.0286307,1.0140047,1.9789938,-77.48628,-163.15143,0.17781867,-0.2522599,14.209028,450000
72
+ 1.0,1.0,0.029725479,2.972548,1.0297254,1.1093912,-0.7031282,-78.38739,-159.40454,0.20706387,-0.22369246,14.351609,455000
73
+ 1.0,1.0000001,0.029396735,2.9396734,1.0293969,1.866346,-3.4077923,-76.25256,-170.37366,0.2955889,-0.3872293,24.962719,460000
74
+ 1.0,0.99998915,0.030594924,3.0594923,1.0305841,1.7025871,-0.7289362,-77.053116,-168.2727,0.5564788,-0.49631712,21.359306,465000
75
+ 1.0,1.0,0.030428695,3.0428696,1.0304286,2.2409487,-5.519577,-75.84811,-136.6638,0.80923593,-0.8168167,32.850643,470000
76
+ 1.0,1.0,0.029387087,2.9387088,1.0293871,1.9280081,0.50478107,-73.82256,-164.7535,0.5339467,-0.52293265,24.846146,475000
77
+ 1.0,1.0,0.029863387,2.9863389,1.0298634,1.2707541,2.1815271,-75.812126,-147.56506,0.27843952,-0.2240629,15.925829,480000
78
+ 1.0,0.9999999,0.030370776,3.0370774,1.0303707,1.2416432,-4.084595,-74.16615,-156.67795,0.25534427,-0.36216944,16.368612,485000
79
+ 1.0,1.0,0.03250511,3.2505112,1.0325052,1.0163826,-2.1402812,-78.342735,-162.85678,0.15619574,-0.28395817,17.586185,490000
80
+ 1.0,1.0,0.031071544,3.1071544,1.0310715,1.3813454,-3.1357214,-79.38387,-148.08937,0.3588021,-0.51829755,20.758862,495000
81
+ 1.0,1.0000001,0.029300671,2.9300673,1.0293008,1.9654938,-3.426087,-76.44865,-141.74524,0.39007488,-0.32283652,24.048874,500000
82
+ 1.0,1.0,0.029589316,2.9589314,1.0295893,1.0607764,-2.2628438,-78.07964,-167.50966,0.32241982,-0.28564164,17.326225,505000
83
+ 1.0,0.9999999,0.032006755,3.2006757,1.0320066,1.2547177,-6.3551965,-77.872375,-153.03954,0.21408743,-0.19598311,16.03841,510000
84
+ 1.0,1.0,0.032282826,3.228283,1.0322828,2.2499013,-1.8912278,-76.29686,-151.44978,0.7725436,-0.3772579,33.548485,515000
85
+ 1.0,1.0,0.034067355,3.4067354,1.0340674,1.0663801,-1.6230657,-73.52699,-162.0798,0.21637778,-0.15455642,12.593742,520000
86
+ 1.0,1.0,0.029797029,2.979703,1.0297971,1.1965449,-1.6316009,-72.29594,-170.65988,0.15868407,-0.18614109,14.889644,525000
87
+ 1.0,0.99999994,0.030478194,3.0478194,1.0304781,1.5555328,-0.8570956,-73.245094,-147.65683,0.23839161,-0.33103323,19.716301,530000
88
+ 1.0,1.0,0.033316404,3.3316402,1.0333164,1.108349,-2.705311,-76.68551,-167.55818,0.20680618,-0.16494934,15.094501,535000
89
+ 1.0,1.0,0.029558675,2.9558678,1.0295587,1.2780452,-1.1530197,-70.263245,-155.72827,0.34698632,-0.26147532,20.478857,540000
90
+ 1.0,0.99999994,0.031751644,3.1751645,1.0317516,1.2835222,2.1195028,-75.80636,-154.40569,0.42015386,-0.27758902,16.997849,545000
91
+ 1.0,1.0000001,0.031809196,3.1809196,1.0318093,1.1487522,-6.196899,-73.57082,-154.92665,0.23775113,-0.41025722,16.49393,550000
92
+ 1.0,1.0,0.03182818,3.182818,1.0318282,1.0283337,0.16966526,-75.164154,-158.75043,0.21207249,-0.11738857,14.196728,555000
93
+ 1.0,1.0,0.030552652,3.0552654,1.0305526,0.8810099,-2.5212777,-72.41766,-143.59276,0.34712806,-0.34174347,13.278177,560000
94
+ 1.0,0.99999994,0.033734906,3.3734908,1.0337348,1.2163817,-2.130519,-73.90445,-163.6609,0.17010489,-0.119622305,15.138552,565000
95
+ 1.0,1.0,0.03219202,3.2192025,1.032192,1.5027753,1.4317808,-70.96926,-138.76143,0.9190578,-1.0211698,24.70922,570000
96
+ 1.0,1.0000001,0.030795928,3.0795927,1.030796,1.5908698,0.44193769,-71.51781,-157.17508,0.21955636,-0.289798,18.414686,575000
97
+ 1.0,0.99999994,0.032965273,3.2965274,1.0329652,1.4800255,0.6564129,-70.69915,-146.5932,0.2907906,-0.34182978,18.404882,580000
98
+ 1.0,0.9999999,0.03218526,3.218526,1.0321852,1.1645294,-1.968122,-71.18796,-156.5364,0.33026892,-0.28354946,20.493284,585000
99
+ 1.0,1.0,0.031810973,3.1810975,1.031811,1.052676,-1.712674,-72.42431,-151.20766,0.21674103,-0.2761722,14.7893,590000
100
+ 1.0,1.0,0.030376822,3.0376823,1.0303768,3.6318028,-0.39172602,-68.219826,-159.69699,0.56909096,-0.36228615,30.106056,595000
101
+ 1.0,0.99999994,0.031967625,3.1967626,1.0319675,1.3909878,-3.538613,-68.04067,-161.39017,0.5810254,-0.6094781,24.089241,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d44bcd35774595728af67825b08775d995a7677585b94430f8a606f6853d912e
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35dc22367e564c9c72920b3d4d843c22e35451598caf84daf20f168a0f72cf1a
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47da02c8d1cc2c98e1b3b72fce6df8a5f164907a10ac05573ae15eb832264e2c
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62aa3bace9a703519bc49969ccd888f58eb32159c1e19ddf7f017a44dcc9fd49
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15379947ca07efed8a3ebf8a96d216e663ed27e5eb9740e9943a4f8d3cdcda25
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9b48b8ba731646433f3db806472f8b97697db9121e56d014227f652d6ca1f90
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6228cd5a50422655dad459e79d9faa0ceb3ab0e491d4f7878c8d9d295bd07ca
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c85bf018e11a1daad446c2304e5fd4125c7feda8d1d7a5df773003ea53fbc2b0
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:870d9595b3836d65c0d2bb2f9bcbc3e22dbe1eb90488e7c4b52fa8fab6042898
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c0af8f75c45ee9a3b10ac53ead00e8d0878b71701f2c170b4c7d15d5c78a94a
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_104054/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/9p3hd9v5