Tiredsheep commited on
Commit
12bb778
·
verified ·
1 Parent(s): fc00e93

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_350000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_400000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_450000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_500000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_550000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_600000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_650000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_700000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_750000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_800000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.04282830816094977,-0.00012293608146269315,-0.041690472630144554,0.007105941252878568,27.83180481203074,9.186999999999108,0.8,4545.04,-0.3,-256.96,181.74,0.5639923858642578,350000
3
+ 0.0,0.0,-0.06221163625495219,0.032367165109573465,-0.06113429526382985,-0.003801925367609371,28.96558423568568,7.814999999999276,0.82,13658.66,-0.34,-267.04,154.3,0.4666427135467529,400000
4
+ 0.0,0.0,-0.060652132489156727,0.04882220055164859,-0.056653199636389005,0.04174926314085777,34.16196538023772,4.575999999999727,0.96,19975.48,-0.08,-139.68,89.52,0.2888590145111084,450000
5
+ 0.0,0.0,-0.07030779800349042,0.0498941244813069,-0.066264861498018,0.04842425563478959,35.39926446487472,4.037999999999813,0.98,23705.78,-0.02,-112.02,78.76,0.26009866237640383,500000
6
+ 0.0,0.0,-0.0697714024780041,0.058424291275668956,-0.06551227670111003,0.1121741545177756,34.29968070856652,4.78299999999975,0.94,28833.58,-0.06,-128.06,93.66,0.2952264928817749,550000
7
+ 0.0,0.0,-0.06283801962139493,0.048522558837145145,-0.05932229349353395,0.051722501928293765,33.040565834893194,4.159999999999751,0.96,33344.96,-0.06,-116.54,81.2,0.26340507984161377,600000
8
+ 0.0,0.0,-0.06234732179190664,0.05687454375058551,-0.05847178228360296,0.058549140135818696,34.45078011857752,4.212999999999778,0.94,37349.78,-0.08,-109.44,82.26,0.266047306060791,650000
9
+ 0.0,0.0,-0.06855706145893337,0.05819578369813279,-0.0647821909188096,0.06255509055342139,35.09145632433152,3.3329999999998345,0.96,41183.0,-0.06,-93.94,64.66,0.2129999303817749,700000
10
+ 0.0,0.0,-0.06465282540860906,0.042792685560819124,-0.06041098398024768,0.06539141224001695,34.717336779566054,2.773999999999923,1.0,44022.92,0.0,-78.12,53.48,0.18061086654663086,750000
11
+ 0.0,0.0,-0.05351378723106064,0.04415969249901216,-0.04932830963076607,0.06487790424935362,34.68477198646255,3.2359999999998457,0.96,47117.02,-0.04,-84.1,62.72,0.204510178565979,800000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.04282830816094977,-0.00012293608146269315,-0.041690472630144554,0.007105941252878568,27.83180481203074,9.186999999999108,0.8,4545.04,-0.3,-256.96,181.74,0.5639923858642578,350000
3
+ 0.0,0.0,-0.06221163625495219,0.032367165109573465,-0.06113429526382985,-0.003801925367609371,28.96558423568568,7.814999999999276,0.82,13658.66,-0.34,-267.04,154.3,0.4666427135467529,400000
4
+ 0.0,0.0,-0.060652132489156727,0.04882220055164859,-0.056653199636389005,0.04174926314085777,34.16196538023772,4.575999999999727,0.96,19975.48,-0.08,-139.68,89.52,0.2888590145111084,450000
5
+ 0.0,0.0,-0.07030779800349042,0.0498941244813069,-0.066264861498018,0.04842425563478959,35.39926446487472,4.037999999999813,0.98,23705.78,-0.02,-112.02,78.76,0.26009866237640383,500000
6
+ 0.0,0.0,-0.0697714024780041,0.058424291275668956,-0.06551227670111003,0.1121741545177756,34.29968070856652,4.78299999999975,0.94,28833.58,-0.06,-128.06,93.66,0.2952264928817749,550000
7
+ 0.0,0.0,-0.06283801962139493,0.048522558837145145,-0.05932229349353395,0.051722501928293765,33.040565834893194,4.159999999999751,0.96,33344.96,-0.06,-116.54,81.2,0.26340507984161377,600000
8
+ 0.0,0.0,-0.06234732179190664,0.05687454375058551,-0.05847178228360296,0.058549140135818696,34.45078011857752,4.212999999999778,0.94,37349.78,-0.08,-109.44,82.26,0.266047306060791,650000
9
+ 0.0,0.0,-0.06855706145893337,0.05819578369813279,-0.0647821909188096,0.06255509055342139,35.09145632433152,3.3329999999998345,0.96,41183.0,-0.06,-93.94,64.66,0.2129999303817749,700000
10
+ 0.0,0.0,-0.06465282540860906,0.042792685560819124,-0.06041098398024768,0.06539141224001695,34.717336779566054,2.773999999999923,1.0,44022.92,0.0,-78.12,53.48,0.18061086654663086,750000
11
+ 0.0,0.0,-0.05351378723106064,0.04415969249901216,-0.04932830963076607,0.06487790424935362,34.68477198646255,3.2359999999998457,0.96,47117.02,-0.04,-84.1,62.72,0.204510178565979,800000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 1.0,1.0,0.025970446,2.5970447,1.0259705,0.61797017,-24.327396,-102.1219,-164.98207,0.17441538,-0.15975727,9.351312,305000
3
+ 1.0,1.0,0.024198644,2.4198647,1.0241987,0.98557514,-23.998299,-103.44277,-166.37785,0.7783513,-0.8673335,21.170956,310000
4
+ 1.0,1.0,0.02279361,2.2793612,1.0227937,0.93565714,-28.933817,-106.68423,-176.3245,0.12134427,-0.122952916,12.474191,315000
5
+ 1.0,1.0000001,0.022773342,2.2773342,1.0227735,1.6021703,-23.472734,-106.96023,-185.2901,1.4559342,-1.6074111,46.552155,320000
6
+ 1.0,1.0,0.023886522,2.3886523,1.0238866,0.9559885,-40.056564,-105.52886,-187.2561,0.09516618,-0.09845582,11.181156,325000
7
+ 1.0,1.0000001,0.024195768,2.4195766,1.0241959,1.1675915,-13.632698,-102.67061,-189.329,0.25979096,-0.25629005,19.00258,330000
8
+ 1.0,1.0,0.024336517,2.433652,1.0243366,1.3106807,-12.586526,-102.45811,-187.25758,0.6124355,-0.59153634,29.252857,335000
9
+ 1.0,0.99999994,0.024821166,2.4821167,1.0248212,2.3970692,-32.095455,-104.410515,-175.45593,1.0803895,-1.1375939,39.177917,340000
10
+ 1.0,1.0000001,0.02500773,2.500773,1.0250078,1.7950035,-24.833326,-102.249016,-200.38692,0.43900657,-0.47564027,24.241295,345000
11
+ 1.0,1.0,0.026817784,2.6817784,1.0268178,1.9322785,-23.329155,-101.54619,-179.43999,0.75198764,-0.6283168,32.181236,350000
12
+ 1.0,1.0,0.02633738,2.633738,1.0263374,1.9671745,-8.133112,-99.71804,-190.21053,0.91923624,-0.8747534,32.69053,355000
13
+ 1.0,1.0,0.027504835,2.7504835,1.0275048,1.347749,-23.00677,-97.6818,-189.5472,0.23139882,-0.28074902,20.395578,360000
14
+ 1.0,1.0,0.02593712,2.593712,1.0259371,1.3600177,-20.220642,-94.66597,-187.67415,0.28263286,-0.25005642,18.987928,365000
15
+ 1.0,0.99999994,0.026539763,2.6539764,1.0265397,1.4376891,-10.259895,-91.938126,-196.85551,0.22555135,-0.24404359,15.463736,370000
16
+ 1.0,1.0000002,0.029647395,2.9647396,1.0296476,2.093026,-24.879921,-93.2969,-189.80333,0.6199899,-0.6904321,32.90751,375000
17
+ 1.0,0.99999994,0.029641354,2.9641354,1.0296413,2.8429334,-6.753205,-93.804,-180.04564,0.22864452,-0.28644386,22.350397,380000
18
+ 1.0,0.99999994,0.028743897,2.8743896,1.0287439,1.2493395,-3.482328,-92.5494,-178.198,0.45098293,-0.57453597,23.32129,385000
19
+ 1.0,1.0,0.030125756,3.0125754,1.0301257,1.4858295,-13.328147,-90.66831,-184.16116,0.2663263,-0.22266287,19.334219,390000
20
+ 1.0,1.0,0.030704072,3.070407,1.030704,1.4174905,1.4585557,-91.84765,-174.84428,0.18346721,-0.16610174,16.984112,395000
21
+ 1.0,0.99999994,0.028152477,2.8152478,1.0281525,1.174852,-19.192045,-86.13014,-160.22984,0.3018727,-0.19470216,14.601456,400000
22
+ 1.0,1.0,0.029939774,2.9939775,1.0299398,1.137135,-1.367926,-87.66848,-165.08939,0.14824641,-0.15510102,12.757724,405000
23
+ 1.0,0.99999994,0.030181902,3.0181901,1.0301819,1.6288594,-15.692904,-87.709755,-156.14171,0.37674382,-0.33528775,24.011173,410000
24
+ 1.0,0.9998845,0.029349096,2.9349098,1.0292336,1.0171874,1.9547448,-84.91956,-179.92557,0.224294,-0.14463592,12.607237,415000
25
+ 1.0,1.0,0.030203335,3.0203338,1.0302033,0.9725605,-7.612387,-84.70607,-173.13293,0.16637543,-0.22601117,14.511656,420000
26
+ 1.0,1.0,0.029837746,2.983775,1.0298377,1.4719096,-4.523689,-86.43562,-172.28146,0.24101304,-0.4022084,21.746063,425000
27
+ 1.0,0.99999994,0.031215683,3.1215682,1.0312157,1.1666243,-0.621766,-86.52639,-173.84575,0.18478253,-0.13005427,15.246854,430000
28
+ 1.0,0.9999389,0.030666508,3.0666509,1.0306054,1.3576425,1.3815085,-84.50162,-161.53247,0.3761146,-0.22600876,19.066484,435000
29
+ 1.0,0.99999994,0.031642217,3.1642218,1.0316422,1.3217419,-5.035165,-80.033,-173.03848,0.38146323,-0.4314169,21.916441,440000
30
+ 1.0,0.9999999,0.031383082,3.1383083,1.0313829,1.1573004,-3.65542,-82.10425,-163.45523,0.14388916,-0.12313154,14.391802,445000
31
+ 1.0,1.0,0.030858772,3.0858774,1.0308588,1.3424736,-3.709149,-82.378044,-190.84026,0.20015103,-0.21729986,15.850815,450000
32
+ 1.0,1.0000001,0.029661484,2.9661486,1.0296617,2.1374233,-1.9868177,-83.40203,-188.55676,0.8654126,-0.8754444,37.308678,455000
33
+ 1.0,1.0,0.030179318,3.017932,1.0301793,1.4842345,-0.21859603,-85.39974,-171.95277,0.34767607,-0.22139913,18.637077,460000
34
+ 1.0,1.0,0.03074146,3.074146,1.0307415,1.1450975,-1.1607375,-83.54258,-166.8056,0.1860245,-0.2961151,18.06142,465000
35
+ 1.0,0.99999994,0.03373386,3.3733861,1.0337338,1.339273,-6.300381,-80.80837,-169.58092,0.6987014,-0.6940768,26.906128,470000
36
+ 1.0,1.0,0.03259988,3.2599883,1.0325999,1.8981717,-0.77594745,-84.019554,-178.02205,0.5587725,-0.3400071,23.869677,475000
37
+ 1.0,0.999905,0.030698944,3.0698946,1.0306039,1.7692112,2.3665307,-83.74553,-173.58675,0.4186941,-0.41102505,23.606571,480000
38
+ 1.0,0.9999999,0.03167137,3.1671371,1.0316713,1.2740253,-0.44332445,-80.48379,-162.8863,0.3127696,-0.28837344,15.915227,485000
39
+ 1.0,1.0,0.031455263,3.1455264,1.0314553,1.6969767,-13.836949,-79.78822,-167.91647,0.60418046,-0.62567663,30.689327,490000
40
+ 1.0,1.0,0.033401582,3.3401585,1.0334016,1.4847941,-8.586334,-80.1708,-171.52502,0.14482026,-0.20694083,17.05365,495000
41
+ 1.0,0.99999994,0.031268936,3.1268935,1.0312688,1.209678,-2.7779028,-80.297935,-173.72461,0.3260636,-0.39363047,22.495419,500000
42
+ 1.0,1.0,0.032819696,3.2819698,1.0328197,1.2413424,-4.4433513,-80.049,-172.7935,0.24822594,-0.32857692,17.431831,505000
43
+ 1.0,1.0,0.032206334,3.2206337,1.0322063,0.99547255,-2.0257387,-78.47825,-159.94205,0.26130122,-0.17986342,16.022758,510000
44
+ 1.0,1.0,0.03184907,3.184907,1.031849,1.5465404,-6.743034,-80.90395,-171.89903,0.21831024,-0.22446845,20.02318,515000
45
+ 1.0,1.0,0.031025518,3.1025517,1.0310255,1.3203449,-5.5931,-78.168236,-169.48325,0.30399337,-0.4825654,20.675695,520000
46
+ 1.0,1.0,0.030954044,3.0954046,1.030954,1.6724478,-3.6360633,-76.43373,-145.50067,0.29218525,-0.46965092,25.039577,525000
47
+ 1.0,1.0,0.03419694,3.419694,1.034197,1.3715729,-6.2684956,-81.52063,-157.6875,0.20582281,-0.24045487,17.452372,530000
48
+ 1.0,1.0,0.029367778,2.936778,1.0293678,1.3024606,-2.4041758,-78.330284,-154.91835,0.141869,-0.14368004,14.08783,535000
49
+ 1.0,0.9999012,0.030907474,3.0907476,1.0308087,1.4228268,1.2555124,-78.415565,-168.78181,0.78444,-0.5195512,31.483822,540000
50
+ 1.0,0.9999999,0.0337763,3.3776298,1.0337762,1.351764,-3.5755327,-81.46997,-152.02417,0.22034785,-0.1984426,15.18378,545000
51
+ 1.0,1.0,0.029828142,2.9828143,1.0298282,2.3572137,0.2679395,-74.508934,-173.46431,0.3351168,-0.46852615,26.10388,550000
52
+ 1.0,1.0,0.031699724,3.1699724,1.0316998,1.2801898,0.8271607,-79.29699,-162.04356,0.18852474,-0.28073752,14.616115,555000
53
+ 1.0,1.0,0.031780906,3.178091,1.031781,1.625774,1.3246003,-76.07964,-171.21703,0.4283538,-0.41769668,22.14267,560000
54
+ 1.0,1.0,0.03344983,3.344983,1.0334499,16.017694,-1.4612627,-75.648125,-171.92348,3.3133323,-3.3451102,95.795135,565000
55
+ 1.0,1.0000001,0.030947067,3.094707,1.0309472,1.6849556,0.7214161,-76.21171,-153.61516,0.34507835,-0.3120985,22.81577,570000
56
+ 1.0,1.0,0.030237097,3.0237095,1.0302371,1.5069698,-0.595807,-75.60787,-175.41429,0.4352113,-0.15727258,18.072308,575000
57
+ 1.0,1.0,0.031588245,3.1588247,1.0315882,1.2193358,-2.9080946,-75.9464,-162.61143,0.27560276,-0.35351598,16.492746,580000
58
+ 1.0,1.0,0.030126799,3.01268,1.0301268,1.1559385,-4.1794643,-75.33663,-161.75754,0.29052818,-0.34248358,15.277493,585000
59
+ 1.0,0.99999994,0.029949972,2.9949975,1.0299499,1.1157866,-1.8244305,-72.82251,-168.13348,0.21694712,-0.16966791,15.092472,590000
60
+ 1.0,1.0,0.03200285,3.2002852,1.0320028,2.2222068,1.2567415,-75.29958,-153.51605,0.28892347,-0.3703931,25.73973,595000
61
+ 1.0,1.0,0.029341798,2.93418,1.0293418,1.0068554,-2.0198584,-76.202965,-160.56458,0.23660174,-0.18319799,11.321814,600000
62
+ 1.0,0.99999994,0.032258797,3.22588,1.0322587,2.6988413,-0.7239052,-76.63749,-150.8965,0.68426996,-0.70081484,33.10107,605000
63
+ 1.0,1.0,0.03558142,3.5581422,1.0355815,1.5785003,-5.101623,-73.95965,-154.1837,0.22952145,-0.22787346,18.722895,610000
64
+ 1.0,0.99999994,0.030895427,3.0895426,1.0308954,1.3040155,-5.044939,-75.2369,-150.12013,2.787803,-2.82185,34.990284,615000
65
+ 1.0,0.9999999,0.032885164,3.2885165,1.0328851,1.1160873,-4.0502987,-73.55358,-148.9154,0.2696564,-0.14822036,15.908524,620000
66
+ 1.0,0.99999994,0.03491494,3.4914942,1.0349149,1.3472639,-3.152269,-72.53079,-176.00545,0.21937364,-0.31539676,17.786564,625000
67
+ 1.0,0.99999994,0.031720348,3.172035,1.0317203,1.4399548,-2.6382403,-72.104126,-142.33696,0.3083681,-0.5282302,23.567396,630000
68
+ 1.0,0.99999994,0.032286264,3.2286263,1.0322862,1.5705748,-2.468065,-71.757744,-170.16425,0.20047921,-0.22548467,21.150293,635000
69
+ 1.0,1.0,0.032496672,3.2496672,1.0324967,1.1775327,-0.77121735,-73.92078,-148.00293,0.18685286,-0.18910535,15.325074,640000
70
+ 1.0,1.0,0.03228181,3.228181,1.0322818,1.2618818,-1.9631743,-76.65282,-154.2353,0.15404934,-0.18152857,15.768902,645000
71
+ 1.0,1.0,0.029512506,2.9512506,1.0295125,1.2127136,-3.5900738,-70.93663,-154.27995,0.29151207,-0.27993584,18.57493,650000
72
+ 1.0,0.9999999,0.031470135,3.1470137,1.0314701,1.1232098,1.4667127,-77.14154,-163.62471,0.20630932,-0.16764575,12.823296,655000
73
+ 1.0,1.0,0.030943763,3.0943763,1.0309438,1.0791585,-4.7858787,-70.91695,-160.8167,0.120213546,-0.26107085,12.854346,660000
74
+ 1.0,0.99999994,0.030199796,3.0199795,1.0301998,1.14361,-3.5024016,-72.28202,-158.71751,0.16492786,-0.29146308,15.387384,665000
75
+ 1.0,1.0,0.030801263,3.0801263,1.0308013,1.369837,-3.8097172,-70.67834,-141.4685,0.17607671,-0.17866711,15.826492,670000
76
+ 1.0,1.0000001,0.031449042,3.1449044,1.0314492,2.6550965,0.61832976,-71.54462,-162.30405,0.2691045,-0.3915677,25.754328,675000
77
+ 1.0,1.0000001,0.03187311,3.187311,1.0318732,1.7178322,-1.9108498,-73.47057,-151.91049,0.43845862,-0.34298536,22.142466,680000
78
+ 1.0,0.99999994,0.032033782,3.2033782,1.0320337,1.3725023,-6.0816736,-73.18013,-152.22961,0.36489367,-0.3861867,17.481806,685000
79
+ 1.0,0.99999994,0.035278056,3.5278058,1.035278,1.3051045,-6.802564,-74.438255,-162.61978,0.22680324,-0.33500135,21.514647,690000
80
+ 1.0,1.0,0.031692423,3.1692424,1.0316924,1.3266491,-6.7748857,-73.13553,-135.03961,0.32267055,-0.18928246,15.705068,695000
81
+ 1.0,1.0000001,0.032505848,3.2505844,1.032506,1.8400964,-0.4125327,-71.42125,-147.94923,0.29090878,-0.41242343,26.23286,700000
82
+ 1.0,1.0,0.030766511,3.0766513,1.0307665,1.1338634,-0.6511265,-69.57879,-159.24617,0.16429389,-0.3549353,14.974909,705000
83
+ 1.0,1.0,0.032606572,3.2606568,1.0326066,1.1511444,0.31815112,-72.11944,-138.8939,0.58689976,-0.65151083,22.271599,710000
84
+ 1.0,1.0,0.030843128,3.084313,1.0308431,1.2358466,-5.8933325,-69.614456,-153.08177,0.3505729,-0.35293922,17.546595,715000
85
+ 1.0,1.0,0.03484597,3.484597,1.034846,1.2776264,-2.9479403,-69.73804,-148.94511,0.2815615,-0.25882635,14.67079,720000
86
+ 1.0,1.0000001,0.033019986,3.3019986,1.0330201,1.0122999,-1.8517076,-70.11432,-162.63448,0.22147627,-0.16788472,14.029137,725000
87
+ 1.0,0.99999994,0.03505851,3.505851,1.0350585,1.1720668,-6.164068,-68.51537,-149.3577,0.16140425,-0.14975393,14.543343,730000
88
+ 1.0,1.0,0.033847503,3.3847504,1.0338475,1.4934441,-1.6866816,-71.18555,-157.40546,0.4522859,-0.33478385,19.780056,735000
89
+ 1.0,0.99999994,0.03305051,3.3050513,1.0330504,1.1364739,-3.033078,-65.76893,-146.1934,0.22095922,-0.2421422,13.419214,740000
90
+ 1.0,1.0,0.03388377,3.388377,1.0338838,0.89143753,-2.5165186,-72.707115,-139.53392,0.12855297,-0.21848407,12.204435,745000
91
+ 1.0,1.0,0.032122504,3.2122502,1.0321225,1.2144057,-1.4629948,-67.90535,-145.89539,0.34964505,-0.20484483,14.536982,750000
92
+ 1.0,1.0,0.030859383,3.0859385,1.0308594,2.905049,0.18387985,-67.61903,-148.88385,0.32593668,-0.18808894,18.432854,755000
93
+ 1.0,1.0,0.032328416,3.2328417,1.0323284,1.11977,-2.938629,-67.11894,-131.53659,0.2885465,-0.19455637,15.464851,760000
94
+ 1.0,1.0,0.0351802,3.5180202,1.0351802,0.9154064,-4.0914273,-66.38386,-141.36455,0.17471592,-0.16705902,13.351176,765000
95
+ 1.0,1.0,0.03437395,3.437395,1.034374,1.5323299,0.08685258,-66.84939,-131.24068,0.5782699,-0.61017936,23.542889,770000
96
+ 1.0,1.0,0.03137696,3.1376963,1.031377,1.116166,-0.49188706,-67.96752,-146.40535,0.21924964,-0.31558943,16.625122,775000
97
+ 1.0,1.0,0.032022875,3.2022877,1.0320228,1.3057535,0.7701128,-66.7344,-134.0267,0.6199541,-0.65984535,18.416992,780000
98
+ 1.0,1.0,0.034123898,3.4123898,1.0341239,0.79152,-1.6244937,-65.2934,-167.721,0.18452904,-0.20514823,11.737368,785000
99
+ 1.0,1.0,0.03284663,3.284663,1.0328467,1.5301571,-1.272017,-66.81696,-149.69717,0.45190057,-0.4174839,24.294365,790000
100
+ 1.0,0.99999994,0.030926447,3.0926447,1.0309263,1.3812237,-3.38074,-64.26676,-147.28783,0.2918481,-0.5710223,20.813961,795000
101
+ 1.0,1.0,0.033369966,3.336997,1.03337,1.5455695,0.92182755,-65.57903,-151.04001,0.7860269,-0.67315143,22.234379,800000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 1.0,1.0,0.025970446,2.5970447,1.0259705,0.61797017,-24.327396,-102.1219,-164.98207,0.17441538,-0.15975727,9.351312,305000
3
+ 1.0,1.0,0.024198644,2.4198647,1.0241987,0.98557514,-23.998299,-103.44277,-166.37785,0.7783513,-0.8673335,21.170956,310000
4
+ 1.0,1.0,0.02279361,2.2793612,1.0227937,0.93565714,-28.933817,-106.68423,-176.3245,0.12134427,-0.122952916,12.474191,315000
5
+ 1.0,1.0000001,0.022773342,2.2773342,1.0227735,1.6021703,-23.472734,-106.96023,-185.2901,1.4559342,-1.6074111,46.552155,320000
6
+ 1.0,1.0,0.023886522,2.3886523,1.0238866,0.9559885,-40.056564,-105.52886,-187.2561,0.09516618,-0.09845582,11.181156,325000
7
+ 1.0,1.0000001,0.024195768,2.4195766,1.0241959,1.1675915,-13.632698,-102.67061,-189.329,0.25979096,-0.25629005,19.00258,330000
8
+ 1.0,1.0,0.024336517,2.433652,1.0243366,1.3106807,-12.586526,-102.45811,-187.25758,0.6124355,-0.59153634,29.252857,335000
9
+ 1.0,0.99999994,0.024821166,2.4821167,1.0248212,2.3970692,-32.095455,-104.410515,-175.45593,1.0803895,-1.1375939,39.177917,340000
10
+ 1.0,1.0000001,0.02500773,2.500773,1.0250078,1.7950035,-24.833326,-102.249016,-200.38692,0.43900657,-0.47564027,24.241295,345000
11
+ 1.0,1.0,0.026817784,2.6817784,1.0268178,1.9322785,-23.329155,-101.54619,-179.43999,0.75198764,-0.6283168,32.181236,350000
12
+ 1.0,1.0,0.02633738,2.633738,1.0263374,1.9671745,-8.133112,-99.71804,-190.21053,0.91923624,-0.8747534,32.69053,355000
13
+ 1.0,1.0,0.027504835,2.7504835,1.0275048,1.347749,-23.00677,-97.6818,-189.5472,0.23139882,-0.28074902,20.395578,360000
14
+ 1.0,1.0,0.02593712,2.593712,1.0259371,1.3600177,-20.220642,-94.66597,-187.67415,0.28263286,-0.25005642,18.987928,365000
15
+ 1.0,0.99999994,0.026539763,2.6539764,1.0265397,1.4376891,-10.259895,-91.938126,-196.85551,0.22555135,-0.24404359,15.463736,370000
16
+ 1.0,1.0000002,0.029647395,2.9647396,1.0296476,2.093026,-24.879921,-93.2969,-189.80333,0.6199899,-0.6904321,32.90751,375000
17
+ 1.0,0.99999994,0.029641354,2.9641354,1.0296413,2.8429334,-6.753205,-93.804,-180.04564,0.22864452,-0.28644386,22.350397,380000
18
+ 1.0,0.99999994,0.028743897,2.8743896,1.0287439,1.2493395,-3.482328,-92.5494,-178.198,0.45098293,-0.57453597,23.32129,385000
19
+ 1.0,1.0,0.030125756,3.0125754,1.0301257,1.4858295,-13.328147,-90.66831,-184.16116,0.2663263,-0.22266287,19.334219,390000
20
+ 1.0,1.0,0.030704072,3.070407,1.030704,1.4174905,1.4585557,-91.84765,-174.84428,0.18346721,-0.16610174,16.984112,395000
21
+ 1.0,0.99999994,0.028152477,2.8152478,1.0281525,1.174852,-19.192045,-86.13014,-160.22984,0.3018727,-0.19470216,14.601456,400000
22
+ 1.0,1.0,0.029939774,2.9939775,1.0299398,1.137135,-1.367926,-87.66848,-165.08939,0.14824641,-0.15510102,12.757724,405000
23
+ 1.0,0.99999994,0.030181902,3.0181901,1.0301819,1.6288594,-15.692904,-87.709755,-156.14171,0.37674382,-0.33528775,24.011173,410000
24
+ 1.0,0.9998845,0.029349096,2.9349098,1.0292336,1.0171874,1.9547448,-84.91956,-179.92557,0.224294,-0.14463592,12.607237,415000
25
+ 1.0,1.0,0.030203335,3.0203338,1.0302033,0.9725605,-7.612387,-84.70607,-173.13293,0.16637543,-0.22601117,14.511656,420000
26
+ 1.0,1.0,0.029837746,2.983775,1.0298377,1.4719096,-4.523689,-86.43562,-172.28146,0.24101304,-0.4022084,21.746063,425000
27
+ 1.0,0.99999994,0.031215683,3.1215682,1.0312157,1.1666243,-0.621766,-86.52639,-173.84575,0.18478253,-0.13005427,15.246854,430000
28
+ 1.0,0.9999389,0.030666508,3.0666509,1.0306054,1.3576425,1.3815085,-84.50162,-161.53247,0.3761146,-0.22600876,19.066484,435000
29
+ 1.0,0.99999994,0.031642217,3.1642218,1.0316422,1.3217419,-5.035165,-80.033,-173.03848,0.38146323,-0.4314169,21.916441,440000
30
+ 1.0,0.9999999,0.031383082,3.1383083,1.0313829,1.1573004,-3.65542,-82.10425,-163.45523,0.14388916,-0.12313154,14.391802,445000
31
+ 1.0,1.0,0.030858772,3.0858774,1.0308588,1.3424736,-3.709149,-82.378044,-190.84026,0.20015103,-0.21729986,15.850815,450000
32
+ 1.0,1.0000001,0.029661484,2.9661486,1.0296617,2.1374233,-1.9868177,-83.40203,-188.55676,0.8654126,-0.8754444,37.308678,455000
33
+ 1.0,1.0,0.030179318,3.017932,1.0301793,1.4842345,-0.21859603,-85.39974,-171.95277,0.34767607,-0.22139913,18.637077,460000
34
+ 1.0,1.0,0.03074146,3.074146,1.0307415,1.1450975,-1.1607375,-83.54258,-166.8056,0.1860245,-0.2961151,18.06142,465000
35
+ 1.0,0.99999994,0.03373386,3.3733861,1.0337338,1.339273,-6.300381,-80.80837,-169.58092,0.6987014,-0.6940768,26.906128,470000
36
+ 1.0,1.0,0.03259988,3.2599883,1.0325999,1.8981717,-0.77594745,-84.019554,-178.02205,0.5587725,-0.3400071,23.869677,475000
37
+ 1.0,0.999905,0.030698944,3.0698946,1.0306039,1.7692112,2.3665307,-83.74553,-173.58675,0.4186941,-0.41102505,23.606571,480000
38
+ 1.0,0.9999999,0.03167137,3.1671371,1.0316713,1.2740253,-0.44332445,-80.48379,-162.8863,0.3127696,-0.28837344,15.915227,485000
39
+ 1.0,1.0,0.031455263,3.1455264,1.0314553,1.6969767,-13.836949,-79.78822,-167.91647,0.60418046,-0.62567663,30.689327,490000
40
+ 1.0,1.0,0.033401582,3.3401585,1.0334016,1.4847941,-8.586334,-80.1708,-171.52502,0.14482026,-0.20694083,17.05365,495000
41
+ 1.0,0.99999994,0.031268936,3.1268935,1.0312688,1.209678,-2.7779028,-80.297935,-173.72461,0.3260636,-0.39363047,22.495419,500000
42
+ 1.0,1.0,0.032819696,3.2819698,1.0328197,1.2413424,-4.4433513,-80.049,-172.7935,0.24822594,-0.32857692,17.431831,505000
43
+ 1.0,1.0,0.032206334,3.2206337,1.0322063,0.99547255,-2.0257387,-78.47825,-159.94205,0.26130122,-0.17986342,16.022758,510000
44
+ 1.0,1.0,0.03184907,3.184907,1.031849,1.5465404,-6.743034,-80.90395,-171.89903,0.21831024,-0.22446845,20.02318,515000
45
+ 1.0,1.0,0.031025518,3.1025517,1.0310255,1.3203449,-5.5931,-78.168236,-169.48325,0.30399337,-0.4825654,20.675695,520000
46
+ 1.0,1.0,0.030954044,3.0954046,1.030954,1.6724478,-3.6360633,-76.43373,-145.50067,0.29218525,-0.46965092,25.039577,525000
47
+ 1.0,1.0,0.03419694,3.419694,1.034197,1.3715729,-6.2684956,-81.52063,-157.6875,0.20582281,-0.24045487,17.452372,530000
48
+ 1.0,1.0,0.029367778,2.936778,1.0293678,1.3024606,-2.4041758,-78.330284,-154.91835,0.141869,-0.14368004,14.08783,535000
49
+ 1.0,0.9999012,0.030907474,3.0907476,1.0308087,1.4228268,1.2555124,-78.415565,-168.78181,0.78444,-0.5195512,31.483822,540000
50
+ 1.0,0.9999999,0.0337763,3.3776298,1.0337762,1.351764,-3.5755327,-81.46997,-152.02417,0.22034785,-0.1984426,15.18378,545000
51
+ 1.0,1.0,0.029828142,2.9828143,1.0298282,2.3572137,0.2679395,-74.508934,-173.46431,0.3351168,-0.46852615,26.10388,550000
52
+ 1.0,1.0,0.031699724,3.1699724,1.0316998,1.2801898,0.8271607,-79.29699,-162.04356,0.18852474,-0.28073752,14.616115,555000
53
+ 1.0,1.0,0.031780906,3.178091,1.031781,1.625774,1.3246003,-76.07964,-171.21703,0.4283538,-0.41769668,22.14267,560000
54
+ 1.0,1.0,0.03344983,3.344983,1.0334499,16.017694,-1.4612627,-75.648125,-171.92348,3.3133323,-3.3451102,95.795135,565000
55
+ 1.0,1.0000001,0.030947067,3.094707,1.0309472,1.6849556,0.7214161,-76.21171,-153.61516,0.34507835,-0.3120985,22.81577,570000
56
+ 1.0,1.0,0.030237097,3.0237095,1.0302371,1.5069698,-0.595807,-75.60787,-175.41429,0.4352113,-0.15727258,18.072308,575000
57
+ 1.0,1.0,0.031588245,3.1588247,1.0315882,1.2193358,-2.9080946,-75.9464,-162.61143,0.27560276,-0.35351598,16.492746,580000
58
+ 1.0,1.0,0.030126799,3.01268,1.0301268,1.1559385,-4.1794643,-75.33663,-161.75754,0.29052818,-0.34248358,15.277493,585000
59
+ 1.0,0.99999994,0.029949972,2.9949975,1.0299499,1.1157866,-1.8244305,-72.82251,-168.13348,0.21694712,-0.16966791,15.092472,590000
60
+ 1.0,1.0,0.03200285,3.2002852,1.0320028,2.2222068,1.2567415,-75.29958,-153.51605,0.28892347,-0.3703931,25.73973,595000
61
+ 1.0,1.0,0.029341798,2.93418,1.0293418,1.0068554,-2.0198584,-76.202965,-160.56458,0.23660174,-0.18319799,11.321814,600000
62
+ 1.0,0.99999994,0.032258797,3.22588,1.0322587,2.6988413,-0.7239052,-76.63749,-150.8965,0.68426996,-0.70081484,33.10107,605000
63
+ 1.0,1.0,0.03558142,3.5581422,1.0355815,1.5785003,-5.101623,-73.95965,-154.1837,0.22952145,-0.22787346,18.722895,610000
64
+ 1.0,0.99999994,0.030895427,3.0895426,1.0308954,1.3040155,-5.044939,-75.2369,-150.12013,2.787803,-2.82185,34.990284,615000
65
+ 1.0,0.9999999,0.032885164,3.2885165,1.0328851,1.1160873,-4.0502987,-73.55358,-148.9154,0.2696564,-0.14822036,15.908524,620000
66
+ 1.0,0.99999994,0.03491494,3.4914942,1.0349149,1.3472639,-3.152269,-72.53079,-176.00545,0.21937364,-0.31539676,17.786564,625000
67
+ 1.0,0.99999994,0.031720348,3.172035,1.0317203,1.4399548,-2.6382403,-72.104126,-142.33696,0.3083681,-0.5282302,23.567396,630000
68
+ 1.0,0.99999994,0.032286264,3.2286263,1.0322862,1.5705748,-2.468065,-71.757744,-170.16425,0.20047921,-0.22548467,21.150293,635000
69
+ 1.0,1.0,0.032496672,3.2496672,1.0324967,1.1775327,-0.77121735,-73.92078,-148.00293,0.18685286,-0.18910535,15.325074,640000
70
+ 1.0,1.0,0.03228181,3.228181,1.0322818,1.2618818,-1.9631743,-76.65282,-154.2353,0.15404934,-0.18152857,15.768902,645000
71
+ 1.0,1.0,0.029512506,2.9512506,1.0295125,1.2127136,-3.5900738,-70.93663,-154.27995,0.29151207,-0.27993584,18.57493,650000
72
+ 1.0,0.9999999,0.031470135,3.1470137,1.0314701,1.1232098,1.4667127,-77.14154,-163.62471,0.20630932,-0.16764575,12.823296,655000
73
+ 1.0,1.0,0.030943763,3.0943763,1.0309438,1.0791585,-4.7858787,-70.91695,-160.8167,0.120213546,-0.26107085,12.854346,660000
74
+ 1.0,0.99999994,0.030199796,3.0199795,1.0301998,1.14361,-3.5024016,-72.28202,-158.71751,0.16492786,-0.29146308,15.387384,665000
75
+ 1.0,1.0,0.030801263,3.0801263,1.0308013,1.369837,-3.8097172,-70.67834,-141.4685,0.17607671,-0.17866711,15.826492,670000
76
+ 1.0,1.0000001,0.031449042,3.1449044,1.0314492,2.6550965,0.61832976,-71.54462,-162.30405,0.2691045,-0.3915677,25.754328,675000
77
+ 1.0,1.0000001,0.03187311,3.187311,1.0318732,1.7178322,-1.9108498,-73.47057,-151.91049,0.43845862,-0.34298536,22.142466,680000
78
+ 1.0,0.99999994,0.032033782,3.2033782,1.0320337,1.3725023,-6.0816736,-73.18013,-152.22961,0.36489367,-0.3861867,17.481806,685000
79
+ 1.0,0.99999994,0.035278056,3.5278058,1.035278,1.3051045,-6.802564,-74.438255,-162.61978,0.22680324,-0.33500135,21.514647,690000
80
+ 1.0,1.0,0.031692423,3.1692424,1.0316924,1.3266491,-6.7748857,-73.13553,-135.03961,0.32267055,-0.18928246,15.705068,695000
81
+ 1.0,1.0000001,0.032505848,3.2505844,1.032506,1.8400964,-0.4125327,-71.42125,-147.94923,0.29090878,-0.41242343,26.23286,700000
82
+ 1.0,1.0,0.030766511,3.0766513,1.0307665,1.1338634,-0.6511265,-69.57879,-159.24617,0.16429389,-0.3549353,14.974909,705000
83
+ 1.0,1.0,0.032606572,3.2606568,1.0326066,1.1511444,0.31815112,-72.11944,-138.8939,0.58689976,-0.65151083,22.271599,710000
84
+ 1.0,1.0,0.030843128,3.084313,1.0308431,1.2358466,-5.8933325,-69.614456,-153.08177,0.3505729,-0.35293922,17.546595,715000
85
+ 1.0,1.0,0.03484597,3.484597,1.034846,1.2776264,-2.9479403,-69.73804,-148.94511,0.2815615,-0.25882635,14.67079,720000
86
+ 1.0,1.0000001,0.033019986,3.3019986,1.0330201,1.0122999,-1.8517076,-70.11432,-162.63448,0.22147627,-0.16788472,14.029137,725000
87
+ 1.0,0.99999994,0.03505851,3.505851,1.0350585,1.1720668,-6.164068,-68.51537,-149.3577,0.16140425,-0.14975393,14.543343,730000
88
+ 1.0,1.0,0.033847503,3.3847504,1.0338475,1.4934441,-1.6866816,-71.18555,-157.40546,0.4522859,-0.33478385,19.780056,735000
89
+ 1.0,0.99999994,0.03305051,3.3050513,1.0330504,1.1364739,-3.033078,-65.76893,-146.1934,0.22095922,-0.2421422,13.419214,740000
90
+ 1.0,1.0,0.03388377,3.388377,1.0338838,0.89143753,-2.5165186,-72.707115,-139.53392,0.12855297,-0.21848407,12.204435,745000
91
+ 1.0,1.0,0.032122504,3.2122502,1.0321225,1.2144057,-1.4629948,-67.90535,-145.89539,0.34964505,-0.20484483,14.536982,750000
92
+ 1.0,1.0,0.030859383,3.0859385,1.0308594,2.905049,0.18387985,-67.61903,-148.88385,0.32593668,-0.18808894,18.432854,755000
93
+ 1.0,1.0,0.032328416,3.2328417,1.0323284,1.11977,-2.938629,-67.11894,-131.53659,0.2885465,-0.19455637,15.464851,760000
94
+ 1.0,1.0,0.0351802,3.5180202,1.0351802,0.9154064,-4.0914273,-66.38386,-141.36455,0.17471592,-0.16705902,13.351176,765000
95
+ 1.0,1.0,0.03437395,3.437395,1.034374,1.5323299,0.08685258,-66.84939,-131.24068,0.5782699,-0.61017936,23.542889,770000
96
+ 1.0,1.0,0.03137696,3.1376963,1.031377,1.116166,-0.49188706,-67.96752,-146.40535,0.21924964,-0.31558943,16.625122,775000
97
+ 1.0,1.0,0.032022875,3.2022877,1.0320228,1.3057535,0.7701128,-66.7344,-134.0267,0.6199541,-0.65984535,18.416992,780000
98
+ 1.0,1.0,0.034123898,3.4123898,1.0341239,0.79152,-1.6244937,-65.2934,-167.721,0.18452904,-0.20514823,11.737368,785000
99
+ 1.0,1.0,0.03284663,3.284663,1.0328467,1.5301571,-1.272017,-66.81696,-149.69717,0.45190057,-0.4174839,24.294365,790000
100
+ 1.0,0.99999994,0.030926447,3.0926447,1.0309263,1.3812237,-3.38074,-64.26676,-147.28783,0.2918481,-0.5710223,20.813961,795000
101
+ 1.0,1.0,0.033369966,3.336997,1.03337,1.5455695,0.92182755,-65.57903,-151.04001,0.7860269,-0.67315143,22.234379,800000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d49b87f25ba6505c15cbc065721f193a38f0d29321bfd6ee70350b881abc943
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b13d12c092eb1b876a3b5d6e77f8a72c00ece3c7acbf8c6b279157b2f8135c6
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:240936d15a9255371bd32d4dc207637f20d3dce7fcd828b533b43989816be8d6
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8428724225e18f75dbd6a85fea030f25e6836a859bf2a59b1eb4151e92de5673
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f104558933378ce790ba42751c0de9f2e347ab8fe41ff513d6bb915ce073d14f
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0e2a9bcf56794ef76714d2a75582a17ac3bcf07bc5003fa6737d750ff78748c
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66fcf819a5dd0d6d0d1dd6adca0ae188b239dcf2482ea30932f006cc448f92a5
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05902dd2d9c440de59b03e298268cb5f697f6f7db26bbb10225df45ca2fc3e96
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ae4ef763e10376756770db82da19cfa9304b8a3f3bc7e40928d3745f8ab55ea
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f9a217469888ad95299b6d94038249fb794b6ba980caf3d55e2a99245e1660b
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_125232/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/iq6nm65z