Tiredsheep commited on
Commit
732dfd3
·
verified ·
1 Parent(s): a14193e

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1000000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1050000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1100000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1150000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1200000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_750000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_800000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_850000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_900000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_950000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.020264853252635592,-0.005407346477807357,-0.019335609445779275,-0.02371159297989488,26.76092923675909,8.34499999999928,0.84,3861.54,-0.22,-236.14,164.9,0.5651007795333862,750000
3
+ 0.0,0.0,-0.026139405194360588,0.011444584785547041,-0.024945803277505806,0.0037697963596363196,33.72779904528973,5.628999999999744,0.94,11495.24,-0.08,-153.96,110.58,0.3495628261566162,800000
4
+ 0.0,0.0,-0.0420695551479682,0.025245198408926205,-0.04047154266685685,0.010276321118691225,33.87308955370947,4.3009999999998625,0.96,16046.98,-0.04,-110.38,84.02,0.28444026470184325,850000
5
+ 0.0,0.0,-0.03790129005226323,0.038063675209538676,-0.035956150092924084,0.029216847347266203,34.218191380432,4.421999999999774,0.94,20894.68,-0.06,-121.66,86.44,0.27287257194519043,900000
6
+ 0.0,0.0,-0.03813167078202632,0.03328377560616838,-0.035528113455253314,0.03534875499619008,35.305628455800445,2.7789999999999155,1.0,24711.58,0.0,-76.12,53.58,0.1804073905944824,950000
7
+ 0.0,0.0,-0.03540433641287757,0.04806811553949735,-0.03263426301328477,0.05789555974567652,34.54246812137347,3.881999999999778,0.96,28549.46,-0.08,-118.1,75.64,0.2408988046646118,1000000
8
+ 0.0,0.0,-0.03750684726674135,0.04614151394501952,-0.034289795892071526,0.03950262487758873,35.48389182572202,2.936999999999888,0.98,31493.56,-0.04,-86.4,56.74,0.19544536590576173,1050000
9
+ 0.0,0.0,-0.03652945034181664,0.04417998354084703,-0.033528981994137584,0.05428610069811135,35.62125978646346,2.609999999999953,1.0,34210.16,0.0,-71.66,50.2,0.16621946334838866,1100000
10
+ 0.0,0.0,-0.057052425279297735,0.04817057754345527,-0.05364102195948961,0.054364656571635694,34.51163834312884,3.4969999999998165,0.96,37140.44,-0.06,-107.72,67.94,0.21675355911254882,1150000
11
+ 0.0,0.0,-0.04775132876360858,0.06453600926386531,-0.0439217120910967,0.06323749135626422,35.12531185811779,3.0249999999998782,0.98,40567.86,-0.04,-91.04,58.5,0.18239949703216551,1200000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.020264853252635592,-0.005407346477807357,-0.019335609445779275,-0.02371159297989488,26.76092923675909,8.34499999999928,0.84,3861.54,-0.22,-236.14,164.9,0.5651007795333862,750000
3
+ 0.0,0.0,-0.026139405194360588,0.011444584785547041,-0.024945803277505806,0.0037697963596363196,33.72779904528973,5.628999999999744,0.94,11495.24,-0.08,-153.96,110.58,0.3495628261566162,800000
4
+ 0.0,0.0,-0.0420695551479682,0.025245198408926205,-0.04047154266685685,0.010276321118691225,33.87308955370947,4.3009999999998625,0.96,16046.98,-0.04,-110.38,84.02,0.28444026470184325,850000
5
+ 0.0,0.0,-0.03790129005226323,0.038063675209538676,-0.035956150092924084,0.029216847347266203,34.218191380432,4.421999999999774,0.94,20894.68,-0.06,-121.66,86.44,0.27287257194519043,900000
6
+ 0.0,0.0,-0.03813167078202632,0.03328377560616838,-0.035528113455253314,0.03534875499619008,35.305628455800445,2.7789999999999155,1.0,24711.58,0.0,-76.12,53.58,0.1804073905944824,950000
7
+ 0.0,0.0,-0.03540433641287757,0.04806811553949735,-0.03263426301328477,0.05789555974567652,34.54246812137347,3.881999999999778,0.96,28549.46,-0.08,-118.1,75.64,0.2408988046646118,1000000
8
+ 0.0,0.0,-0.03750684726674135,0.04614151394501952,-0.034289795892071526,0.03950262487758873,35.48389182572202,2.936999999999888,0.98,31493.56,-0.04,-86.4,56.74,0.19544536590576173,1050000
9
+ 0.0,0.0,-0.03652945034181664,0.04417998354084703,-0.033528981994137584,0.05428610069811135,35.62125978646346,2.609999999999953,1.0,34210.16,0.0,-71.66,50.2,0.16621946334838866,1100000
10
+ 0.0,0.0,-0.057052425279297735,0.04817057754345527,-0.05364102195948961,0.054364656571635694,34.51163834312884,3.4969999999998165,0.96,37140.44,-0.06,-107.72,67.94,0.21675355911254882,1150000
11
+ 0.0,0.0,-0.04775132876360858,0.06453600926386531,-0.0439217120910967,0.06323749135626422,35.12531185811779,3.0249999999998782,0.98,40567.86,-0.04,-91.04,58.5,0.18239949703216551,1200000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 1.0,1.0,0.024012838,2.4012837,1.0240128,1.2723457,-24.662727,-105.29711,-185.35219,0.1526872,-0.095688134,8.740143,705000
3
+ 1.0,1.0,0.023707345,2.3707347,1.0237074,0.57563,-21.409925,-103.93418,-176.364,0.124592625,-0.1309376,7.901575,710000
4
+ 1.0,1.0,0.021445667,2.144567,1.0214456,0.94369525,-28.925314,-107.92338,-183.50214,0.29171798,-0.32674506,15.2024,715000
5
+ 1.0,1.0,0.021710001,2.1710002,1.02171,1.2623943,-27.273762,-107.90281,-195.46007,0.30311868,-0.3164054,13.47684,720000
6
+ 1.0,1.0,0.021689832,2.1689832,1.0216899,1.187218,-38.0472,-107.88372,-192.3461,0.12650031,-0.13121921,10.256374,725000
7
+ 1.0,1.0,0.02261357,2.261357,1.0226135,1.370944,-37.19675,-107.159294,-190.44743,0.36622426,-0.31513196,20.202456,730000
8
+ 1.0,1.0,0.022743465,2.2743468,1.0227435,1.3030539,-22.920933,-106.38744,-191.91328,0.43704677,-0.5308689,19.961607,735000
9
+ 1.0,1.0,0.023134911,2.3134913,1.023135,1.3013569,-31.241083,-105.46362,-181.18753,0.39850184,-0.41642624,18.882904,740000
10
+ 1.0,0.9999999,0.022217914,2.2217913,1.0222178,15.816063,-4.545556,-106.10779,-203.57996,0.8917403,-0.9023798,69.60323,745000
11
+ 1.0,0.99999994,0.025379065,2.5379066,1.0253791,1.5135564,-1.7106844,-103.20542,-179.71254,0.55518377,-0.5701973,29.989235,750000
12
+ 1.0,1.0,0.024754705,2.4754705,1.0247548,1.0268643,-11.461878,-102.24599,-195.19115,0.2204624,-0.21521577,13.575521,755000
13
+ 1.0,0.99999994,0.025807545,2.5807543,1.0258075,1.3389372,-4.798184,-100.192986,-185.30006,0.1803965,-0.3550552,16.726248,760000
14
+ 1.0,1.0,0.024380768,2.438077,1.0243808,1.3034371,-14.634602,-97.91239,-192.23311,0.41207725,-0.44214237,18.508484,765000
15
+ 1.0,1.0,0.025879923,2.5879922,1.02588,5.1159167,-14.520742,-94.81141,-204.06117,0.43491724,-0.37131694,26.403204,770000
16
+ 1.0,1.0,0.027208291,2.720829,1.0272083,1.455141,-2.9311323,-96.06028,-190.6495,0.38222775,-0.42751676,19.495255,775000
17
+ 1.0,1.0,0.028343529,2.8343527,1.0283436,1.2564484,-4.0549994,-94.173256,-179.43459,0.2945637,-0.1377712,16.378197,780000
18
+ 1.0,1.0,0.02620868,2.6208682,1.0262086,1.1520796,-2.7153132,-95.87205,-193.40872,0.1848624,-0.13725185,15.162318,785000
19
+ 1.0,1.0,0.028331881,2.8331883,1.0283319,1.2493715,-4.2247844,-95.35549,-187.41042,0.1549953,-0.15605935,14.706223,790000
20
+ 1.0,0.99999994,0.027650537,2.7650535,1.0276505,1.51111,-4.0733714,-93.49097,-187.895,0.31820005,-0.20418857,17.69716,795000
21
+ 1.0,1.0,0.026879538,2.687954,1.0268795,1.1600558,-1.0246199,-89.64431,-165.19139,0.27406466,-0.11211168,14.886754,800000
22
+ 1.0,1.0,0.028145652,2.8145654,1.0281457,1.0951366,-5.804304,-93.18801,-185.3236,0.2797567,-0.16926031,13.477581,805000
23
+ 1.0,1.0,0.026933746,2.6933746,1.0269338,1.160848,-0.13398013,-92.82406,-159.06303,0.09052866,-0.23654807,12.004321,810000
24
+ 1.0,0.9999482,0.027906943,2.7906947,1.0278552,1.1321156,1.1132469,-89.17222,-173.7459,0.1684756,-0.15176775,13.733924,815000
25
+ 1.0,1.0000001,0.028558536,2.8558536,1.0285586,1.598738,-9.57521,-90.41593,-170.23042,0.19958007,-0.37521458,21.522892,820000
26
+ 1.0,0.99999994,0.027587354,2.7587357,1.0275873,1.1488405,-5.830238,-90.32376,-165.724,0.18674333,-0.20193203,13.69313,825000
27
+ 1.0,1.0,0.028519005,2.8519006,1.028519,1.4919982,-0.26551977,-91.311104,-175.01666,0.2380815,-0.21282303,18.195503,830000
28
+ 1.0,0.99991584,0.028381238,2.8381238,1.0282971,0.9269621,1.8265023,-90.30597,-169.50179,0.15068623,-0.22912535,12.916338,835000
29
+ 1.0,0.99999994,0.029831605,2.9831607,1.0298315,3.357578,-7.9902587,-86.33682,-167.55916,0.5330514,-0.59384537,35.54627,840000
30
+ 1.0,1.0,0.02840748,2.8407478,1.0284075,1.3195412,-5.6388235,-89.75706,-196.29399,0.12191413,-0.17293268,13.512232,845000
31
+ 1.0,1.0,0.027947836,2.7947834,1.0279478,1.1123797,-1.090759,-88.21664,-187.01724,0.16956486,-0.3363493,16.65753,850000
32
+ 1.0,1.0,0.027949307,2.7949307,1.0279493,1.8840573,-6.319189,-87.863014,-187.52267,0.24761726,-0.37375957,22.993511,855000
33
+ 1.0,1.0,0.02857348,2.857348,1.0285735,1.5124453,-4.017386,-90.4908,-187.51408,0.24783431,-0.4442185,19.346916,860000
34
+ 1.0,1.0,0.028072929,2.807293,1.028073,1.0615629,-1.3906708,-87.02603,-182.02057,0.35503715,-0.3527348,17.937408,865000
35
+ 1.0,0.99998295,0.029781995,2.9781997,1.0297649,1.5408785,0.8411551,-86.66303,-189.05011,0.21484037,-0.19484034,17.868538,870000
36
+ 1.0,1.0,0.028663471,2.8663473,1.0286635,1.2389568,-0.7721813,-90.15779,-184.09096,0.10674888,-0.14631559,11.288504,875000
37
+ 1.0,1.0,0.027509792,2.7509794,1.0275098,1.3351091,0.17237698,-87.42756,-193.55305,0.43300843,-0.47023168,17.957443,880000
38
+ 1.0,1.0,0.02880209,2.880209,1.028802,1.1192135,-4.4047194,-83.28618,-162.6812,0.15110199,-0.273574,14.277037,885000
39
+ 1.0,1.0,0.027743874,2.7743874,1.0277438,1.3349017,-2.6192358,-82.86458,-201.68796,0.21840008,-0.27212664,18.265041,890000
40
+ 1.0,0.99999994,0.028557446,2.8557446,1.0285574,1.0260231,-0.92979515,-85.89008,-196.98602,0.15248533,-0.37137547,16.83471,895000
41
+ 1.0,1.0,0.028781444,2.8781445,1.0287814,1.7520306,-2.6716874,-83.56286,-199.63364,0.29224885,-0.30344552,18.16819,900000
42
+ 1.0,1.0,0.028700247,2.8700252,1.0287002,0.956798,1.7310927,-84.246925,-168.9958,0.23966132,-0.23269057,13.323522,905000
43
+ 1.0,1.0,0.028465884,2.8465886,1.0284659,1.1331698,-2.3298173,-85.93447,-167.68211,0.32857147,-0.37641168,17.80765,910000
44
+ 1.0,1.0,0.028369656,2.8369656,1.0283697,1.0912105,1.5263796,-83.59518,-186.4214,0.31856316,-0.1470359,16.350925,915000
45
+ 1.0,1.0000001,0.027730804,2.7730803,1.027731,1.564505,0.24879187,-83.18184,-184.5336,0.5704717,-0.5377143,22.763288,920000
46
+ 1.0,1.0,0.029524812,2.9524813,1.0295248,1.4130989,-0.23850597,-84.09878,-167.06125,0.23170128,-0.19484165,18.21174,925000
47
+ 1.0,1.0,0.030538704,3.0538707,1.0305387,1.4501625,-2.701228,-84.68267,-171.29672,0.54826343,-0.54156107,17.908714,930000
48
+ 1.0,1.0,0.028250806,2.8250806,1.0282508,1.466508,1.2978963,-82.19287,-171.39853,0.30140448,-0.15948565,15.481417,935000
49
+ 1.0,0.9999229,0.027275976,2.7275977,1.0271988,1.3917176,1.7950208,-84.8374,-184.55214,0.2703735,-0.23539652,19.753155,940000
50
+ 1.0,1.0,0.030505903,3.0505905,1.0305059,1.1502289,-5.643862,-85.479645,-179.82677,0.14381987,-0.43954343,19.067928,945000
51
+ 1.0,1.0,0.0258137,2.58137,1.0258137,2.89737,0.9131657,-77.84419,-186.56885,0.4433033,-0.31167126,27.10165,950000
52
+ 1.0,1.0,0.02875876,2.8758762,1.0287588,1.255955,-0.83540833,-84.54818,-181.79503,0.33612266,-0.34618255,16.592096,955000
53
+ 1.0,0.99999505,0.029632924,2.9632924,1.0296279,1.0571977,1.4050438,-81.5748,-180.69098,0.2304138,-0.21569042,14.098614,960000
54
+ 1.0,1.0,0.029349979,2.9349978,1.0293499,1.1782897,-5.8922925,-81.81655,-200.74324,0.19837955,-0.20909712,15.862142,965000
55
+ 1.0,1.0,0.02783557,2.7835574,1.0278356,0.9220519,-6.096468,-81.83041,-161.69658,0.14673844,-0.154044,12.447058,970000
56
+ 1.0,1.0000001,0.02637513,2.6375132,1.0263753,1.1732345,-1.8829153,-81.57527,-201.88097,0.3029332,-0.21158093,16.1036,975000
57
+ 1.0,1.0,0.02802156,2.802156,1.0280216,0.95352507,-3.1705449,-82.65246,-185.30136,0.19359645,-0.16939348,11.208377,980000
58
+ 1.0,1.0,0.029657496,2.9657497,1.0296575,1.4957966,0.017994478,-80.607506,-170.46194,0.21292496,-0.3869986,17.675045,985000
59
+ 1.0,1.0,0.028041875,2.8041875,1.0280418,1.5556835,-2.5521023,-79.334526,-187.42195,0.4586102,-0.31144822,21.023714,990000
60
+ 1.0,1.0,0.02829137,2.829137,1.0282913,1.3142264,0.6155375,-79.31854,-178.30893,0.5995166,-0.6327397,23.166058,995000
61
+ 1.0,1.0,0.026534284,2.6534286,1.0265343,1.6561803,-4.212124,-81.98434,-173.1492,0.31248426,-0.4481518,20.72166,1000000
62
+ 1.0,1.0,0.030182008,3.0182009,1.030182,1.1862125,-5.7683887,-84.4824,-174.07268,0.31856415,-0.23030755,16.205898,1005000
63
+ 1.0,0.99999994,0.03004419,3.0044193,1.0300441,1.1586212,-5.5077353,-79.120094,-174.0701,0.34982383,-0.23077941,14.599337,1010000
64
+ 1.0,1.0,0.027140193,2.7140193,1.0271401,1.1860598,-1.3777947,-79.19021,-158.81319,0.42857862,-0.43100813,17.898163,1015000
65
+ 1.0,1.0,0.028470434,2.8470435,1.0284704,0.861907,0.8567828,-78.9825,-167.24942,0.17467666,-0.13387677,10.987938,1020000
66
+ 1.0,1.0,0.02895967,2.895967,1.0289596,1.0698975,0.12888281,-79.87421,-184.14401,0.258761,-0.2528072,13.034304,1025000
67
+ 1.0,1.0,0.02832482,2.8324819,1.0283248,1.5477357,-1.8458403,-79.95991,-164.2332,0.27233574,-0.311223,18.863976,1030000
68
+ 1.0,1.0,0.02892049,2.8920493,1.0289205,1.2520822,-1.5454396,-78.85424,-198.42805,0.13739352,-0.27068868,14.510336,1035000
69
+ 1.0,1.0,0.028910423,2.8910422,1.0289104,1.0282582,-1.6147338,-79.65812,-159.6773,0.25041378,-0.25142872,15.937954,1040000
70
+ 1.0,0.9999999,0.02719151,2.719151,1.0271914,0.9042786,-2.1968393,-81.15893,-183.03111,0.11093836,-0.16056733,10.782464,1045000
71
+ 1.0,1.0,0.02701093,2.7010932,1.0270109,1.4128466,-4.3406324,-77.748146,-184.98854,0.30421302,-0.20115529,18.96693,1050000
72
+ 1.0,1.0,0.02765151,2.765151,1.0276515,0.95665914,-1.3688016,-80.134514,-173.37038,0.26395774,-0.23297673,13.747454,1055000
73
+ 1.0,1.0,0.029585125,2.9585123,1.0295851,1.0679648,0.18483296,-77.2176,-192.59337,0.24571055,-0.2567013,14.612358,1060000
74
+ 1.0,1.0,0.030396588,3.039659,1.0303966,1.0406846,0.32557285,-80.286545,-177.6343,0.21649565,-0.32052448,16.109016,1065000
75
+ 1.0,1.0,0.029619988,2.961999,1.0296199,1.2090944,-2.5272548,-77.83218,-174.21747,0.8102204,-0.8210534,21.819508,1070000
76
+ 1.0,0.999979,0.027449377,2.7449377,1.0274284,3.2755487,1.126768,-75.49337,-189.9803,0.4095169,-0.37846842,27.248863,1075000
77
+ 1.0,1.0,0.02529833,2.529833,1.0252984,1.5418706,-2.3223994,-78.135414,-171.07039,0.32683542,-0.2806016,16.626844,1080000
78
+ 1.0,0.9999999,0.027583469,2.758347,1.0275834,1.0351157,-2.517568,-77.29214,-175.46005,0.19381997,-0.17104724,14.65946,1085000
79
+ 1.0,0.99999994,0.031600412,3.1600413,1.0316004,1.4023423,-3.4127834,-80.30568,-171.41876,0.29186824,-0.16235593,16.727196,1090000
80
+ 1.0,1.0,0.028274067,2.827407,1.028274,1.865008,-0.6285291,-80.52997,-151.57782,0.4490252,-0.4364411,22.35796,1095000
81
+ 1.0,0.99999994,0.027064253,2.7064252,1.0270642,1.507824,-2.5851905,-76.52153,-158.33723,0.20500986,-0.22814205,16.102036,1100000
82
+ 1.0,0.9999999,0.028742554,2.8742557,1.0287424,1.2553014,1.4708884,-75.56115,-171.08884,0.29467282,-0.27342802,16.758911,1105000
83
+ 1.0,1.0,0.029495358,2.9495358,1.0294954,1.2777443,0.7888876,-79.72372,-160.17538,0.2637516,-0.34863546,18.86536,1110000
84
+ 1.0,0.9998708,0.027508654,2.7508655,1.0273794,1.6125206,0.3692652,-75.64657,-154.85307,1.0941831,-0.9644186,34.665485,1115000
85
+ 1.0,1.0,0.030152982,3.0152981,1.030153,1.040396,-6.0905366,-76.780014,-170.88629,0.28726697,-0.34271675,15.039329,1120000
86
+ 1.0,0.99999994,0.028887948,2.888795,1.0288879,1.6480693,-0.17054968,-75.66206,-199.00504,0.42511237,-0.38465545,21.087162,1125000
87
+ 1.0,1.0,0.029454391,2.9454393,1.0294544,1.0771248,-1.322575,-74.613464,-160.23616,0.35133106,-0.1518932,12.889261,1130000
88
+ 1.0,1.0,0.029804919,2.980492,1.029805,1.2881039,-3.3112028,-79.90068,-194.5727,0.31301403,-0.35474843,14.968933,1135000
89
+ 1.0,1.0,0.030409262,3.040926,1.0304092,1.2675184,-2.688983,-76.21565,-181.85033,0.24351603,-0.26877475,16.333555,1140000
90
+ 1.0,0.99999994,0.028607497,2.8607497,1.0286075,0.89748573,-1.4188491,-76.49584,-162.9271,0.2783904,-0.17603634,14.859274,1145000
91
+ 1.0,1.0,0.027074602,2.70746,1.0270746,1.1294523,-1.7899525,-73.04853,-162.99664,0.31863987,-0.19803257,15.079624,1150000
92
+ 1.0,1.0,0.029681802,2.9681802,1.0296818,1.9695419,-2.108262,-74.33327,-171.06862,0.37476957,-0.27680868,19.034615,1155000
93
+ 1.0,1.0,0.028555876,2.8555875,1.0285559,2.1303303,-3.5725415,-74.94375,-146.90239,0.75409704,-0.35132116,22.388435,1160000
94
+ 1.0,1.0,0.030284062,3.0284061,1.030284,1.1267331,-2.288056,-73.69024,-156.80742,0.3308489,-0.2180911,16.713707,1165000
95
+ 1.0,1.0,0.02984085,2.9840848,1.0298408,3.4205728,-1.7871873,-73.80999,-144.09102,1.0866984,-0.8109901,51.804573,1170000
96
+ 1.0,1.0,0.026533606,2.6533606,1.0265336,1.1726216,-1.591659,-74.68691,-177.70525,0.10775562,-0.19501784,12.234542,1175000
97
+ 1.0,0.9999999,0.02900317,2.900317,1.029003,0.99650663,0.43385345,-74.2754,-154.4253,0.32021976,-0.19189504,12.104555,1180000
98
+ 1.0,1.0,0.02939372,2.939372,1.0293937,0.96631145,-1.4154615,-72.80747,-196.57823,0.23076247,-0.16846296,12.592501,1185000
99
+ 1.0,1.0,0.028377973,2.8377972,1.028378,0.9011642,-1.1906068,-74.05562,-162.45383,0.16990471,-0.28843552,13.40048,1190000
100
+ 1.0,1.0,0.02758477,2.7584772,1.0275848,1.1954025,-0.9842883,-70.669525,-175.0718,0.2895577,-0.42086715,15.298462,1195000
101
+ 1.0,1.0000001,0.027248101,2.7248101,1.0272483,1.1796162,-0.445978,-68.85748,-183.07611,0.3398074,-0.37641662,12.936899,1200000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 1.0,1.0,0.024012838,2.4012837,1.0240128,1.2723457,-24.662727,-105.29711,-185.35219,0.1526872,-0.095688134,8.740143,705000
3
+ 1.0,1.0,0.023707345,2.3707347,1.0237074,0.57563,-21.409925,-103.93418,-176.364,0.124592625,-0.1309376,7.901575,710000
4
+ 1.0,1.0,0.021445667,2.144567,1.0214456,0.94369525,-28.925314,-107.92338,-183.50214,0.29171798,-0.32674506,15.2024,715000
5
+ 1.0,1.0,0.021710001,2.1710002,1.02171,1.2623943,-27.273762,-107.90281,-195.46007,0.30311868,-0.3164054,13.47684,720000
6
+ 1.0,1.0,0.021689832,2.1689832,1.0216899,1.187218,-38.0472,-107.88372,-192.3461,0.12650031,-0.13121921,10.256374,725000
7
+ 1.0,1.0,0.02261357,2.261357,1.0226135,1.370944,-37.19675,-107.159294,-190.44743,0.36622426,-0.31513196,20.202456,730000
8
+ 1.0,1.0,0.022743465,2.2743468,1.0227435,1.3030539,-22.920933,-106.38744,-191.91328,0.43704677,-0.5308689,19.961607,735000
9
+ 1.0,1.0,0.023134911,2.3134913,1.023135,1.3013569,-31.241083,-105.46362,-181.18753,0.39850184,-0.41642624,18.882904,740000
10
+ 1.0,0.9999999,0.022217914,2.2217913,1.0222178,15.816063,-4.545556,-106.10779,-203.57996,0.8917403,-0.9023798,69.60323,745000
11
+ 1.0,0.99999994,0.025379065,2.5379066,1.0253791,1.5135564,-1.7106844,-103.20542,-179.71254,0.55518377,-0.5701973,29.989235,750000
12
+ 1.0,1.0,0.024754705,2.4754705,1.0247548,1.0268643,-11.461878,-102.24599,-195.19115,0.2204624,-0.21521577,13.575521,755000
13
+ 1.0,0.99999994,0.025807545,2.5807543,1.0258075,1.3389372,-4.798184,-100.192986,-185.30006,0.1803965,-0.3550552,16.726248,760000
14
+ 1.0,1.0,0.024380768,2.438077,1.0243808,1.3034371,-14.634602,-97.91239,-192.23311,0.41207725,-0.44214237,18.508484,765000
15
+ 1.0,1.0,0.025879923,2.5879922,1.02588,5.1159167,-14.520742,-94.81141,-204.06117,0.43491724,-0.37131694,26.403204,770000
16
+ 1.0,1.0,0.027208291,2.720829,1.0272083,1.455141,-2.9311323,-96.06028,-190.6495,0.38222775,-0.42751676,19.495255,775000
17
+ 1.0,1.0,0.028343529,2.8343527,1.0283436,1.2564484,-4.0549994,-94.173256,-179.43459,0.2945637,-0.1377712,16.378197,780000
18
+ 1.0,1.0,0.02620868,2.6208682,1.0262086,1.1520796,-2.7153132,-95.87205,-193.40872,0.1848624,-0.13725185,15.162318,785000
19
+ 1.0,1.0,0.028331881,2.8331883,1.0283319,1.2493715,-4.2247844,-95.35549,-187.41042,0.1549953,-0.15605935,14.706223,790000
20
+ 1.0,0.99999994,0.027650537,2.7650535,1.0276505,1.51111,-4.0733714,-93.49097,-187.895,0.31820005,-0.20418857,17.69716,795000
21
+ 1.0,1.0,0.026879538,2.687954,1.0268795,1.1600558,-1.0246199,-89.64431,-165.19139,0.27406466,-0.11211168,14.886754,800000
22
+ 1.0,1.0,0.028145652,2.8145654,1.0281457,1.0951366,-5.804304,-93.18801,-185.3236,0.2797567,-0.16926031,13.477581,805000
23
+ 1.0,1.0,0.026933746,2.6933746,1.0269338,1.160848,-0.13398013,-92.82406,-159.06303,0.09052866,-0.23654807,12.004321,810000
24
+ 1.0,0.9999482,0.027906943,2.7906947,1.0278552,1.1321156,1.1132469,-89.17222,-173.7459,0.1684756,-0.15176775,13.733924,815000
25
+ 1.0,1.0000001,0.028558536,2.8558536,1.0285586,1.598738,-9.57521,-90.41593,-170.23042,0.19958007,-0.37521458,21.522892,820000
26
+ 1.0,0.99999994,0.027587354,2.7587357,1.0275873,1.1488405,-5.830238,-90.32376,-165.724,0.18674333,-0.20193203,13.69313,825000
27
+ 1.0,1.0,0.028519005,2.8519006,1.028519,1.4919982,-0.26551977,-91.311104,-175.01666,0.2380815,-0.21282303,18.195503,830000
28
+ 1.0,0.99991584,0.028381238,2.8381238,1.0282971,0.9269621,1.8265023,-90.30597,-169.50179,0.15068623,-0.22912535,12.916338,835000
29
+ 1.0,0.99999994,0.029831605,2.9831607,1.0298315,3.357578,-7.9902587,-86.33682,-167.55916,0.5330514,-0.59384537,35.54627,840000
30
+ 1.0,1.0,0.02840748,2.8407478,1.0284075,1.3195412,-5.6388235,-89.75706,-196.29399,0.12191413,-0.17293268,13.512232,845000
31
+ 1.0,1.0,0.027947836,2.7947834,1.0279478,1.1123797,-1.090759,-88.21664,-187.01724,0.16956486,-0.3363493,16.65753,850000
32
+ 1.0,1.0,0.027949307,2.7949307,1.0279493,1.8840573,-6.319189,-87.863014,-187.52267,0.24761726,-0.37375957,22.993511,855000
33
+ 1.0,1.0,0.02857348,2.857348,1.0285735,1.5124453,-4.017386,-90.4908,-187.51408,0.24783431,-0.4442185,19.346916,860000
34
+ 1.0,1.0,0.028072929,2.807293,1.028073,1.0615629,-1.3906708,-87.02603,-182.02057,0.35503715,-0.3527348,17.937408,865000
35
+ 1.0,0.99998295,0.029781995,2.9781997,1.0297649,1.5408785,0.8411551,-86.66303,-189.05011,0.21484037,-0.19484034,17.868538,870000
36
+ 1.0,1.0,0.028663471,2.8663473,1.0286635,1.2389568,-0.7721813,-90.15779,-184.09096,0.10674888,-0.14631559,11.288504,875000
37
+ 1.0,1.0,0.027509792,2.7509794,1.0275098,1.3351091,0.17237698,-87.42756,-193.55305,0.43300843,-0.47023168,17.957443,880000
38
+ 1.0,1.0,0.02880209,2.880209,1.028802,1.1192135,-4.4047194,-83.28618,-162.6812,0.15110199,-0.273574,14.277037,885000
39
+ 1.0,1.0,0.027743874,2.7743874,1.0277438,1.3349017,-2.6192358,-82.86458,-201.68796,0.21840008,-0.27212664,18.265041,890000
40
+ 1.0,0.99999994,0.028557446,2.8557446,1.0285574,1.0260231,-0.92979515,-85.89008,-196.98602,0.15248533,-0.37137547,16.83471,895000
41
+ 1.0,1.0,0.028781444,2.8781445,1.0287814,1.7520306,-2.6716874,-83.56286,-199.63364,0.29224885,-0.30344552,18.16819,900000
42
+ 1.0,1.0,0.028700247,2.8700252,1.0287002,0.956798,1.7310927,-84.246925,-168.9958,0.23966132,-0.23269057,13.323522,905000
43
+ 1.0,1.0,0.028465884,2.8465886,1.0284659,1.1331698,-2.3298173,-85.93447,-167.68211,0.32857147,-0.37641168,17.80765,910000
44
+ 1.0,1.0,0.028369656,2.8369656,1.0283697,1.0912105,1.5263796,-83.59518,-186.4214,0.31856316,-0.1470359,16.350925,915000
45
+ 1.0,1.0000001,0.027730804,2.7730803,1.027731,1.564505,0.24879187,-83.18184,-184.5336,0.5704717,-0.5377143,22.763288,920000
46
+ 1.0,1.0,0.029524812,2.9524813,1.0295248,1.4130989,-0.23850597,-84.09878,-167.06125,0.23170128,-0.19484165,18.21174,925000
47
+ 1.0,1.0,0.030538704,3.0538707,1.0305387,1.4501625,-2.701228,-84.68267,-171.29672,0.54826343,-0.54156107,17.908714,930000
48
+ 1.0,1.0,0.028250806,2.8250806,1.0282508,1.466508,1.2978963,-82.19287,-171.39853,0.30140448,-0.15948565,15.481417,935000
49
+ 1.0,0.9999229,0.027275976,2.7275977,1.0271988,1.3917176,1.7950208,-84.8374,-184.55214,0.2703735,-0.23539652,19.753155,940000
50
+ 1.0,1.0,0.030505903,3.0505905,1.0305059,1.1502289,-5.643862,-85.479645,-179.82677,0.14381987,-0.43954343,19.067928,945000
51
+ 1.0,1.0,0.0258137,2.58137,1.0258137,2.89737,0.9131657,-77.84419,-186.56885,0.4433033,-0.31167126,27.10165,950000
52
+ 1.0,1.0,0.02875876,2.8758762,1.0287588,1.255955,-0.83540833,-84.54818,-181.79503,0.33612266,-0.34618255,16.592096,955000
53
+ 1.0,0.99999505,0.029632924,2.9632924,1.0296279,1.0571977,1.4050438,-81.5748,-180.69098,0.2304138,-0.21569042,14.098614,960000
54
+ 1.0,1.0,0.029349979,2.9349978,1.0293499,1.1782897,-5.8922925,-81.81655,-200.74324,0.19837955,-0.20909712,15.862142,965000
55
+ 1.0,1.0,0.02783557,2.7835574,1.0278356,0.9220519,-6.096468,-81.83041,-161.69658,0.14673844,-0.154044,12.447058,970000
56
+ 1.0,1.0000001,0.02637513,2.6375132,1.0263753,1.1732345,-1.8829153,-81.57527,-201.88097,0.3029332,-0.21158093,16.1036,975000
57
+ 1.0,1.0,0.02802156,2.802156,1.0280216,0.95352507,-3.1705449,-82.65246,-185.30136,0.19359645,-0.16939348,11.208377,980000
58
+ 1.0,1.0,0.029657496,2.9657497,1.0296575,1.4957966,0.017994478,-80.607506,-170.46194,0.21292496,-0.3869986,17.675045,985000
59
+ 1.0,1.0,0.028041875,2.8041875,1.0280418,1.5556835,-2.5521023,-79.334526,-187.42195,0.4586102,-0.31144822,21.023714,990000
60
+ 1.0,1.0,0.02829137,2.829137,1.0282913,1.3142264,0.6155375,-79.31854,-178.30893,0.5995166,-0.6327397,23.166058,995000
61
+ 1.0,1.0,0.026534284,2.6534286,1.0265343,1.6561803,-4.212124,-81.98434,-173.1492,0.31248426,-0.4481518,20.72166,1000000
62
+ 1.0,1.0,0.030182008,3.0182009,1.030182,1.1862125,-5.7683887,-84.4824,-174.07268,0.31856415,-0.23030755,16.205898,1005000
63
+ 1.0,0.99999994,0.03004419,3.0044193,1.0300441,1.1586212,-5.5077353,-79.120094,-174.0701,0.34982383,-0.23077941,14.599337,1010000
64
+ 1.0,1.0,0.027140193,2.7140193,1.0271401,1.1860598,-1.3777947,-79.19021,-158.81319,0.42857862,-0.43100813,17.898163,1015000
65
+ 1.0,1.0,0.028470434,2.8470435,1.0284704,0.861907,0.8567828,-78.9825,-167.24942,0.17467666,-0.13387677,10.987938,1020000
66
+ 1.0,1.0,0.02895967,2.895967,1.0289596,1.0698975,0.12888281,-79.87421,-184.14401,0.258761,-0.2528072,13.034304,1025000
67
+ 1.0,1.0,0.02832482,2.8324819,1.0283248,1.5477357,-1.8458403,-79.95991,-164.2332,0.27233574,-0.311223,18.863976,1030000
68
+ 1.0,1.0,0.02892049,2.8920493,1.0289205,1.2520822,-1.5454396,-78.85424,-198.42805,0.13739352,-0.27068868,14.510336,1035000
69
+ 1.0,1.0,0.028910423,2.8910422,1.0289104,1.0282582,-1.6147338,-79.65812,-159.6773,0.25041378,-0.25142872,15.937954,1040000
70
+ 1.0,0.9999999,0.02719151,2.719151,1.0271914,0.9042786,-2.1968393,-81.15893,-183.03111,0.11093836,-0.16056733,10.782464,1045000
71
+ 1.0,1.0,0.02701093,2.7010932,1.0270109,1.4128466,-4.3406324,-77.748146,-184.98854,0.30421302,-0.20115529,18.96693,1050000
72
+ 1.0,1.0,0.02765151,2.765151,1.0276515,0.95665914,-1.3688016,-80.134514,-173.37038,0.26395774,-0.23297673,13.747454,1055000
73
+ 1.0,1.0,0.029585125,2.9585123,1.0295851,1.0679648,0.18483296,-77.2176,-192.59337,0.24571055,-0.2567013,14.612358,1060000
74
+ 1.0,1.0,0.030396588,3.039659,1.0303966,1.0406846,0.32557285,-80.286545,-177.6343,0.21649565,-0.32052448,16.109016,1065000
75
+ 1.0,1.0,0.029619988,2.961999,1.0296199,1.2090944,-2.5272548,-77.83218,-174.21747,0.8102204,-0.8210534,21.819508,1070000
76
+ 1.0,0.999979,0.027449377,2.7449377,1.0274284,3.2755487,1.126768,-75.49337,-189.9803,0.4095169,-0.37846842,27.248863,1075000
77
+ 1.0,1.0,0.02529833,2.529833,1.0252984,1.5418706,-2.3223994,-78.135414,-171.07039,0.32683542,-0.2806016,16.626844,1080000
78
+ 1.0,0.9999999,0.027583469,2.758347,1.0275834,1.0351157,-2.517568,-77.29214,-175.46005,0.19381997,-0.17104724,14.65946,1085000
79
+ 1.0,0.99999994,0.031600412,3.1600413,1.0316004,1.4023423,-3.4127834,-80.30568,-171.41876,0.29186824,-0.16235593,16.727196,1090000
80
+ 1.0,1.0,0.028274067,2.827407,1.028274,1.865008,-0.6285291,-80.52997,-151.57782,0.4490252,-0.4364411,22.35796,1095000
81
+ 1.0,0.99999994,0.027064253,2.7064252,1.0270642,1.507824,-2.5851905,-76.52153,-158.33723,0.20500986,-0.22814205,16.102036,1100000
82
+ 1.0,0.9999999,0.028742554,2.8742557,1.0287424,1.2553014,1.4708884,-75.56115,-171.08884,0.29467282,-0.27342802,16.758911,1105000
83
+ 1.0,1.0,0.029495358,2.9495358,1.0294954,1.2777443,0.7888876,-79.72372,-160.17538,0.2637516,-0.34863546,18.86536,1110000
84
+ 1.0,0.9998708,0.027508654,2.7508655,1.0273794,1.6125206,0.3692652,-75.64657,-154.85307,1.0941831,-0.9644186,34.665485,1115000
85
+ 1.0,1.0,0.030152982,3.0152981,1.030153,1.040396,-6.0905366,-76.780014,-170.88629,0.28726697,-0.34271675,15.039329,1120000
86
+ 1.0,0.99999994,0.028887948,2.888795,1.0288879,1.6480693,-0.17054968,-75.66206,-199.00504,0.42511237,-0.38465545,21.087162,1125000
87
+ 1.0,1.0,0.029454391,2.9454393,1.0294544,1.0771248,-1.322575,-74.613464,-160.23616,0.35133106,-0.1518932,12.889261,1130000
88
+ 1.0,1.0,0.029804919,2.980492,1.029805,1.2881039,-3.3112028,-79.90068,-194.5727,0.31301403,-0.35474843,14.968933,1135000
89
+ 1.0,1.0,0.030409262,3.040926,1.0304092,1.2675184,-2.688983,-76.21565,-181.85033,0.24351603,-0.26877475,16.333555,1140000
90
+ 1.0,0.99999994,0.028607497,2.8607497,1.0286075,0.89748573,-1.4188491,-76.49584,-162.9271,0.2783904,-0.17603634,14.859274,1145000
91
+ 1.0,1.0,0.027074602,2.70746,1.0270746,1.1294523,-1.7899525,-73.04853,-162.99664,0.31863987,-0.19803257,15.079624,1150000
92
+ 1.0,1.0,0.029681802,2.9681802,1.0296818,1.9695419,-2.108262,-74.33327,-171.06862,0.37476957,-0.27680868,19.034615,1155000
93
+ 1.0,1.0,0.028555876,2.8555875,1.0285559,2.1303303,-3.5725415,-74.94375,-146.90239,0.75409704,-0.35132116,22.388435,1160000
94
+ 1.0,1.0,0.030284062,3.0284061,1.030284,1.1267331,-2.288056,-73.69024,-156.80742,0.3308489,-0.2180911,16.713707,1165000
95
+ 1.0,1.0,0.02984085,2.9840848,1.0298408,3.4205728,-1.7871873,-73.80999,-144.09102,1.0866984,-0.8109901,51.804573,1170000
96
+ 1.0,1.0,0.026533606,2.6533606,1.0265336,1.1726216,-1.591659,-74.68691,-177.70525,0.10775562,-0.19501784,12.234542,1175000
97
+ 1.0,0.9999999,0.02900317,2.900317,1.029003,0.99650663,0.43385345,-74.2754,-154.4253,0.32021976,-0.19189504,12.104555,1180000
98
+ 1.0,1.0,0.02939372,2.939372,1.0293937,0.96631145,-1.4154615,-72.80747,-196.57823,0.23076247,-0.16846296,12.592501,1185000
99
+ 1.0,1.0,0.028377973,2.8377972,1.028378,0.9011642,-1.1906068,-74.05562,-162.45383,0.16990471,-0.28843552,13.40048,1190000
100
+ 1.0,1.0,0.02758477,2.7584772,1.0275848,1.1954025,-0.9842883,-70.669525,-175.0718,0.2895577,-0.42086715,15.298462,1195000
101
+ 1.0,1.0000001,0.027248101,2.7248101,1.0272483,1.1796162,-0.445978,-68.85748,-183.07611,0.3398074,-0.37641662,12.936899,1200000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1000000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d295c1e58f47b1cc31e035a98ece9f60c77fd6c678ea2c7d2c2e1bf9f765fa93
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1050000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65cf1e4e22e87e92da487bc5ff1991548a8f39ef22c10c4860b126925b4ccc27
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1100000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2813dbebb083d8e45c75634a3db5548d37a0b759f80dde601100f6b17f419eb3
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28708428c4a3788ab8d8635ae46e8f47ed5900271b6878d61fb15e58ed5ed779
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_1200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e7ad4a8bfc7f68695f12481161362e8d04e837f3dfd2676376bcf316d8b77e1
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b620ec1e384050f732bebd61e6c6327d0f8d52d1f7d2d00d7b247bdd2425070
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd581d6bda213c67227430f371c734a2520abd6966fca871759d2ecc0e49554c
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11321eb48d783ebbe42f142482b9e728a6eddfb4a1aefbc8c8d9f613b7f11ec2
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bcbb9fc9a8468acf2192d51027cd2b004e5d4a9e3b1851a9b64396343ff36d4
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/params_950000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b00f464d8adc3d523867fb600b57e8c32c261e3bfdb3cf38981bc1f7c00c39f1
3
+ size 217655954
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_172917/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/3exn81fp