Tiredsheep commited on
Commit
46bc1e1
·
verified ·
1 Parent(s): 3f3ccce

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_1000000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_550000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_600000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_650000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_700000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_750000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_800000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_850000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_900000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_950000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.058051539590106796,-0.009714371814203693,-0.057889270375573745,0.0042440759890497995,6.2861072216726,47.85500000001435,0.06,24321.74,-0.96,-956.06,955.1,2.7791292762756346,550000
3
+ 0.0,0.0,-0.06903038612869271,0.0012719866174974303,-0.06928653970464389,-0.008178191281581837,3.9092299809013085,49.75000000001484,0.02,75241.0,-1.0,-1013.36,993.0,2.9026382112503053,600000
4
+ 0.0,0.0,-0.0692712832279847,-0.007781982006638175,-0.06970682207603954,-0.007198182310800074,4.000715022112355,50.10000000001527,0.0,126905.0,-1.0,-1000.0,1000.0,2.9354470014572143,650000
5
+ 0.0,0.0,-0.0735685004609191,-0.004411416515282266,-0.07398208625359835,-0.011016057546417109,5.9439652168045525,49.17800000001438,0.06,178401.9,-0.94,-981.5,981.56,2.906328320503235,700000
6
+ 0.0,0.0,-0.08493163571601378,0.010807766251753307,-0.08464450219013989,0.003722805954382937,5.796150764975926,48.48000000001412,0.08,229579.04,-0.98,-984.18,967.6,2.856766018867493,750000
7
+ 0.0,0.0,-0.06058980671556299,0.0024107077192007044,-0.060400592035991275,0.0014193203490672156,5.308694093934771,49.99000000001514,0.04,280277.4,-1.0,-1026.18,997.8,2.9398497200012206,800000
8
+ 0.0,0.0,-0.07423456565467518,-0.015134163634005757,-0.07489799647980801,-0.01195842906431555,3.5681022511657994,48.1000000000139,0.08,331076.92,-0.92,-959.92,960.0,2.8190100955963135,850000
9
+ 0.0,0.0,-0.04575368260974698,0.005312171266863164,-0.04598667611023551,-0.0022432383272939557,3.174731037779891,47.96900000001425,0.06,381266.42,-0.94,-957.32,957.38,2.809519300460815,900000
10
+ 0.0,0.0,-0.06925384355080605,-0.003300019334835147,-0.06931932821479979,-0.0010701771407658532,8.027126787838144,42.19300000001206,0.2,429153.68,-0.8,-841.66,841.86,2.471133704185486,950000
11
+ 0.0,0.0,-0.06957097951040804,0.003072593061179909,-0.07053221759715667,-0.014584333385815568,7.471131835787796,45.35600000001309,0.16,472732.86,-0.88,-924.12,905.12,2.678335452079773,1000000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.058051539590106796,-0.009714371814203693,-0.057889270375573745,0.0042440759890497995,6.2861072216726,47.85500000001435,0.06,24321.74,-0.96,-956.06,955.1,2.7791292762756346,550000
3
+ 0.0,0.0,-0.06903038612869271,0.0012719866174974303,-0.06928653970464389,-0.008178191281581837,3.9092299809013085,49.75000000001484,0.02,75241.0,-1.0,-1013.36,993.0,2.9026382112503053,600000
4
+ 0.0,0.0,-0.0692712832279847,-0.007781982006638175,-0.06970682207603954,-0.007198182310800074,4.000715022112355,50.10000000001527,0.0,126905.0,-1.0,-1000.0,1000.0,2.9354470014572143,650000
5
+ 0.0,0.0,-0.0735685004609191,-0.004411416515282266,-0.07398208625359835,-0.011016057546417109,5.9439652168045525,49.17800000001438,0.06,178401.9,-0.94,-981.5,981.56,2.906328320503235,700000
6
+ 0.0,0.0,-0.08493163571601378,0.010807766251753307,-0.08464450219013989,0.003722805954382937,5.796150764975926,48.48000000001412,0.08,229579.04,-0.98,-984.18,967.6,2.856766018867493,750000
7
+ 0.0,0.0,-0.06058980671556299,0.0024107077192007044,-0.060400592035991275,0.0014193203490672156,5.308694093934771,49.99000000001514,0.04,280277.4,-1.0,-1026.18,997.8,2.9398497200012206,800000
8
+ 0.0,0.0,-0.07423456565467518,-0.015134163634005757,-0.07489799647980801,-0.01195842906431555,3.5681022511657994,48.1000000000139,0.08,331076.92,-0.92,-959.92,960.0,2.8190100955963135,850000
9
+ 0.0,0.0,-0.04575368260974698,0.005312171266863164,-0.04598667611023551,-0.0022432383272939557,3.174731037779891,47.96900000001425,0.06,381266.42,-0.94,-957.32,957.38,2.809519300460815,900000
10
+ 0.0,0.0,-0.06925384355080605,-0.003300019334835147,-0.06931932821479979,-0.0010701771407658532,8.027126787838144,42.19300000001206,0.2,429153.68,-0.8,-841.66,841.86,2.471133704185486,950000
11
+ 0.0,0.0,-0.06957097951040804,0.003072593061179909,-0.07053221759715667,-0.014584333385815568,7.471131835787796,45.35600000001309,0.16,472732.86,-0.88,-924.12,905.12,2.678335452079773,1000000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 1.0,0.99999994,0.007396961,0.73969615,1.0073969,3.968153,-136.70201,-279.35425,-307.91046,2.4079533,-2.1559212,63.133064,505000
3
+ 1.0,1.0,0.008048757,0.80487573,1.0080488,1.8152279,-146.13803,-276.42273,-307.14557,0.67230934,-0.7321273,32.235985,510000
4
+ 1.0,1.0000001,0.007615964,0.76159644,1.007616,2.5992181,-127.10021,-271.91672,-308.4174,0.5601063,-0.65795135,42.29136,515000
5
+ 1.0,0.99999994,0.007572887,0.7572887,1.0075728,2.4609373,-169.41626,-278.45728,-308.20456,1.3660331,-1.2916882,44.43788,520000
6
+ 1.0,0.9999999,0.007833958,0.78339577,1.0078338,2.1340358,-108.84383,-277.76572,-306.9331,0.6318604,-0.6971867,35.894817,525000
7
+ 1.0,0.9999894,0.006865694,0.68656945,1.0068551,3.6994,2.40514,-276.6747,-307.49695,4.7780433,-2.0950255,85.88197,530000
8
+ 1.0,1.0,0.0075504403,0.75504404,1.0075505,1.9613632,-107.37689,-280.77756,-308.8597,0.2805871,-0.34039742,29.635174,535000
9
+ 1.0,1.0000001,0.0073400205,0.73400205,1.0073402,2.123347,-101.69337,-276.76187,-307.00964,0.45221895,-0.5777211,33.553787,540000
10
+ 1.0,1.0,0.0069027646,0.6902765,1.0069028,2.003095,-100.04296,-278.99112,-307.73236,0.3259119,-0.42186368,29.187613,545000
11
+ 1.0,1.0,0.007207052,0.7207053,1.007207,1.9346548,-102.69283,-276.02704,-307.75305,0.97085214,-0.6119304,33.751427,550000
12
+ 1.0,1.0,0.0070777354,0.70777357,1.0070777,1.8755153,-101.30759,-274.5611,-307.79077,0.32899928,-0.5940442,28.571743,555000
13
+ 1.0,0.9999999,0.007896065,0.7896065,1.007896,2.099874,-100.6079,-276.0327,-309.53592,0.3586638,-0.39859983,29.088385,560000
14
+ 1.0,1.0,0.007866342,0.7866341,1.0078664,2.2232425,-101.765396,-276.64624,-307.96524,0.8219118,-0.60632586,36.566643,565000
15
+ 1.0,1.0,0.008125585,0.81255853,1.0081255,1.889876,-101.124695,-270.4195,-307.45267,0.33296663,-0.25732714,25.359245,570000
16
+ 1.0,1.0,0.008259395,0.82593954,1.0082594,2.8119895,-34.6264,-267.18588,-308.71042,2.0696084,-1.5094155,53.34698,575000
17
+ 1.0,1.0000001,0.008385367,0.8385366,1.0083855,2.3795764,-100.93347,-270.17285,-306.89246,0.7550418,-1.3182652,39.393345,580000
18
+ 1.0,0.99999994,0.008190772,0.8190772,1.0081908,1.9120411,-94.144104,-271.1406,-307.13397,0.4390317,-0.5713517,28.490772,585000
19
+ 1.0,1.0,0.0075050155,0.7505016,1.007505,1.7746403,-101.2742,-272.85043,-307.54507,0.3922326,-0.27956307,26.064026,590000
20
+ 1.0,0.9999998,0.008414587,0.8414587,1.0084144,1.8932583,-100.04456,-273.14786,-307.02246,0.5445146,-0.47613433,34.230637,595000
21
+ 1.0,1.0,0.0073146266,0.7314627,1.0073147,2.5382822,-99.86018,-269.5482,-308.18582,0.750116,-1.0597526,38.690456,600000
22
+ 1.0,0.9999999,0.0072612506,0.7261251,1.0072612,1.8565506,-99.873215,-273.5824,-305.9784,0.36168864,-0.34017846,28.51985,605000
23
+ 1.0,1.0,0.007933683,0.7933682,1.0079337,2.288739,-100.54296,-274.9977,-307.68933,1.575415,-0.8435814,46.26982,610000
24
+ 1.0,0.9999999,0.007259953,0.7259953,1.0072598,2.0974853,-98.141464,-268.37558,-307.885,0.52424204,-0.5949646,31.458546,615000
25
+ 1.0,1.0000001,0.007133987,0.7133987,1.0071341,1.955512,-100.14969,-267.80005,-307.15253,0.95347744,-1.1586851,33.226086,620000
26
+ 1.0,1.0,0.007198617,0.7198617,1.0071986,2.1956365,-100.76039,-274.42172,-307.01877,0.9136755,-0.56140924,39.165024,625000
27
+ 1.0,0.99999994,0.0075774817,0.7577482,1.0075774,1.9286139,-100.711876,-272.80127,-306.73483,0.40352225,-0.47541398,29.531387,630000
28
+ 1.0,0.99999994,0.006997576,0.6997576,1.0069975,2.2693758,-101.02249,-272.2158,-306.822,4.1708326,-4.7313585,83.45372,635000
29
+ 1.0,1.0,0.007845145,0.7845144,1.0078452,1.8133625,-100.691536,-268.57745,-306.41077,0.6015786,-0.53079534,34.60227,640000
30
+ 1.0,1.0000001,0.0081526255,0.8152625,1.0081527,1.8174294,-100.615204,-267.2517,-306.41388,0.99178773,-1.458635,35.58221,645000
31
+ 1.0,1.0,0.007124742,0.7124742,1.0071248,2.0110447,-100.13889,-270.267,-307.40567,0.4672503,-0.6103318,34.564445,650000
32
+ 1.0,1.0,0.0072615063,0.7261507,1.0072615,1.5666474,-100.3726,-270.75122,-307.63843,0.2523687,-0.3787462,24.498001,655000
33
+ 1.0,1.0,0.0070333667,0.7033367,1.0070333,2.3751342,-99.82209,-265.0137,-309.06387,0.6647452,-0.5296116,35.800404,660000
34
+ 1.0,1.0000001,0.008400537,0.8400537,1.0084007,2.138152,-100.4167,-267.77805,-307.65417,0.48520595,-0.5644812,30.84504,665000
35
+ 1.0,0.99999994,0.008119814,0.8119814,1.0081197,6.470164,-100.584236,-266.3355,-307.03577,4.4926066,-4.7861514,147.30148,670000
36
+ 1.0,0.9999999,0.007903293,0.7903293,1.0079032,1.8297844,-100.340515,-267.1866,-306.6495,0.57480764,-0.37293774,30.854841,675000
37
+ 1.0,1.0,0.008458397,0.84583974,1.0084584,2.3464537,-100.80573,-266.3547,-306.95648,2.2611427,-1.9853977,52.08563,680000
38
+ 1.0,1.0,0.007299325,0.72993255,1.0072993,1.8319899,-100.654495,-262.67953,-307.17847,0.35021394,-0.5536397,30.868181,685000
39
+ 1.0,1.0000001,0.007996542,0.7996543,1.0079967,1.5019563,-100.23745,-265.17538,-307.31482,0.47299358,-0.62591803,24.452997,690000
40
+ 1.0,1.0000001,0.0077168737,0.7716873,1.007717,2.0608566,-100.08418,-269.61813,-306.57367,0.3778512,-0.748732,33.634243,695000
41
+ 1.0,0.99999994,0.008435283,0.8435284,1.0084352,2.291792,-100.67912,-263.2044,-306.51068,0.5672797,-0.6457275,38.342472,700000
42
+ 1.0,1.0,0.008764412,0.8764412,1.0087644,2.0127425,-96.87042,-263.19492,-306.81784,0.7026994,-0.52072954,36.755356,705000
43
+ 1.0,1.0,0.007945934,0.7945936,1.0079459,2.084535,-99.69593,-265.78513,-306.35785,1.1091021,-0.43898332,35.77311,710000
44
+ 1.0,0.9999998,0.0077437493,0.77437496,1.0077436,1.8151817,-100.29158,-261.82397,-307.72144,0.6835909,-0.39732444,28.069195,715000
45
+ 1.0,1.0,0.0080063585,0.8006359,1.0080063,1.7931212,-21.051516,-267.22412,-306.91537,0.5408041,-0.28676254,29.282978,720000
46
+ 1.0,1.0,0.007369361,0.7369361,1.0073694,2.903956,-100.609406,-268.40308,-307.29437,1.0712274,-0.6221457,48.253044,725000
47
+ 1.0,1.0000001,0.008080055,0.8080055,1.0080801,3.581413,-100.75393,-268.0486,-308.1371,0.5838383,-0.995267,43.403915,730000
48
+ 1.0,0.99999994,0.007578984,0.75789845,1.007579,1.351052,-43.972958,-266.03415,-306.62823,0.54327047,-0.22874418,21.856956,735000
49
+ 1.0,1.0,0.0076707257,0.7670726,1.0076708,1.9451655,-100.11214,-267.83917,-306.86343,0.40335816,-0.28425616,27.047321,740000
50
+ 1.0,0.9999999,0.0077339,0.77339005,1.0077338,1.3873252,-100.67105,-260.0399,-306.68732,0.63812256,-0.43469554,25.8509,745000
51
+ 1.0,1.0,0.007613639,0.7613639,1.0076137,2.046611,-100.82102,-271.85263,-307.498,5.158666,-5.1582675,65.71833,750000
52
+ 1.0,1.0,0.006823267,0.6823267,1.0068233,1.7851114,-100.258965,-263.2427,-306.7119,0.95263237,-0.4286154,28.62216,755000
53
+ 1.0,0.9999999,0.007040728,0.70407283,1.0070406,1.9014677,-100.49715,-265.5795,-306.71466,0.7659905,-0.8448128,39.322136,760000
54
+ 1.0,1.0,0.007701124,0.7701124,1.0077012,1.5628251,-97.51721,-264.7893,-306.65338,0.3072752,-0.3337128,25.963793,765000
55
+ 1.0,1.0,0.0072311414,0.72311413,1.0072311,1.6316884,-99.0343,-267.05505,-306.64923,0.5680131,-0.6124497,28.744928,770000
56
+ 1.0,1.0,0.007569814,0.7569814,1.0075698,1.843474,-40.912937,-261.12708,-307.44788,0.40425754,-0.4317653,26.021439,775000
57
+ 1.0,0.99999994,0.007816406,0.78164065,1.0078163,1.659483,-100.66247,-261.66977,-307.2629,0.2725393,-0.7753077,28.035254,780000
58
+ 1.0,1.0,0.0071961256,0.71961254,1.0071961,1.6632931,-100.55968,-266.7285,-306.57758,0.3950683,-0.32358283,23.531609,785000
59
+ 1.0,1.0,0.007891433,0.7891433,1.0078914,1.5964974,-100.70107,-260.42813,-307.47577,0.42943567,-0.6739689,27.686356,790000
60
+ 1.0,1.0,0.008059664,0.8059664,1.0080596,1.2890654,-99.58843,-266.4476,-306.45813,0.841638,-0.8311934,24.977379,795000
61
+ 1.0,0.99999994,0.008182872,0.81828725,1.0081828,1.6687214,-100.379524,-260.7599,-306.2004,0.50999093,-0.649148,31.366928,800000
62
+ 1.0,0.99999994,0.007508847,0.7508847,1.0075088,1.4736481,-98.55538,-260.5425,-306.26346,0.83698,-0.7837655,32.775475,805000
63
+ 1.0,0.99999994,0.008550283,0.8550283,1.0085502,1.5123811,-100.15986,-259.15762,-306.50253,0.66393846,-0.34845728,25.221977,810000
64
+ 1.0,1.0,0.008746498,0.8746499,1.0087465,2.3193989,-100.76847,-255.98753,-307.47388,0.52779025,-0.6635053,35.215927,815000
65
+ 1.0,1.0,0.006724396,0.6724396,1.0067244,1.620101,-70.66515,-251.96284,-307.76523,0.6240629,-2.1127434,35.17873,820000
66
+ 1.0,0.99999994,0.007970024,0.79700243,1.00797,1.8205235,-100.41714,-262.72583,-307.72574,0.81670237,-0.49110055,29.000164,825000
67
+ 1.0,1.0,0.0076911235,0.7691124,1.0076911,1.7489058,-95.15194,-257.60153,-306.25278,0.45949557,-0.32406172,25.127995,830000
68
+ 1.0,0.9999998,0.007943465,0.7943466,1.0079433,1.2762903,-99.07161,-257.8607,-306.7122,0.1778484,-0.29549223,22.50092,835000
69
+ 1.0,0.9999999,0.008444082,0.8444083,1.008444,1.6080235,-98.5555,-264.84833,-306.57248,0.79933363,-0.19287735,24.562849,840000
70
+ 1.0,0.99999994,0.0076494683,0.7649468,1.0076494,1.9069397,-100.644516,-265.9293,-306.86868,0.7347599,-0.4431768,29.849064,845000
71
+ 1.0,0.99999994,0.00807463,0.80746305,1.0080745,1.567407,-100.51904,-256.916,-307.50696,0.40426755,-0.35422248,22.831388,850000
72
+ 1.0,1.0000001,0.008369176,0.8369176,1.0083693,2.0169888,-100.07935,-259.6963,-306.50067,0.44342816,-0.63660526,30.164015,855000
73
+ 1.0,1.0000001,0.007520531,0.7520531,1.0075207,4.600072,-81.32264,-258.48486,-306.41852,4.8027277,-9.431124,140.00635,860000
74
+ 1.0,1.0000001,0.0069423495,0.69423497,1.0069425,1.3181337,-76.283165,-262.23825,-307.3291,0.5964843,-0.23853786,20.201857,865000
75
+ 1.0,0.9999999,0.0083329715,0.83329725,1.0083328,1.1287673,-98.670784,-253.82408,-306.64526,0.4527012,-0.27471164,19.082123,870000
76
+ 1.0,0.9999999,0.0070878053,0.7087805,1.0070877,1.580825,-99.6263,-262.14648,-306.2462,0.49521253,-0.4249605,26.11988,875000
77
+ 1.0,1.0,0.007735015,0.77350146,1.007735,1.5817844,-61.33023,-260.27658,-306.33292,0.28319052,-0.38439813,25.618252,880000
78
+ 1.0,1.0,0.007619445,0.76194453,1.0076195,1.5382749,-48.72706,-258.65994,-306.4709,0.34095567,-0.35643655,25.635258,885000
79
+ 1.0,1.0,0.007705211,0.77052116,1.0077052,1.3948911,-38.889355,-255.54753,-306.59113,0.575054,-0.43839324,25.005054,890000
80
+ 1.0,1.0,0.0079781925,0.79781926,1.0079782,1.564211,-70.17223,-259.02884,-306.4312,0.48623157,-0.73407435,26.023708,895000
81
+ 1.0,0.99999994,0.0075883567,0.7588357,1.0075883,1.436489,-62.54796,-255.89363,-306.0714,0.4659593,-0.47066033,25.425173,900000
82
+ 1.0,1.0,0.007734817,0.7734817,1.0077348,1.4620479,-73.79853,-258.16595,-306.38333,0.44941604,-0.37596446,25.104185,905000
83
+ 1.0,0.99999994,0.008486243,0.8486243,1.0084862,1.4098845,-82.77889,-258.70328,-306.79654,0.6468291,-0.55294883,28.366236,910000
84
+ 1.0,0.9999999,0.007555368,0.7555368,1.0075552,1.2197443,-78.15496,-251.6313,-307.0959,0.5481484,-0.40793556,19.759054,915000
85
+ 1.0,0.9999999,0.0074164355,0.74164355,1.0074164,1.1560892,-86.31111,-256.89795,-306.4766,0.34133384,-0.46843484,22.105116,920000
86
+ 1.0,1.0,0.0074436925,0.74436927,1.0074437,1.2428576,-100.68514,-260.1018,-306.51437,0.3625068,-0.31318513,21.950014,925000
87
+ 1.0,1.0,0.008197955,0.8197955,1.0081979,2.109369,-98.944084,-255.4376,-306.88913,0.65028065,-0.6797187,42.152153,930000
88
+ 1.0,1.0,0.0079369005,0.7936901,1.007937,1.5851191,-81.70023,-252.90416,-305.54214,0.40185845,-0.8464864,28.42187,935000
89
+ 1.0,1.0,0.008123852,0.8123852,1.0081239,1.6309103,-35.433758,-251.82686,-306.85562,0.34266996,-0.5423857,29.245817,940000
90
+ 1.0,1.0,0.008569241,0.85692406,1.0085692,2.1425688,-84.87623,-249.61974,-306.6212,0.7368357,-0.5023135,35.19102,945000
91
+ 1.0,1.0,0.0077395686,0.7739569,1.0077395,1.3378657,-75.01177,-254.8297,-306.24356,0.32538676,-0.662514,21.812876,950000
92
+ 1.0,0.9999999,0.007790274,0.77902746,1.0077902,1.3914421,-39.56459,-255.10706,-307.24374,0.42793113,-0.4770121,23.926886,955000
93
+ 1.0,1.0,0.008010961,0.8010962,1.008011,1.6084903,-98.21707,-246.12791,-306.45267,0.42137578,-0.47535557,25.074097,960000
94
+ 1.0,1.0,0.0074970652,0.7497065,1.0074971,1.4322947,-99.97839,-250.47945,-306.8277,0.5875556,-0.31838647,23.744133,965000
95
+ 1.0,1.0,0.0075362287,0.7536229,1.0075362,1.6905552,-100.4699,-254.84619,-306.3321,0.4742586,-0.8549227,27.496588,970000
96
+ 1.0,1.0,0.007616853,0.7616853,1.0076169,1.3662456,-62.159874,-251.05675,-306.0201,0.48372385,-0.27651793,22.276367,975000
97
+ 1.0,0.99999994,0.007901754,0.79017544,1.0079017,1.6320229,-97.15902,-260.3293,-305.9605,1.8211375,-2.1558492,56.04828,980000
98
+ 1.0,1.0,0.007342912,0.7342912,1.0073429,1.3747529,-97.29328,-258.2906,-306.38654,0.615772,-0.4294805,26.704357,985000
99
+ 1.0,1.0,0.008275476,0.82754767,1.0082755,1.6447858,-69.51142,-251.2888,-306.5117,0.29183918,-0.5269276,22.156528,990000
100
+ 1.0,1.0,0.0075624306,0.7562431,1.0075624,1.6897564,-71.128334,-249.52359,-306.04605,0.27429843,-0.52514344,25.169968,995000
101
+ 1.0,0.99999994,0.007843675,0.78436756,1.0078436,1.4324793,-94.334694,-257.59897,-307.0432,0.5793227,-0.25542247,21.065424,1000000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 1.0,0.99999994,0.007396961,0.73969615,1.0073969,3.968153,-136.70201,-279.35425,-307.91046,2.4079533,-2.1559212,63.133064,505000
3
+ 1.0,1.0,0.008048757,0.80487573,1.0080488,1.8152279,-146.13803,-276.42273,-307.14557,0.67230934,-0.7321273,32.235985,510000
4
+ 1.0,1.0000001,0.007615964,0.76159644,1.007616,2.5992181,-127.10021,-271.91672,-308.4174,0.5601063,-0.65795135,42.29136,515000
5
+ 1.0,0.99999994,0.007572887,0.7572887,1.0075728,2.4609373,-169.41626,-278.45728,-308.20456,1.3660331,-1.2916882,44.43788,520000
6
+ 1.0,0.9999999,0.007833958,0.78339577,1.0078338,2.1340358,-108.84383,-277.76572,-306.9331,0.6318604,-0.6971867,35.894817,525000
7
+ 1.0,0.9999894,0.006865694,0.68656945,1.0068551,3.6994,2.40514,-276.6747,-307.49695,4.7780433,-2.0950255,85.88197,530000
8
+ 1.0,1.0,0.0075504403,0.75504404,1.0075505,1.9613632,-107.37689,-280.77756,-308.8597,0.2805871,-0.34039742,29.635174,535000
9
+ 1.0,1.0000001,0.0073400205,0.73400205,1.0073402,2.123347,-101.69337,-276.76187,-307.00964,0.45221895,-0.5777211,33.553787,540000
10
+ 1.0,1.0,0.0069027646,0.6902765,1.0069028,2.003095,-100.04296,-278.99112,-307.73236,0.3259119,-0.42186368,29.187613,545000
11
+ 1.0,1.0,0.007207052,0.7207053,1.007207,1.9346548,-102.69283,-276.02704,-307.75305,0.97085214,-0.6119304,33.751427,550000
12
+ 1.0,1.0,0.0070777354,0.70777357,1.0070777,1.8755153,-101.30759,-274.5611,-307.79077,0.32899928,-0.5940442,28.571743,555000
13
+ 1.0,0.9999999,0.007896065,0.7896065,1.007896,2.099874,-100.6079,-276.0327,-309.53592,0.3586638,-0.39859983,29.088385,560000
14
+ 1.0,1.0,0.007866342,0.7866341,1.0078664,2.2232425,-101.765396,-276.64624,-307.96524,0.8219118,-0.60632586,36.566643,565000
15
+ 1.0,1.0,0.008125585,0.81255853,1.0081255,1.889876,-101.124695,-270.4195,-307.45267,0.33296663,-0.25732714,25.359245,570000
16
+ 1.0,1.0,0.008259395,0.82593954,1.0082594,2.8119895,-34.6264,-267.18588,-308.71042,2.0696084,-1.5094155,53.34698,575000
17
+ 1.0,1.0000001,0.008385367,0.8385366,1.0083855,2.3795764,-100.93347,-270.17285,-306.89246,0.7550418,-1.3182652,39.393345,580000
18
+ 1.0,0.99999994,0.008190772,0.8190772,1.0081908,1.9120411,-94.144104,-271.1406,-307.13397,0.4390317,-0.5713517,28.490772,585000
19
+ 1.0,1.0,0.0075050155,0.7505016,1.007505,1.7746403,-101.2742,-272.85043,-307.54507,0.3922326,-0.27956307,26.064026,590000
20
+ 1.0,0.9999998,0.008414587,0.8414587,1.0084144,1.8932583,-100.04456,-273.14786,-307.02246,0.5445146,-0.47613433,34.230637,595000
21
+ 1.0,1.0,0.0073146266,0.7314627,1.0073147,2.5382822,-99.86018,-269.5482,-308.18582,0.750116,-1.0597526,38.690456,600000
22
+ 1.0,0.9999999,0.0072612506,0.7261251,1.0072612,1.8565506,-99.873215,-273.5824,-305.9784,0.36168864,-0.34017846,28.51985,605000
23
+ 1.0,1.0,0.007933683,0.7933682,1.0079337,2.288739,-100.54296,-274.9977,-307.68933,1.575415,-0.8435814,46.26982,610000
24
+ 1.0,0.9999999,0.007259953,0.7259953,1.0072598,2.0974853,-98.141464,-268.37558,-307.885,0.52424204,-0.5949646,31.458546,615000
25
+ 1.0,1.0000001,0.007133987,0.7133987,1.0071341,1.955512,-100.14969,-267.80005,-307.15253,0.95347744,-1.1586851,33.226086,620000
26
+ 1.0,1.0,0.007198617,0.7198617,1.0071986,2.1956365,-100.76039,-274.42172,-307.01877,0.9136755,-0.56140924,39.165024,625000
27
+ 1.0,0.99999994,0.0075774817,0.7577482,1.0075774,1.9286139,-100.711876,-272.80127,-306.73483,0.40352225,-0.47541398,29.531387,630000
28
+ 1.0,0.99999994,0.006997576,0.6997576,1.0069975,2.2693758,-101.02249,-272.2158,-306.822,4.1708326,-4.7313585,83.45372,635000
29
+ 1.0,1.0,0.007845145,0.7845144,1.0078452,1.8133625,-100.691536,-268.57745,-306.41077,0.6015786,-0.53079534,34.60227,640000
30
+ 1.0,1.0000001,0.0081526255,0.8152625,1.0081527,1.8174294,-100.615204,-267.2517,-306.41388,0.99178773,-1.458635,35.58221,645000
31
+ 1.0,1.0,0.007124742,0.7124742,1.0071248,2.0110447,-100.13889,-270.267,-307.40567,0.4672503,-0.6103318,34.564445,650000
32
+ 1.0,1.0,0.0072615063,0.7261507,1.0072615,1.5666474,-100.3726,-270.75122,-307.63843,0.2523687,-0.3787462,24.498001,655000
33
+ 1.0,1.0,0.0070333667,0.7033367,1.0070333,2.3751342,-99.82209,-265.0137,-309.06387,0.6647452,-0.5296116,35.800404,660000
34
+ 1.0,1.0000001,0.008400537,0.8400537,1.0084007,2.138152,-100.4167,-267.77805,-307.65417,0.48520595,-0.5644812,30.84504,665000
35
+ 1.0,0.99999994,0.008119814,0.8119814,1.0081197,6.470164,-100.584236,-266.3355,-307.03577,4.4926066,-4.7861514,147.30148,670000
36
+ 1.0,0.9999999,0.007903293,0.7903293,1.0079032,1.8297844,-100.340515,-267.1866,-306.6495,0.57480764,-0.37293774,30.854841,675000
37
+ 1.0,1.0,0.008458397,0.84583974,1.0084584,2.3464537,-100.80573,-266.3547,-306.95648,2.2611427,-1.9853977,52.08563,680000
38
+ 1.0,1.0,0.007299325,0.72993255,1.0072993,1.8319899,-100.654495,-262.67953,-307.17847,0.35021394,-0.5536397,30.868181,685000
39
+ 1.0,1.0000001,0.007996542,0.7996543,1.0079967,1.5019563,-100.23745,-265.17538,-307.31482,0.47299358,-0.62591803,24.452997,690000
40
+ 1.0,1.0000001,0.0077168737,0.7716873,1.007717,2.0608566,-100.08418,-269.61813,-306.57367,0.3778512,-0.748732,33.634243,695000
41
+ 1.0,0.99999994,0.008435283,0.8435284,1.0084352,2.291792,-100.67912,-263.2044,-306.51068,0.5672797,-0.6457275,38.342472,700000
42
+ 1.0,1.0,0.008764412,0.8764412,1.0087644,2.0127425,-96.87042,-263.19492,-306.81784,0.7026994,-0.52072954,36.755356,705000
43
+ 1.0,1.0,0.007945934,0.7945936,1.0079459,2.084535,-99.69593,-265.78513,-306.35785,1.1091021,-0.43898332,35.77311,710000
44
+ 1.0,0.9999998,0.0077437493,0.77437496,1.0077436,1.8151817,-100.29158,-261.82397,-307.72144,0.6835909,-0.39732444,28.069195,715000
45
+ 1.0,1.0,0.0080063585,0.8006359,1.0080063,1.7931212,-21.051516,-267.22412,-306.91537,0.5408041,-0.28676254,29.282978,720000
46
+ 1.0,1.0,0.007369361,0.7369361,1.0073694,2.903956,-100.609406,-268.40308,-307.29437,1.0712274,-0.6221457,48.253044,725000
47
+ 1.0,1.0000001,0.008080055,0.8080055,1.0080801,3.581413,-100.75393,-268.0486,-308.1371,0.5838383,-0.995267,43.403915,730000
48
+ 1.0,0.99999994,0.007578984,0.75789845,1.007579,1.351052,-43.972958,-266.03415,-306.62823,0.54327047,-0.22874418,21.856956,735000
49
+ 1.0,1.0,0.0076707257,0.7670726,1.0076708,1.9451655,-100.11214,-267.83917,-306.86343,0.40335816,-0.28425616,27.047321,740000
50
+ 1.0,0.9999999,0.0077339,0.77339005,1.0077338,1.3873252,-100.67105,-260.0399,-306.68732,0.63812256,-0.43469554,25.8509,745000
51
+ 1.0,1.0,0.007613639,0.7613639,1.0076137,2.046611,-100.82102,-271.85263,-307.498,5.158666,-5.1582675,65.71833,750000
52
+ 1.0,1.0,0.006823267,0.6823267,1.0068233,1.7851114,-100.258965,-263.2427,-306.7119,0.95263237,-0.4286154,28.62216,755000
53
+ 1.0,0.9999999,0.007040728,0.70407283,1.0070406,1.9014677,-100.49715,-265.5795,-306.71466,0.7659905,-0.8448128,39.322136,760000
54
+ 1.0,1.0,0.007701124,0.7701124,1.0077012,1.5628251,-97.51721,-264.7893,-306.65338,0.3072752,-0.3337128,25.963793,765000
55
+ 1.0,1.0,0.0072311414,0.72311413,1.0072311,1.6316884,-99.0343,-267.05505,-306.64923,0.5680131,-0.6124497,28.744928,770000
56
+ 1.0,1.0,0.007569814,0.7569814,1.0075698,1.843474,-40.912937,-261.12708,-307.44788,0.40425754,-0.4317653,26.021439,775000
57
+ 1.0,0.99999994,0.007816406,0.78164065,1.0078163,1.659483,-100.66247,-261.66977,-307.2629,0.2725393,-0.7753077,28.035254,780000
58
+ 1.0,1.0,0.0071961256,0.71961254,1.0071961,1.6632931,-100.55968,-266.7285,-306.57758,0.3950683,-0.32358283,23.531609,785000
59
+ 1.0,1.0,0.007891433,0.7891433,1.0078914,1.5964974,-100.70107,-260.42813,-307.47577,0.42943567,-0.6739689,27.686356,790000
60
+ 1.0,1.0,0.008059664,0.8059664,1.0080596,1.2890654,-99.58843,-266.4476,-306.45813,0.841638,-0.8311934,24.977379,795000
61
+ 1.0,0.99999994,0.008182872,0.81828725,1.0081828,1.6687214,-100.379524,-260.7599,-306.2004,0.50999093,-0.649148,31.366928,800000
62
+ 1.0,0.99999994,0.007508847,0.7508847,1.0075088,1.4736481,-98.55538,-260.5425,-306.26346,0.83698,-0.7837655,32.775475,805000
63
+ 1.0,0.99999994,0.008550283,0.8550283,1.0085502,1.5123811,-100.15986,-259.15762,-306.50253,0.66393846,-0.34845728,25.221977,810000
64
+ 1.0,1.0,0.008746498,0.8746499,1.0087465,2.3193989,-100.76847,-255.98753,-307.47388,0.52779025,-0.6635053,35.215927,815000
65
+ 1.0,1.0,0.006724396,0.6724396,1.0067244,1.620101,-70.66515,-251.96284,-307.76523,0.6240629,-2.1127434,35.17873,820000
66
+ 1.0,0.99999994,0.007970024,0.79700243,1.00797,1.8205235,-100.41714,-262.72583,-307.72574,0.81670237,-0.49110055,29.000164,825000
67
+ 1.0,1.0,0.0076911235,0.7691124,1.0076911,1.7489058,-95.15194,-257.60153,-306.25278,0.45949557,-0.32406172,25.127995,830000
68
+ 1.0,0.9999998,0.007943465,0.7943466,1.0079433,1.2762903,-99.07161,-257.8607,-306.7122,0.1778484,-0.29549223,22.50092,835000
69
+ 1.0,0.9999999,0.008444082,0.8444083,1.008444,1.6080235,-98.5555,-264.84833,-306.57248,0.79933363,-0.19287735,24.562849,840000
70
+ 1.0,0.99999994,0.0076494683,0.7649468,1.0076494,1.9069397,-100.644516,-265.9293,-306.86868,0.7347599,-0.4431768,29.849064,845000
71
+ 1.0,0.99999994,0.00807463,0.80746305,1.0080745,1.567407,-100.51904,-256.916,-307.50696,0.40426755,-0.35422248,22.831388,850000
72
+ 1.0,1.0000001,0.008369176,0.8369176,1.0083693,2.0169888,-100.07935,-259.6963,-306.50067,0.44342816,-0.63660526,30.164015,855000
73
+ 1.0,1.0000001,0.007520531,0.7520531,1.0075207,4.600072,-81.32264,-258.48486,-306.41852,4.8027277,-9.431124,140.00635,860000
74
+ 1.0,1.0000001,0.0069423495,0.69423497,1.0069425,1.3181337,-76.283165,-262.23825,-307.3291,0.5964843,-0.23853786,20.201857,865000
75
+ 1.0,0.9999999,0.0083329715,0.83329725,1.0083328,1.1287673,-98.670784,-253.82408,-306.64526,0.4527012,-0.27471164,19.082123,870000
76
+ 1.0,0.9999999,0.0070878053,0.7087805,1.0070877,1.580825,-99.6263,-262.14648,-306.2462,0.49521253,-0.4249605,26.11988,875000
77
+ 1.0,1.0,0.007735015,0.77350146,1.007735,1.5817844,-61.33023,-260.27658,-306.33292,0.28319052,-0.38439813,25.618252,880000
78
+ 1.0,1.0,0.007619445,0.76194453,1.0076195,1.5382749,-48.72706,-258.65994,-306.4709,0.34095567,-0.35643655,25.635258,885000
79
+ 1.0,1.0,0.007705211,0.77052116,1.0077052,1.3948911,-38.889355,-255.54753,-306.59113,0.575054,-0.43839324,25.005054,890000
80
+ 1.0,1.0,0.0079781925,0.79781926,1.0079782,1.564211,-70.17223,-259.02884,-306.4312,0.48623157,-0.73407435,26.023708,895000
81
+ 1.0,0.99999994,0.0075883567,0.7588357,1.0075883,1.436489,-62.54796,-255.89363,-306.0714,0.4659593,-0.47066033,25.425173,900000
82
+ 1.0,1.0,0.007734817,0.7734817,1.0077348,1.4620479,-73.79853,-258.16595,-306.38333,0.44941604,-0.37596446,25.104185,905000
83
+ 1.0,0.99999994,0.008486243,0.8486243,1.0084862,1.4098845,-82.77889,-258.70328,-306.79654,0.6468291,-0.55294883,28.366236,910000
84
+ 1.0,0.9999999,0.007555368,0.7555368,1.0075552,1.2197443,-78.15496,-251.6313,-307.0959,0.5481484,-0.40793556,19.759054,915000
85
+ 1.0,0.9999999,0.0074164355,0.74164355,1.0074164,1.1560892,-86.31111,-256.89795,-306.4766,0.34133384,-0.46843484,22.105116,920000
86
+ 1.0,1.0,0.0074436925,0.74436927,1.0074437,1.2428576,-100.68514,-260.1018,-306.51437,0.3625068,-0.31318513,21.950014,925000
87
+ 1.0,1.0,0.008197955,0.8197955,1.0081979,2.109369,-98.944084,-255.4376,-306.88913,0.65028065,-0.6797187,42.152153,930000
88
+ 1.0,1.0,0.0079369005,0.7936901,1.007937,1.5851191,-81.70023,-252.90416,-305.54214,0.40185845,-0.8464864,28.42187,935000
89
+ 1.0,1.0,0.008123852,0.8123852,1.0081239,1.6309103,-35.433758,-251.82686,-306.85562,0.34266996,-0.5423857,29.245817,940000
90
+ 1.0,1.0,0.008569241,0.85692406,1.0085692,2.1425688,-84.87623,-249.61974,-306.6212,0.7368357,-0.5023135,35.19102,945000
91
+ 1.0,1.0,0.0077395686,0.7739569,1.0077395,1.3378657,-75.01177,-254.8297,-306.24356,0.32538676,-0.662514,21.812876,950000
92
+ 1.0,0.9999999,0.007790274,0.77902746,1.0077902,1.3914421,-39.56459,-255.10706,-307.24374,0.42793113,-0.4770121,23.926886,955000
93
+ 1.0,1.0,0.008010961,0.8010962,1.008011,1.6084903,-98.21707,-246.12791,-306.45267,0.42137578,-0.47535557,25.074097,960000
94
+ 1.0,1.0,0.0074970652,0.7497065,1.0074971,1.4322947,-99.97839,-250.47945,-306.8277,0.5875556,-0.31838647,23.744133,965000
95
+ 1.0,1.0,0.0075362287,0.7536229,1.0075362,1.6905552,-100.4699,-254.84619,-306.3321,0.4742586,-0.8549227,27.496588,970000
96
+ 1.0,1.0,0.007616853,0.7616853,1.0076169,1.3662456,-62.159874,-251.05675,-306.0201,0.48372385,-0.27651793,22.276367,975000
97
+ 1.0,0.99999994,0.007901754,0.79017544,1.0079017,1.6320229,-97.15902,-260.3293,-305.9605,1.8211375,-2.1558492,56.04828,980000
98
+ 1.0,1.0,0.007342912,0.7342912,1.0073429,1.3747529,-97.29328,-258.2906,-306.38654,0.615772,-0.4294805,26.704357,985000
99
+ 1.0,1.0,0.008275476,0.82754767,1.0082755,1.6447858,-69.51142,-251.2888,-306.5117,0.29183918,-0.5269276,22.156528,990000
100
+ 1.0,1.0,0.0075624306,0.7562431,1.0075624,1.6897564,-71.128334,-249.52359,-306.04605,0.27429843,-0.52514344,25.169968,995000
101
+ 1.0,0.99999994,0.007843675,0.78436756,1.0078436,1.4324793,-94.334694,-257.59897,-307.0432,0.5793227,-0.25542247,21.065424,1000000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_1000000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:418864301c14ab0bdc83d789682be80fb498505eca9bfcc9af181ccc6f527ecf
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a683ef3a1c3879c9abf34946a9cc8fef0c513509ec646cc7650e76eee762d5ce
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e2f4ddd6a4a945b0a47189c12d53f423af1f5220171887b8e465e385cf6e37e
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:879e2d3da68ff4a1f73397d01455e4154974c5e707b06208f12623f262f9e68d
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:203615a4bfd06b0222c3e1e751d756b6268cc076be1bf0254b625b9f62c27b22
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9a5fe9f3191c3a75c95498b3eed014d2be6a431e10acfb6b54e005d5ede1ee
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe44d394ecc14310a2c70231616a05c301e6ea5389e4995b02340487321aca77
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89486622b21f62054a0390f68002d60e73762281953ca9ef67318d311720250c
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0df7614933ab94f48fca9c80f86cfb264daa81dcb183f35b8900269256df04a
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/params_950000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d42ae758aa4190744d0bf28cb54a1fca4ed6fa2508106b3cfa90096b629ed9c
3
+ size 218872466
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/rebrac/20260326_144921/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/yy613jid