Tiredsheep commited on
Commit
127f0b4
·
verified ·
1 Parent(s): 3397428

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_150000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_200000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_250000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_300000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_350000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_400000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_450000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_500000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_550000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_600000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.1082994422001929,0.003011505866011959,-0.10790569295182573,0.004536970518118108,21.830278772622208,24.73999999999702,0.04,12648.6,-1.24,-760.68,492.8,1.4122252988815307,150000
3
+ 0.0,0.0,-0.07273981965148434,0.0007607505564756634,-0.07326182728802899,-0.001774200896895223,25.906153610682647,20.37899999999817,0.38,35989.5,-0.76,-591.02,405.58,1.1899633693695069,200000
4
+ 0.0,0.0,-0.03392553203456798,-0.0038452520494004095,-0.03432573511752833,-0.008445330630372975,32.223182731138294,12.860999999999478,0.82,52941.82,-0.18,-358.3,255.22,0.7875207948684693,250000
5
+ 0.0,0.0,-0.036968987953707774,-0.005447807782881667,-0.03707245933198696,-0.005786821411527158,33.624170763598165,9.570999999999474,0.92,64528.46,-0.12,-267.14,189.42,0.5965239715576172,300000
6
+ 0.0,0.0,-0.04966370424580055,-0.005347870406606667,-0.04986510776049742,-0.00458418710003229,34.414831882748416,8.756999999999476,0.96,74142.66,-0.06,-245.78,173.14,0.5569100570678711,350000
7
+ 0.0,0.0,-0.01634530758458798,-0.0008786739541335655,-0.01613896782981276,-0.0010769550841284213,34.2487810466259,8.498999999999523,0.96,83286.12,-0.06,-235.08,167.98,0.5338046264648437,400000
8
+ 0.0,0.0,-0.028978953325945554,-0.0038878405150012296,-0.02897230768957166,-0.0034891184730423156,35.62727951990254,7.40499999999943,0.96,91565.9,-0.06,-205.34,146.1,0.46874956130981443,450000
9
+ 0.0,0.0,-0.028165050988662062,-0.003351250961580319,-0.02779330005309437,0.01789551158531212,35.56706930880914,6.414999999999612,1.0,98595.64,0.0,-176.88,126.3,0.4177889966964722,500000
10
+ 0.0,0.0,-0.038642823044209455,-0.0010554350740517575,-0.03831615989651927,0.028976557441591135,35.056014344020944,7.352999999999688,0.98,105424.58,-0.02,-200.12,145.06,0.46813130378723145,550000
11
+ 0.0,0.0,-0.03390552310154314,0.013562974781448673,-0.03313436006515467,0.0067784316148002555,35.62427346643689,5.857999999999705,1.0,112560.96,0.0,-161.22,115.16,0.37461525917053223,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.1082994422001929,0.003011505866011959,-0.10790569295182573,0.004536970518118108,21.830278772622208,24.73999999999702,0.04,12648.6,-1.24,-760.68,492.8,1.4122252988815307,150000
3
+ 0.0,0.0,-0.07273981965148434,0.0007607505564756634,-0.07326182728802899,-0.001774200896895223,25.906153610682647,20.37899999999817,0.38,35989.5,-0.76,-591.02,405.58,1.1899633693695069,200000
4
+ 0.0,0.0,-0.03392553203456798,-0.0038452520494004095,-0.03432573511752833,-0.008445330630372975,32.223182731138294,12.860999999999478,0.82,52941.82,-0.18,-358.3,255.22,0.7875207948684693,250000
5
+ 0.0,0.0,-0.036968987953707774,-0.005447807782881667,-0.03707245933198696,-0.005786821411527158,33.624170763598165,9.570999999999474,0.92,64528.46,-0.12,-267.14,189.42,0.5965239715576172,300000
6
+ 0.0,0.0,-0.04966370424580055,-0.005347870406606667,-0.04986510776049742,-0.00458418710003229,34.414831882748416,8.756999999999476,0.96,74142.66,-0.06,-245.78,173.14,0.5569100570678711,350000
7
+ 0.0,0.0,-0.01634530758458798,-0.0008786739541335655,-0.01613896782981276,-0.0010769550841284213,34.2487810466259,8.498999999999523,0.96,83286.12,-0.06,-235.08,167.98,0.5338046264648437,400000
8
+ 0.0,0.0,-0.028978953325945554,-0.0038878405150012296,-0.02897230768957166,-0.0034891184730423156,35.62727951990254,7.40499999999943,0.96,91565.9,-0.06,-205.34,146.1,0.46874956130981443,450000
9
+ 0.0,0.0,-0.028165050988662062,-0.003351250961580319,-0.02779330005309437,0.01789551158531212,35.56706930880914,6.414999999999612,1.0,98595.64,0.0,-176.88,126.3,0.4177889966964722,500000
10
+ 0.0,0.0,-0.038642823044209455,-0.0010554350740517575,-0.03831615989651927,0.028976557441591135,35.056014344020944,7.352999999999688,0.98,105424.58,-0.02,-200.12,145.06,0.46813130378723145,550000
11
+ 0.0,0.0,-0.03390552310154314,0.013562974781448673,-0.03313436006515467,0.0067784316148002555,35.62427346643689,5.857999999999705,1.0,112560.96,0.0,-161.22,115.16,0.37461525917053223,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 170.36433,0.21894172,0.006029191,7.30685,-77.37833,-170.39343,-205.4688,0.7845931,-0.8711581,82.360916,105000
3
+ 169.17783,0.19607791,0.006546308,6.729875,-60.224895,-169.07054,-205.06429,2.074533,-1.4942386,82.69476,110000
4
+ 167.67525,0.19802313,0.0057289028,7.6522784,-62.147114,-167.57787,-205.40822,1.0178978,-1.069851,74.35617,115000
5
+ 169.63168,0.20277095,0.0058093974,9.601883,-70.78181,-169.7659,-204.72607,0.8717408,-0.7142322,76.03804,120000
6
+ 168.48828,0.19374391,0.007202891,6.742466,-96.76988,-168.10051,-205.08267,1.5551095,-1.6026022,67.93953,125000
7
+ 166.5464,0.19563828,0.005621531,8.509864,-93.04726,-166.5781,-205.50827,1.1672877,-0.9607878,76.76318,130000
8
+ 166.74307,0.17378657,0.006387247,7.1664047,-50.24512,-166.75803,-204.93959,0.76640326,-0.6341237,71.68039,135000
9
+ 166.6372,0.18906733,0.0065080486,7.3975067,-66.13559,-166.97327,-206.3076,0.6904578,-0.7056025,71.36244,140000
10
+ 166.85966,0.18073499,0.006719387,6.3656893,-99.785194,-166.71233,-206.48392,7.013233,-7.8439493,148.12427,145000
11
+ 166.17963,0.20729432,0.005079087,9.659443,-88.73269,-166.27373,-206.91754,0.56020427,-0.83641684,79.49196,150000
12
+ 165.34685,0.20561716,0.0067161703,8.543812,-44.281883,-165.59138,-205.81795,1.3302803,-1.3829083,97.52431,155000
13
+ 163.94308,0.21787202,0.0069280206,7.521175,-60.326332,-164.50148,-206.91759,1.4113789,-1.4440593,82.18639,160000
14
+ 164.86636,0.17405638,0.0058633066,7.365646,-77.90503,-164.5954,-206.43721,1.0911732,-0.5000456,70.99501,165000
15
+ 159.11969,0.18866064,0.006610118,10.405631,-47.078773,-159.22746,-205.77167,1.829257,-2.45594,115.98605,170000
16
+ 163.75331,0.18817297,0.0067227012,9.4044485,-44.88467,-163.5277,-206.50441,0.9992245,-0.8565229,80.21806,175000
17
+ 163.07016,0.17400765,0.0056139273,7.7165427,-89.98117,-163.53116,-206.34828,0.61332476,-0.9117926,83.88816,180000
18
+ 161.94952,0.17026816,0.0062036025,8.116173,-68.62124,-161.84923,-205.81209,0.5785081,-0.6366843,74.3481,185000
19
+ 160.6735,0.18766049,0.00744603,6.353201,-25.06006,-160.50224,-206.77081,1.9802917,-2.1133678,90.35126,190000
20
+ 158.23639,0.15247436,0.0063208584,6.964598,-12.33769,-158.50166,-205.68327,0.6933593,-0.6916895,60.824055,195000
21
+ 156.27238,0.17519215,0.0067133605,10.779881,-31.722887,-155.8781,-205.82666,15.378744,-16.81961,277.5628,200000
22
+ 158.63504,0.19566041,0.0074162907,7.8488183,-52.798462,-159.1885,-206.42793,0.76031506,-0.5136889,66.516335,205000
23
+ 156.99013,0.17775333,0.0064749736,8.407059,-44.420174,-156.77927,-206.96283,0.8568773,-0.9689222,86.82034,210000
24
+ 154.83827,0.16183841,0.0076118507,7.608043,1.6605824,-155.00995,-206.22096,0.9419573,-1.0868781,77.26083,215000
25
+ 154.38905,0.17617625,0.006247711,9.952843,-36.3563,-154.70604,-205.66072,1.2745763,-1.3791659,94.39198,220000
26
+ 156.08891,0.20951201,0.008045672,5.424497,-19.197014,-155.94826,-206.44539,1.0179567,-0.9485631,66.62096,225000
27
+ 152.78012,0.16920249,0.0062982365,7.4996657,-29.1067,-153.15428,-206.78116,1.3159482,-1.334151,79.85596,230000
28
+ 151.4758,0.18569055,0.007306645,9.70651,2.2225487,-152.2435,-206.66393,2.494657,-2.3951373,114.173256,235000
29
+ 147.49304,0.21323606,0.0067745815,6.4634295,-45.2182,-148.23262,-205.96294,0.981453,-0.97025824,70.38358,240000
30
+ 151.94766,0.17840144,0.0075463173,8.088499,-30.566624,-152.2557,-206.0048,1.5482494,-0.7557701,77.22226,245000
31
+ 147.03555,0.19981742,0.006065391,6.650284,-6.035357,-147.28279,-206.94173,0.6972202,-0.9527101,73.369576,250000
32
+ 146.29326,0.16906586,0.007982335,7.9737396,-5.8075724,-146.98903,-207.14362,2.1590302,-1.7333362,98.75754,255000
33
+ 148.94885,0.19283384,0.0073309676,6.470512,-23.270819,-148.91365,-206.22253,1.2497947,-0.97256464,72.69933,260000
34
+ 144.72977,0.18187001,0.0073369606,11.183514,-1.155612,-145.28871,-206.17592,0.7613717,-0.8631334,81.84578,265000
35
+ 145.48438,0.18519565,0.0062072407,8.774543,-13.601801,-146.09267,-208.34697,0.8630998,-0.86108655,71.16887,270000
36
+ 148.03642,0.21036658,0.007136873,7.040549,-29.635118,-147.86443,-206.07816,1.0923246,-1.1224921,72.76837,275000
37
+ 146.32558,0.18033716,0.005982998,8.836471,2.6608799,-146.89323,-206.76927,3.9294307,-3.9761124,95.1454,280000
38
+ 142.91388,0.18972206,0.007756878,5.3909545,-10.443463,-143.14188,-206.70886,1.0673277,-1.0787406,68.59964,285000
39
+ 142.78514,0.16356176,0.008048165,9.379755,-26.021898,-143.66222,-206.86331,1.5797837,-1.3398582,97.0882,290000
40
+ 144.18135,0.17861168,0.007491418,8.012003,-4.4531703,-144.1055,-206.52899,1.5188723,-1.5138438,77.4846,295000
41
+ 143.2969,0.20481169,0.008429656,6.07559,-10.642406,-143.74448,-207.38278,0.84008896,-0.8546343,68.82912,300000
42
+ 141.90186,0.16033593,0.0059093037,5.9377527,-6.3765426,-142.53456,-206.47383,1.2694974,-1.3443509,73.80471,305000
43
+ 140.3665,0.16564643,0.008206978,7.568438,-18.62672,-140.3671,-206.08751,1.0662369,-1.0767798,88.83289,310000
44
+ 142.09285,0.1659788,0.007707567,10.117618,-10.6708,-142.1759,-207.16382,2.0725381,-1.812202,95.91617,315000
45
+ 139.95119,0.16143797,0.00683396,8.789693,-11.989407,-140.10677,-206.10672,1.3851298,-1.2626438,85.89223,320000
46
+ 136.67232,0.18466502,0.0074616023,9.425267,-10.429409,-136.63457,-205.65352,2.3044367,-2.1029897,108.597824,325000
47
+ 139.35927,0.20021755,0.008027626,6.7536607,-14.795733,-139.28845,-208.64197,0.98190236,-0.9411231,76.56332,330000
48
+ 138.55115,0.17118013,0.0063351044,5.5394306,-14.277614,-138.39743,-206.40433,3.6484606,-2.434829,72.00805,335000
49
+ 137.33824,0.18192746,0.0062597846,5.342087,1.8706388,-137.53511,-206.50905,0.9245131,-1.0123506,83.54138,340000
50
+ 139.0793,0.1848338,0.007351497,8.179608,-5.207801,-139.67552,-205.5466,1.333427,-0.86655194,76.48338,345000
51
+ 128.3735,0.1796968,0.0070594847,12.247507,-6.0065517,-128.841,-208.78543,2.6052685,-1.5861846,101.34641,350000
52
+ 141.19482,0.17602775,0.008147542,6.362179,-6.2299647,-142.0682,-208.96477,1.0425229,-0.93115,67.09405,355000
53
+ 136.1879,0.2051761,0.0071761105,9.735938,1.3996044,-136.97746,-205.51555,0.9840314,-1.8309411,86.27194,360000
54
+ 137.49907,0.17588153,0.007344768,5.59571,-22.756165,-137.83142,-206.64748,1.3585284,-1.3916738,68.95637,365000
55
+ 136.87233,0.17739311,0.006796496,6.238601,-14.863088,-137.18018,-205.36304,2.0899448,-2.3912437,106.574875,370000
56
+ 130.977,0.1902206,0.008613426,8.625649,-2.899521,-131.1317,-207.09421,1.2342834,-1.1851927,89.53218,375000
57
+ 133.28494,0.18393755,0.009118933,6.2765994,-1.8302927,-134.14232,-206.487,2.1198874,-2.0513363,91.72352,380000
58
+ 130.60258,0.16541028,0.007889809,5.1797004,-10.091493,-131.86226,-206.40796,1.7279665,-1.1581593,74.531204,385000
59
+ 128.24393,0.15922618,0.0071567404,9.754177,-9.080371,-128.99095,-208.31445,0.93972504,-0.9569409,86.97763,390000
60
+ 128.90193,0.16625214,0.007382805,8.647094,2.1610925,-129.38737,-206.00694,4.5666046,-5.0987144,128.72467,395000
61
+ 135.62279,0.1445878,0.00767932,7.0351763,0.5494194,-135.4263,-206.41792,1.3773159,-1.5316556,71.32526,400000
62
+ 131.56271,0.17303348,0.007859079,8.0727415,-2.488693,-132.63094,-206.77599,1.6989218,-1.4858683,96.86947,405000
63
+ 128.0134,0.16459425,0.006940962,5.316918,-3.9886737,-128.53572,-206.6262,2.5825028,-2.5795941,72.312744,410000
64
+ 128.7348,0.19685663,0.0064651417,4.7107363,-0.4697784,-128.94424,-205.43286,0.95871913,-0.96215534,67.11398,415000
65
+ 130.60416,0.16490093,0.008074075,6.933126,-0.32970625,-131.34515,-205.92598,1.1734091,-1.2569215,70.03881,420000
66
+ 128.78223,0.18530758,0.006585499,6.5972443,-3.5288134,-129.1845,-206.02101,1.393192,-1.3716276,77.95216,425000
67
+ 126.042755,0.20583215,0.0076041333,5.129434,-16.48037,-126.184265,-205.78636,1.481667,-1.5007421,71.87279,430000
68
+ 128.91081,0.16685365,0.0081781,6.4570346,6.2812867,-129.16763,-206.42761,1.6147461,-1.8175046,95.39056,435000
69
+ 129.843,0.19702086,0.00647768,7.91386,-6.440866,-130.07437,-205.21628,1.86248,-1.3439138,105.48244,440000
70
+ 134.47449,0.16819046,0.007918379,6.4390335,-9.009464,-135.63834,-205.63628,1.2989765,-0.9598222,76.34581,445000
71
+ 120.78238,0.16124439,0.008011321,5.213465,-4.4561105,-121.09501,-205.4993,2.2102125,-2.1412358,72.354355,450000
72
+ 129.32608,0.16403216,0.006540787,5.4983726,-1.8250384,-129.40652,-205.61757,0.85649663,-0.95740795,60.905594,455000
73
+ 123.35592,0.19912824,0.0061948844,4.9346747,-2.7656236,-123.891495,-203.82954,0.711717,-0.9721967,60.907852,460000
74
+ 128.76097,0.17102051,0.0071913037,6.949721,-4.2728677,-129.377,-207.45792,0.9348949,-1.1507661,67.40925,465000
75
+ 126.36452,0.16768114,0.008505501,6.7580767,-1.5945193,-126.5169,-207.26532,0.92392313,-1.2034451,75.088135,470000
76
+ 123.19831,0.16238818,0.0072487947,7.732679,1.5296301,-124.48549,-205.95447,1.538346,-1.1151538,93.29498,475000
77
+ 124.65933,0.16884959,0.0068334127,7.8628373,-4.225449,-125.290726,-206.28015,1.6040239,-1.4948745,112.16365,480000
78
+ 125.65905,0.13786928,0.006195744,5.581975,2.37257,-126.34688,-205.18672,0.91230965,-0.89154774,72.81787,485000
79
+ 128.69356,0.17004785,0.00793877,6.062862,-2.1094599,-129.02336,-206.22798,2.8397713,-3.1757445,109.75796,490000
80
+ 125.74614,0.16022219,0.007102709,7.2238297,2.3845646,-126.99214,-206.37772,0.8479984,-1.0374699,68.55626,495000
81
+ 120.099335,0.14688605,0.0058261943,6.2558866,-2.9229774,-120.7476,-206.8186,0.6332418,-0.6682107,53.365814,500000
82
+ 125.9198,0.1828177,0.00619709,5.4703093,2.660671,-126.4475,-207.645,1.5038699,-0.96893364,71.80914,505000
83
+ 129.78273,0.19624226,0.0070684124,6.105505,-6.7256465,-129.93819,-205.47493,1.0892931,-1.0320286,82.10678,510000
84
+ 123.67054,0.16573784,0.008028347,6.3732266,-1.8154807,-123.99491,-206.53903,0.9027804,-0.7386992,64.92002,515000
85
+ 124.69497,0.16809386,0.007857343,6.458307,-4.4270134,-125.66161,-208.81415,5.671386,-6.3832283,141.8532,520000
86
+ 119.915245,0.15855086,0.007855251,8.984485,-5.7908792,-120.821045,-207.70482,1.6197314,-1.547155,114.31679,525000
87
+ 119.972824,0.18677655,0.0058567575,7.368203,4.2591844,-120.47227,-206.89934,1.4433677,-1.4354756,72.31756,530000
88
+ 121.36884,0.19349036,0.006261016,8.673092,-5.783006,-121.95227,-205.99469,1.7397449,-1.5402676,99.24326,535000
89
+ 118.66977,0.15409777,0.0064587127,6.922184,-3.0481927,-119.37325,-207.90236,1.964745,-2.2784834,115.43329,540000
90
+ 125.055046,0.18204316,0.006504793,4.317791,-4.225568,-125.9175,-206.24545,0.9811372,-1.0443765,63.738922,545000
91
+ 116.697136,0.14854501,0.0065281503,6.8946533,-3.1851313,-117.6181,-205.59828,0.7752272,-0.83128864,81.660706,550000
92
+ 122.2359,0.17779335,0.0063771554,4.260939,-4.072661,-122.74955,-205.43623,0.6868709,-0.9449014,46.488945,555000
93
+ 117.77301,0.1546013,0.006839685,4.6886954,0.5398868,-118.70988,-205.98552,1.608045,-1.6602875,70.31387,560000
94
+ 121.37623,0.17227824,0.0072939782,6.018552,-5.249189,-121.63273,-205.70364,1.0832206,-1.1368798,71.503,565000
95
+ 117.4453,0.15827319,0.0066221277,5.13947,-1.5730124,-117.985306,-205.27672,0.9608782,-0.93175024,55.85295,570000
96
+ 121.91157,0.17913774,0.006647667,6.6887345,-1.7272011,-122.758385,-205.83427,0.9667392,-0.979988,74.90047,575000
97
+ 115.88664,0.14975587,0.0075136735,7.6345935,0.47374815,-116.734825,-206.4812,0.6163561,-0.6725199,66.7888,580000
98
+ 121.62561,0.1758306,0.0073668663,7.580495,3.0248332,-122.32151,-206.1131,3.6969879,-3.1692827,127.265,585000
99
+ 116.766174,0.17129938,0.006323202,7.2183976,-0.9948119,-117.08543,-205.74246,0.9726885,-1.1822499,94.52745,590000
100
+ 109.61898,0.13844872,0.0071428907,6.1544733,-3.0178797,-110.118095,-206.10524,1.1577383,-1.2149646,76.931046,595000
101
+ 108.46011,0.17863686,0.0067828363,4.6912613,-2.2519913,-109.35579,-206.15337,0.71140885,-0.7565845,55.287464,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 170.36433,0.21894172,0.006029191,7.30685,-77.37833,-170.39343,-205.4688,0.7845931,-0.8711581,82.360916,105000
3
+ 169.17783,0.19607791,0.006546308,6.729875,-60.224895,-169.07054,-205.06429,2.074533,-1.4942386,82.69476,110000
4
+ 167.67525,0.19802313,0.0057289028,7.6522784,-62.147114,-167.57787,-205.40822,1.0178978,-1.069851,74.35617,115000
5
+ 169.63168,0.20277095,0.0058093974,9.601883,-70.78181,-169.7659,-204.72607,0.8717408,-0.7142322,76.03804,120000
6
+ 168.48828,0.19374391,0.007202891,6.742466,-96.76988,-168.10051,-205.08267,1.5551095,-1.6026022,67.93953,125000
7
+ 166.5464,0.19563828,0.005621531,8.509864,-93.04726,-166.5781,-205.50827,1.1672877,-0.9607878,76.76318,130000
8
+ 166.74307,0.17378657,0.006387247,7.1664047,-50.24512,-166.75803,-204.93959,0.76640326,-0.6341237,71.68039,135000
9
+ 166.6372,0.18906733,0.0065080486,7.3975067,-66.13559,-166.97327,-206.3076,0.6904578,-0.7056025,71.36244,140000
10
+ 166.85966,0.18073499,0.006719387,6.3656893,-99.785194,-166.71233,-206.48392,7.013233,-7.8439493,148.12427,145000
11
+ 166.17963,0.20729432,0.005079087,9.659443,-88.73269,-166.27373,-206.91754,0.56020427,-0.83641684,79.49196,150000
12
+ 165.34685,0.20561716,0.0067161703,8.543812,-44.281883,-165.59138,-205.81795,1.3302803,-1.3829083,97.52431,155000
13
+ 163.94308,0.21787202,0.0069280206,7.521175,-60.326332,-164.50148,-206.91759,1.4113789,-1.4440593,82.18639,160000
14
+ 164.86636,0.17405638,0.0058633066,7.365646,-77.90503,-164.5954,-206.43721,1.0911732,-0.5000456,70.99501,165000
15
+ 159.11969,0.18866064,0.006610118,10.405631,-47.078773,-159.22746,-205.77167,1.829257,-2.45594,115.98605,170000
16
+ 163.75331,0.18817297,0.0067227012,9.4044485,-44.88467,-163.5277,-206.50441,0.9992245,-0.8565229,80.21806,175000
17
+ 163.07016,0.17400765,0.0056139273,7.7165427,-89.98117,-163.53116,-206.34828,0.61332476,-0.9117926,83.88816,180000
18
+ 161.94952,0.17026816,0.0062036025,8.116173,-68.62124,-161.84923,-205.81209,0.5785081,-0.6366843,74.3481,185000
19
+ 160.6735,0.18766049,0.00744603,6.353201,-25.06006,-160.50224,-206.77081,1.9802917,-2.1133678,90.35126,190000
20
+ 158.23639,0.15247436,0.0063208584,6.964598,-12.33769,-158.50166,-205.68327,0.6933593,-0.6916895,60.824055,195000
21
+ 156.27238,0.17519215,0.0067133605,10.779881,-31.722887,-155.8781,-205.82666,15.378744,-16.81961,277.5628,200000
22
+ 158.63504,0.19566041,0.0074162907,7.8488183,-52.798462,-159.1885,-206.42793,0.76031506,-0.5136889,66.516335,205000
23
+ 156.99013,0.17775333,0.0064749736,8.407059,-44.420174,-156.77927,-206.96283,0.8568773,-0.9689222,86.82034,210000
24
+ 154.83827,0.16183841,0.0076118507,7.608043,1.6605824,-155.00995,-206.22096,0.9419573,-1.0868781,77.26083,215000
25
+ 154.38905,0.17617625,0.006247711,9.952843,-36.3563,-154.70604,-205.66072,1.2745763,-1.3791659,94.39198,220000
26
+ 156.08891,0.20951201,0.008045672,5.424497,-19.197014,-155.94826,-206.44539,1.0179567,-0.9485631,66.62096,225000
27
+ 152.78012,0.16920249,0.0062982365,7.4996657,-29.1067,-153.15428,-206.78116,1.3159482,-1.334151,79.85596,230000
28
+ 151.4758,0.18569055,0.007306645,9.70651,2.2225487,-152.2435,-206.66393,2.494657,-2.3951373,114.173256,235000
29
+ 147.49304,0.21323606,0.0067745815,6.4634295,-45.2182,-148.23262,-205.96294,0.981453,-0.97025824,70.38358,240000
30
+ 151.94766,0.17840144,0.0075463173,8.088499,-30.566624,-152.2557,-206.0048,1.5482494,-0.7557701,77.22226,245000
31
+ 147.03555,0.19981742,0.006065391,6.650284,-6.035357,-147.28279,-206.94173,0.6972202,-0.9527101,73.369576,250000
32
+ 146.29326,0.16906586,0.007982335,7.9737396,-5.8075724,-146.98903,-207.14362,2.1590302,-1.7333362,98.75754,255000
33
+ 148.94885,0.19283384,0.0073309676,6.470512,-23.270819,-148.91365,-206.22253,1.2497947,-0.97256464,72.69933,260000
34
+ 144.72977,0.18187001,0.0073369606,11.183514,-1.155612,-145.28871,-206.17592,0.7613717,-0.8631334,81.84578,265000
35
+ 145.48438,0.18519565,0.0062072407,8.774543,-13.601801,-146.09267,-208.34697,0.8630998,-0.86108655,71.16887,270000
36
+ 148.03642,0.21036658,0.007136873,7.040549,-29.635118,-147.86443,-206.07816,1.0923246,-1.1224921,72.76837,275000
37
+ 146.32558,0.18033716,0.005982998,8.836471,2.6608799,-146.89323,-206.76927,3.9294307,-3.9761124,95.1454,280000
38
+ 142.91388,0.18972206,0.007756878,5.3909545,-10.443463,-143.14188,-206.70886,1.0673277,-1.0787406,68.59964,285000
39
+ 142.78514,0.16356176,0.008048165,9.379755,-26.021898,-143.66222,-206.86331,1.5797837,-1.3398582,97.0882,290000
40
+ 144.18135,0.17861168,0.007491418,8.012003,-4.4531703,-144.1055,-206.52899,1.5188723,-1.5138438,77.4846,295000
41
+ 143.2969,0.20481169,0.008429656,6.07559,-10.642406,-143.74448,-207.38278,0.84008896,-0.8546343,68.82912,300000
42
+ 141.90186,0.16033593,0.0059093037,5.9377527,-6.3765426,-142.53456,-206.47383,1.2694974,-1.3443509,73.80471,305000
43
+ 140.3665,0.16564643,0.008206978,7.568438,-18.62672,-140.3671,-206.08751,1.0662369,-1.0767798,88.83289,310000
44
+ 142.09285,0.1659788,0.007707567,10.117618,-10.6708,-142.1759,-207.16382,2.0725381,-1.812202,95.91617,315000
45
+ 139.95119,0.16143797,0.00683396,8.789693,-11.989407,-140.10677,-206.10672,1.3851298,-1.2626438,85.89223,320000
46
+ 136.67232,0.18466502,0.0074616023,9.425267,-10.429409,-136.63457,-205.65352,2.3044367,-2.1029897,108.597824,325000
47
+ 139.35927,0.20021755,0.008027626,6.7536607,-14.795733,-139.28845,-208.64197,0.98190236,-0.9411231,76.56332,330000
48
+ 138.55115,0.17118013,0.0063351044,5.5394306,-14.277614,-138.39743,-206.40433,3.6484606,-2.434829,72.00805,335000
49
+ 137.33824,0.18192746,0.0062597846,5.342087,1.8706388,-137.53511,-206.50905,0.9245131,-1.0123506,83.54138,340000
50
+ 139.0793,0.1848338,0.007351497,8.179608,-5.207801,-139.67552,-205.5466,1.333427,-0.86655194,76.48338,345000
51
+ 128.3735,0.1796968,0.0070594847,12.247507,-6.0065517,-128.841,-208.78543,2.6052685,-1.5861846,101.34641,350000
52
+ 141.19482,0.17602775,0.008147542,6.362179,-6.2299647,-142.0682,-208.96477,1.0425229,-0.93115,67.09405,355000
53
+ 136.1879,0.2051761,0.0071761105,9.735938,1.3996044,-136.97746,-205.51555,0.9840314,-1.8309411,86.27194,360000
54
+ 137.49907,0.17588153,0.007344768,5.59571,-22.756165,-137.83142,-206.64748,1.3585284,-1.3916738,68.95637,365000
55
+ 136.87233,0.17739311,0.006796496,6.238601,-14.863088,-137.18018,-205.36304,2.0899448,-2.3912437,106.574875,370000
56
+ 130.977,0.1902206,0.008613426,8.625649,-2.899521,-131.1317,-207.09421,1.2342834,-1.1851927,89.53218,375000
57
+ 133.28494,0.18393755,0.009118933,6.2765994,-1.8302927,-134.14232,-206.487,2.1198874,-2.0513363,91.72352,380000
58
+ 130.60258,0.16541028,0.007889809,5.1797004,-10.091493,-131.86226,-206.40796,1.7279665,-1.1581593,74.531204,385000
59
+ 128.24393,0.15922618,0.0071567404,9.754177,-9.080371,-128.99095,-208.31445,0.93972504,-0.9569409,86.97763,390000
60
+ 128.90193,0.16625214,0.007382805,8.647094,2.1610925,-129.38737,-206.00694,4.5666046,-5.0987144,128.72467,395000
61
+ 135.62279,0.1445878,0.00767932,7.0351763,0.5494194,-135.4263,-206.41792,1.3773159,-1.5316556,71.32526,400000
62
+ 131.56271,0.17303348,0.007859079,8.0727415,-2.488693,-132.63094,-206.77599,1.6989218,-1.4858683,96.86947,405000
63
+ 128.0134,0.16459425,0.006940962,5.316918,-3.9886737,-128.53572,-206.6262,2.5825028,-2.5795941,72.312744,410000
64
+ 128.7348,0.19685663,0.0064651417,4.7107363,-0.4697784,-128.94424,-205.43286,0.95871913,-0.96215534,67.11398,415000
65
+ 130.60416,0.16490093,0.008074075,6.933126,-0.32970625,-131.34515,-205.92598,1.1734091,-1.2569215,70.03881,420000
66
+ 128.78223,0.18530758,0.006585499,6.5972443,-3.5288134,-129.1845,-206.02101,1.393192,-1.3716276,77.95216,425000
67
+ 126.042755,0.20583215,0.0076041333,5.129434,-16.48037,-126.184265,-205.78636,1.481667,-1.5007421,71.87279,430000
68
+ 128.91081,0.16685365,0.0081781,6.4570346,6.2812867,-129.16763,-206.42761,1.6147461,-1.8175046,95.39056,435000
69
+ 129.843,0.19702086,0.00647768,7.91386,-6.440866,-130.07437,-205.21628,1.86248,-1.3439138,105.48244,440000
70
+ 134.47449,0.16819046,0.007918379,6.4390335,-9.009464,-135.63834,-205.63628,1.2989765,-0.9598222,76.34581,445000
71
+ 120.78238,0.16124439,0.008011321,5.213465,-4.4561105,-121.09501,-205.4993,2.2102125,-2.1412358,72.354355,450000
72
+ 129.32608,0.16403216,0.006540787,5.4983726,-1.8250384,-129.40652,-205.61757,0.85649663,-0.95740795,60.905594,455000
73
+ 123.35592,0.19912824,0.0061948844,4.9346747,-2.7656236,-123.891495,-203.82954,0.711717,-0.9721967,60.907852,460000
74
+ 128.76097,0.17102051,0.0071913037,6.949721,-4.2728677,-129.377,-207.45792,0.9348949,-1.1507661,67.40925,465000
75
+ 126.36452,0.16768114,0.008505501,6.7580767,-1.5945193,-126.5169,-207.26532,0.92392313,-1.2034451,75.088135,470000
76
+ 123.19831,0.16238818,0.0072487947,7.732679,1.5296301,-124.48549,-205.95447,1.538346,-1.1151538,93.29498,475000
77
+ 124.65933,0.16884959,0.0068334127,7.8628373,-4.225449,-125.290726,-206.28015,1.6040239,-1.4948745,112.16365,480000
78
+ 125.65905,0.13786928,0.006195744,5.581975,2.37257,-126.34688,-205.18672,0.91230965,-0.89154774,72.81787,485000
79
+ 128.69356,0.17004785,0.00793877,6.062862,-2.1094599,-129.02336,-206.22798,2.8397713,-3.1757445,109.75796,490000
80
+ 125.74614,0.16022219,0.007102709,7.2238297,2.3845646,-126.99214,-206.37772,0.8479984,-1.0374699,68.55626,495000
81
+ 120.099335,0.14688605,0.0058261943,6.2558866,-2.9229774,-120.7476,-206.8186,0.6332418,-0.6682107,53.365814,500000
82
+ 125.9198,0.1828177,0.00619709,5.4703093,2.660671,-126.4475,-207.645,1.5038699,-0.96893364,71.80914,505000
83
+ 129.78273,0.19624226,0.0070684124,6.105505,-6.7256465,-129.93819,-205.47493,1.0892931,-1.0320286,82.10678,510000
84
+ 123.67054,0.16573784,0.008028347,6.3732266,-1.8154807,-123.99491,-206.53903,0.9027804,-0.7386992,64.92002,515000
85
+ 124.69497,0.16809386,0.007857343,6.458307,-4.4270134,-125.66161,-208.81415,5.671386,-6.3832283,141.8532,520000
86
+ 119.915245,0.15855086,0.007855251,8.984485,-5.7908792,-120.821045,-207.70482,1.6197314,-1.547155,114.31679,525000
87
+ 119.972824,0.18677655,0.0058567575,7.368203,4.2591844,-120.47227,-206.89934,1.4433677,-1.4354756,72.31756,530000
88
+ 121.36884,0.19349036,0.006261016,8.673092,-5.783006,-121.95227,-205.99469,1.7397449,-1.5402676,99.24326,535000
89
+ 118.66977,0.15409777,0.0064587127,6.922184,-3.0481927,-119.37325,-207.90236,1.964745,-2.2784834,115.43329,540000
90
+ 125.055046,0.18204316,0.006504793,4.317791,-4.225568,-125.9175,-206.24545,0.9811372,-1.0443765,63.738922,545000
91
+ 116.697136,0.14854501,0.0065281503,6.8946533,-3.1851313,-117.6181,-205.59828,0.7752272,-0.83128864,81.660706,550000
92
+ 122.2359,0.17779335,0.0063771554,4.260939,-4.072661,-122.74955,-205.43623,0.6868709,-0.9449014,46.488945,555000
93
+ 117.77301,0.1546013,0.006839685,4.6886954,0.5398868,-118.70988,-205.98552,1.608045,-1.6602875,70.31387,560000
94
+ 121.37623,0.17227824,0.0072939782,6.018552,-5.249189,-121.63273,-205.70364,1.0832206,-1.1368798,71.503,565000
95
+ 117.4453,0.15827319,0.0066221277,5.13947,-1.5730124,-117.985306,-205.27672,0.9608782,-0.93175024,55.85295,570000
96
+ 121.91157,0.17913774,0.006647667,6.6887345,-1.7272011,-122.758385,-205.83427,0.9667392,-0.979988,74.90047,575000
97
+ 115.88664,0.14975587,0.0075136735,7.6345935,0.47374815,-116.734825,-206.4812,0.6163561,-0.6725199,66.7888,580000
98
+ 121.62561,0.1758306,0.0073668663,7.580495,3.0248332,-122.32151,-206.1131,3.6969879,-3.1692827,127.265,585000
99
+ 116.766174,0.17129938,0.006323202,7.2183976,-0.9948119,-117.08543,-205.74246,0.9726885,-1.1822499,94.52745,590000
100
+ 109.61898,0.13844872,0.0071428907,6.1544733,-3.0178797,-110.118095,-206.10524,1.1577383,-1.2149646,76.931046,595000
101
+ 108.46011,0.17863686,0.0067828363,4.6912613,-2.2519913,-109.35579,-206.15337,0.71140885,-0.7565845,55.287464,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b333389558f76787219d935dde4333da8f9efcb8e83eedc939ce0df6f6b9b2a2
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:159e41a3258f1d20e4af5818af1f2b88e06851f4fecdcc4a7f7ee6f7717a9a61
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab9e1599fd13d96433b45d52cd17d6dd1290fd8a274d6b171095d936305bcd22
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37d0bc3af1714fcd864206f3d4738135383f8b3c51225d24761d9ac3f66195d9
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fc47083599d9512be49fb55d3fa1a8fc760d86ab1c869b61271ed4b0e37def7
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d54d5afcb93d67e3e4da214120cdc3f23927c5d7df9f371299d5069c27451fb9
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0ecd96ff7c8efad160b32bbcee6bbee21afe031edddf79f4494155e77ef5778
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12cf46f6d45028b17fe208b07f9a1b342b120e2e97eb3b1abd37f6d28997eba1
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:498bfe6f317b3f2d592f8dca2cd053d011d2c3c43b39294f62158d89ba56ea00
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ae9c61e2805ff54bf5a72346d441372b808943ac1b15366a7ae19f0ae556411
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260318_110630/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/dwmdpsyj