Tiredsheep commited on
Commit
2831946
·
verified ·
1 Parent(s): 13b12a8

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1000000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1050000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1100000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1150000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1200000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1250000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1300000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_850000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_900000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_950000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.02107627084199197,-0.004675492368147307,-0.021309391521087743,-0.004221191436439539,34.699158553374694,10.476999999999498,0.9,5041.84,-0.16,-300.3,207.54,0.6580933856964112,850000
3
+ 0.0,0.0,-0.04921792567813937,7.399888900830755e-05,-0.049245046610473964,-0.000639689417890807,32.99950456622831,9.57599999999965,0.94,15808.04,-0.08,-267.28,189.52,0.6001264667510986,900000
4
+ 0.0,0.0,-0.06833937992334083,-0.0024387624703611664,-0.0685028220353917,-0.0022007525834053365,34.81228741919733,7.459999999999582,1.0,24640.24,0.0,-208.44,147.2,0.4844835805892944,950000
5
+ 0.0,0.0,-0.03668442227696203,0.010190318383377143,-0.0355876812794475,0.019421567625957703,35.68056489886779,6.961999999999655,1.0,31904.32,0.0,-192.3,137.24,0.4453004026412964,1000000
6
+ 0.0,0.0,-0.05153750933476707,0.010671181127148502,-0.050740977678442746,0.007537259015766066,35.70684506522962,6.4139999999995645,1.0,38988.84,0.0,-172.0,126.28,0.4103929662704468,1050000
7
+ 0.0,0.0,-0.04969128744642682,0.018741234927554137,-0.04842071349495502,0.006808841006438723,35.678826703028264,5.587999999999614,1.0,44995.72,0.0,-151.94,109.76,0.35749550342559816,1100000
8
+ 0.0,0.0,-0.058657392687681664,0.03382875370975367,-0.0568640195532,0.025316209744802462,35.28384654773997,5.678999999999597,0.98,50931.24,-0.02,-148.18,111.58,0.36297250270843506,1150000
9
+ 0.0,0.0,-0.054116872329740065,0.047434332673411884,-0.05167478505239372,0.038494251436910085,35.50707765485937,5.245999999999674,1.0,56423.16,0.0,-143.64,102.92,0.33424689292907717,1200000
10
+ 0.0,0.0,-0.06508318934126844,0.07331873402384874,-0.0616814506880217,0.05520115932037156,35.77393719843283,4.583999999999716,1.0,61394.62,0.0,-122.14,89.68,0.2923939371109009,1250000
11
+ 0.0,0.0,-0.07541865845288216,0.06651926379704681,-0.07202787500800799,0.058866741964176954,35.42919082789601,4.662999999999722,1.0,66075.86,0.0,-126.16,91.26,0.30060941696166993,1300000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.02107627084199197,-0.004675492368147307,-0.021309391521087743,-0.004221191436439539,34.699158553374694,10.476999999999498,0.9,5041.84,-0.16,-300.3,207.54,0.6580933856964112,850000
3
+ 0.0,0.0,-0.04921792567813937,7.399888900830755e-05,-0.049245046610473964,-0.000639689417890807,32.99950456622831,9.57599999999965,0.94,15808.04,-0.08,-267.28,189.52,0.6001264667510986,900000
4
+ 0.0,0.0,-0.06833937992334083,-0.0024387624703611664,-0.0685028220353917,-0.0022007525834053365,34.81228741919733,7.459999999999582,1.0,24640.24,0.0,-208.44,147.2,0.4844835805892944,950000
5
+ 0.0,0.0,-0.03668442227696203,0.010190318383377143,-0.0355876812794475,0.019421567625957703,35.68056489886779,6.961999999999655,1.0,31904.32,0.0,-192.3,137.24,0.4453004026412964,1000000
6
+ 0.0,0.0,-0.05153750933476707,0.010671181127148502,-0.050740977678442746,0.007537259015766066,35.70684506522962,6.4139999999995645,1.0,38988.84,0.0,-172.0,126.28,0.4103929662704468,1050000
7
+ 0.0,0.0,-0.04969128744642682,0.018741234927554137,-0.04842071349495502,0.006808841006438723,35.678826703028264,5.587999999999614,1.0,44995.72,0.0,-151.94,109.76,0.35749550342559816,1100000
8
+ 0.0,0.0,-0.058657392687681664,0.03382875370975367,-0.0568640195532,0.025316209744802462,35.28384654773997,5.678999999999597,0.98,50931.24,-0.02,-148.18,111.58,0.36297250270843506,1150000
9
+ 0.0,0.0,-0.054116872329740065,0.047434332673411884,-0.05167478505239372,0.038494251436910085,35.50707765485937,5.245999999999674,1.0,56423.16,0.0,-143.64,102.92,0.33424689292907717,1200000
10
+ 0.0,0.0,-0.06508318934126844,0.07331873402384874,-0.0616814506880217,0.05520115932037156,35.77393719843283,4.583999999999716,1.0,61394.62,0.0,-122.14,89.68,0.2923939371109009,1250000
11
+ 0.0,0.0,-0.07541865845288216,0.06651926379704681,-0.07202787500800799,0.058866741964176954,35.42919082789601,4.662999999999722,1.0,66075.86,0.0,-126.16,91.26,0.30060941696166993,1300000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 165.94916,0.19220218,0.008821499,8.290423,-51.291126,-165.52391,-203.88777,2.6303725,-2.8633673,69.38124,805000
3
+ 160.52025,0.19856778,0.0075184917,5.6842246,-31.582855,-160.24405,-203.67157,1.0538582,-0.8785346,59.47021,810000
4
+ 159.94086,0.19715247,0.006898749,4.2486653,-42.350197,-160.32104,-203.56375,1.2570997,-1.3855804,62.890934,815000
5
+ 154.44083,0.16816002,0.008057651,6.31364,-33.507942,-155.21086,-204.39262,0.75263095,-0.7328983,52.542034,820000
6
+ 154.58711,0.16861342,0.00849723,5.9834924,-49.36386,-154.62512,-206.64568,0.91326153,-1.1097666,56.140114,825000
7
+ 150.42992,0.17648949,0.0067119855,8.786559,-29.69646,-151.27698,-204.0968,1.1677624,-1.3498764,80.08734,830000
8
+ 148.58722,0.18318821,0.009992071,7.331376,-26.944452,-149.10797,-203.99857,2.9292023,-3.0595114,83.68346,835000
9
+ 148.27496,0.18606454,0.008475147,6.14106,-33.39048,-149.38486,-204.77693,2.460623,-1.3962342,63.72415,840000
10
+ 146.26338,0.17207545,0.008946105,6.560231,-12.627028,-146.99345,-205.06725,0.9414781,-1.02624,59.209534,845000
11
+ 147.68811,0.17911208,0.0078436695,6.5400386,-35.449913,-147.98929,-205.04051,1.5505333,-1.3992028,63.25874,850000
12
+ 144.42937,0.18734269,0.007139745,5.6427684,-23.260338,-144.94595,-204.84871,0.7009237,-0.95371246,59.82173,855000
13
+ 141.38696,0.18870589,0.008889404,7.299225,-8.418949,-141.90779,-204.16833,1.6422588,-1.7173201,67.30147,860000
14
+ 142.54419,0.18281195,0.007416223,5.66791,-11.800163,-142.87486,-204.07089,1.1755475,-1.3799818,56.882973,865000
15
+ 138.68076,0.16002369,0.008880051,7.9106965,-9.667673,-139.04816,-205.47841,1.1198872,-1.0530244,74.9519,870000
16
+ 141.76353,0.1584831,0.009295257,8.211008,-28.120613,-142.23468,-206.26633,1.4573519,-1.5022671,92.48317,875000
17
+ 143.27043,0.16749263,0.008582355,5.9484186,-20.66303,-143.96284,-204.41641,2.3222246,-1.5330964,65.36554,880000
18
+ 141.58824,0.14298585,0.0076311743,5.9809666,1.9390942,-141.43596,-204.70366,2.5973742,-2.022761,78.48702,885000
19
+ 138.4323,0.17972443,0.0076904627,5.5925937,-23.839842,-139.08995,-206.69687,1.9034648,-1.8803254,72.58455,890000
20
+ 136.64816,0.15509908,0.008405525,8.01037,-4.9891725,-137.04565,-206.13745,1.388764,-1.1958457,74.49407,895000
21
+ 132.11246,0.20538938,0.008152055,6.0635924,-6.901685,-132.155,-207.38654,1.1667148,-1.3091934,68.97876,900000
22
+ 138.37624,0.17612407,0.0075702583,7.0116158,-7.917455,-139.36546,-206.06708,1.0769546,-1.2226399,71.19027,905000
23
+ 137.02834,0.16055012,0.008188193,5.512173,-21.541021,-137.53276,-205.18375,0.80734485,-1.0013565,58.816277,910000
24
+ 132.19661,0.20128673,0.009361631,8.0400305,0.85599923,-132.88797,-205.39253,2.2543619,-2.0640929,66.83952,915000
25
+ 132.52579,0.1715476,0.008822063,6.818364,-13.177557,-132.8474,-204.78217,1.6692353,-1.7582146,75.51861,920000
26
+ 137.21483,0.1808653,0.009060419,5.5434847,0.20207012,-136.93262,-204.72025,0.9896584,-0.9270447,70.398254,925000
27
+ 133.43236,0.16784263,0.0075010336,5.1997313,-3.6481256,-134.01646,-204.94348,0.787507,-0.72132224,57.982323,930000
28
+ 133.58086,0.18745762,0.010384915,6.1551337,5.037883,-134.72627,-205.41478,0.848086,-0.9285534,69.02502,935000
29
+ 128.7546,0.21316627,0.008468054,7.244269,-1.8419669,-130.16911,-204.83783,0.85187715,-0.80148154,55.28707,940000
30
+ 133.84161,0.1746731,0.008895,8.031392,-9.2382345,-134.29881,-204.9968,1.5049014,-1.5168611,94.661705,945000
31
+ 131.3171,0.19351244,0.007923281,4.9794335,-8.3188505,-132.24565,-205.88187,1.3856635,-1.5825607,53.995758,950000
32
+ 128.87009,0.17320783,0.008050034,8.19686,-2.2962713,-129.89714,-205.74829,0.9209784,-0.88482463,65.22101,955000
33
+ 130.01006,0.16688453,0.008108795,5.927852,-1.304389,-130.79256,-205.22359,1.2780644,-1.2972044,68.4635,960000
34
+ 129.21565,0.17989913,0.008367352,6.61328,0.38355362,-129.89671,-206.61165,0.68854535,-0.77945,56.576866,965000
35
+ 129.43326,0.17595664,0.0077537056,5.131687,-12.129506,-130.65018,-205.87715,0.4552427,-0.6557572,52.63449,970000
36
+ 130.53914,0.16437648,0.0077765295,5.966896,-2.2695227,-131.0007,-206.43019,0.9019813,-0.77989453,64.90492,975000
37
+ 129.33366,0.16875283,0.008251767,6.935899,1.7221506,-129.16766,-204.90408,1.0542189,-0.976832,64.396034,980000
38
+ 128.42839,0.16862388,0.0086214775,5.582151,1.0114627,-128.80981,-204.33093,1.5552778,-1.5707273,71.00809,985000
39
+ 123.75526,0.16982205,0.008266096,8.275441,-9.416346,-125.0412,-205.40904,0.94350266,-0.8645546,79.87608,990000
40
+ 126.13797,0.19981635,0.0077267266,5.7712836,3.7804542,-126.27317,-205.66545,5.567564,-4.9492655,93.988106,995000
41
+ 126.23371,0.14680552,0.009841313,5.4862947,0.38236427,-127.51829,-205.78638,1.5208943,-1.7703196,78.04884,1000000
42
+ 125.632065,0.15910974,0.0074706483,3.935521,4.68182,-126.39123,-205.58195,1.2994448,-1.0586004,59.846237,1005000
43
+ 124.701294,0.15596262,0.0075536403,6.9752045,2.8827085,-125.19933,-205.28671,0.9178224,-0.9600866,75.05773,1010000
44
+ 124.59049,0.17020847,0.009268334,6.364027,-0.92835236,-125.301285,-204.8009,1.3286438,-1.9681666,57.431393,1015000
45
+ 122.7424,0.18389456,0.008207897,6.305149,-6.3268948,-123.41054,-205.1389,0.6193223,-1.2298428,58.79794,1020000
46
+ 119.69115,0.18841374,0.0069601946,4.8886604,-2.9194465,-119.90188,-204.34747,1.1042267,-1.2867147,63.666275,1025000
47
+ 124.48084,0.1783503,0.0079333605,7.187286,-4.2016344,-124.86397,-204.44522,1.2179314,-1.0788733,75.68309,1030000
48
+ 120.356125,0.20006987,0.006095456,4.8867984,0.8985565,-120.51287,-205.53253,2.6143894,-2.2040935,62.552704,1035000
49
+ 121.08256,0.12956718,0.006904505,4.481767,2.0317664,-121.9201,-205.97516,1.0905318,-1.4351697,48.877197,1040000
50
+ 122.40426,0.17467004,0.007995511,6.1667953,-1.1883826,-123.31875,-205.34535,1.4863515,-1.3650583,56.77739,1045000
51
+ 114.53068,0.16160415,0.008101795,6.9494295,-3.3645456,-114.71812,-205.4817,0.8303708,-0.9407321,61.63012,1050000
52
+ 125.163,0.15524259,0.008071062,6.491343,-2.441509,-126.63867,-205.71558,0.9849137,-0.84998775,58.238808,1055000
53
+ 119.69333,0.17897147,0.010116518,8.138878,2.466087,-120.08333,-204.98666,1.693157,-1.7550731,73.51575,1060000
54
+ 122.033356,0.17476612,0.00786695,4.456556,0.14240876,-122.57871,-205.41997,0.96973187,-1.1816943,58.221767,1065000
55
+ 121.66176,0.19518714,0.007882548,5.6166534,-1.1929069,-122.298485,-205.07585,1.2549472,-1.1040386,55.80753,1070000
56
+ 117.19871,0.18059072,0.0066429484,5.9698696,1.058733,-117.42305,-204.83601,0.91558266,-0.8436406,53.223198,1075000
57
+ 121.72849,0.18207695,0.008072308,4.9727554,-3.815113,-123.036156,-204.60371,0.68673116,-0.9627115,64.95997,1080000
58
+ 118.64969,0.17189474,0.00850601,5.382267,4.0475154,-119.57841,-203.54228,0.8728439,-0.7976788,67.979904,1085000
59
+ 112.393425,0.14399691,0.008110014,6.6636214,0.75730586,-113.027855,-205.079,1.4320526,-1.4338815,74.77426,1090000
60
+ 115.21315,0.15417504,0.0068928604,5.398086,2.4884572,-116.06714,-204.09023,0.86733747,-0.8557687,50.790577,1095000
61
+ 116.7748,0.15896212,0.0064311624,6.023456,-0.7718896,-117.44509,-202.07509,0.7582587,-1.1629001,58.292175,1100000
62
+ 119.79914,0.17963345,0.008173429,4.306043,-1.3562726,-120.66416,-204.1364,0.87339026,-0.868292,50.615417,1105000
63
+ 117.08939,0.15317449,0.0087725455,7.4945946,-5.2351265,-117.55602,-205.18793,2.1818352,-2.2626808,63.753014,1110000
64
+ 116.12992,0.13636452,0.006904235,4.786905,2.8200214,-116.61489,-204.73573,0.94186765,-1.202125,50.606476,1115000
65
+ 115.90089,0.16965127,0.008496835,6.3898034,-0.33103627,-117.20083,-204.1852,1.3468211,-1.1753488,57.836517,1120000
66
+ 114.34761,0.19101258,0.0065548145,5.099271,-4.1653533,-115.46417,-204.53168,1.9140246,-1.9413083,56.049294,1125000
67
+ 116.341896,0.15376127,0.009542024,5.2838316,-4.629658,-116.79921,-199.9816,1.4185113,-1.4834372,69.70612,1130000
68
+ 116.65713,0.18474166,0.009406144,4.1285787,-0.80077195,-117.24761,-205.73653,1.2632558,-1.0932206,56.572372,1135000
69
+ 115.69002,0.18634446,0.0061526573,4.4752917,-2.0819263,-116.05088,-203.83507,0.83858746,-1.0862011,48.37677,1140000
70
+ 120.51609,0.173125,0.007760384,5.9965544,-1.246038,-121.694336,-204.88474,0.9719372,-0.8747356,52.604397,1145000
71
+ 110.144714,0.15462843,0.0074116704,6.192411,1.8371814,-110.88789,-205.47575,2.9704707,-3.156738,64.7457,1150000
72
+ 116.20422,0.17361496,0.007388244,6.6262984,3.8823435,-116.71743,-202.99893,0.96476406,-1.0391184,54.359806,1155000
73
+ 107.868484,0.18206777,0.0077585587,6.3598704,-3.274007,-108.44663,-203.37044,1.0767595,-1.100951,62.154808,1160000
74
+ 115.04954,0.18631339,0.008828803,5.604893,-2.765142,-115.36436,-203.68132,1.41614,-1.2496438,52.14547,1165000
75
+ 114.38623,0.1322573,0.007296554,7.019756,-1.6835718,-115.085655,-203.1055,1.8529601,-1.6374226,69.08356,1170000
76
+ 110.19382,0.13401252,0.00829246,5.221402,2.534111,-111.48042,-204.2084,0.94246817,-1.386095,54.879932,1175000
77
+ 111.4961,0.1710253,0.007463596,5.088102,0.12600261,-112.39446,-204.96445,1.0335574,-1.141461,61.663498,1180000
78
+ 113.9374,0.15945598,0.0076685273,6.6902328,-1.3366901,-114.80935,-206.33511,1.1537832,-1.0798306,62.557507,1185000
79
+ 115.794525,0.16188365,0.008815119,5.540385,-6.2568617,-115.77781,-203.98451,1.5125387,-1.3605133,62.530743,1190000
80
+ 113.34915,0.15848169,0.007472796,7.8162017,2.4646256,-114.41338,-203.9645,0.6216611,-0.8227062,62.624165,1195000
81
+ 110.26903,0.14777169,0.0066797724,4.520421,-2.836627,-110.97422,-200.28885,2.0973537,-2.288017,88.22222,1200000
82
+ 110.62465,0.14088058,0.006684949,4.752586,-1.9114203,-110.779884,-204.58266,1.0614887,-0.95672345,48.821808,1205000
83
+ 114.957886,0.16426066,0.007599554,6.364536,-1.6408579,-114.968704,-203.29164,1.7431694,-1.8149033,55.23766,1210000
84
+ 109.54023,0.17196585,0.007951109,6.1331134,4.156266,-110.60342,-201.9686,0.9479598,-0.9927247,61.73542,1215000
85
+ 112.6881,0.20435384,0.00997664,6.3727045,-0.2487312,-112.95233,-204.68027,0.942125,-0.8473665,66.80377,1220000
86
+ 108.26514,0.16816115,0.0071396474,8.0941305,0.08931691,-109.4306,-205.10344,1.231857,-1.3825514,92.324356,1225000
87
+ 108.41728,0.16194472,0.0069637466,4.4214754,-2.094327,-109.16477,-202.99193,0.7124436,-0.9245611,57.779507,1230000
88
+ 112.38797,0.18169802,0.007297529,5.1552773,-0.09032315,-112.83787,-204.37962,2.7747552,-3.0544617,92.36258,1235000
89
+ 105.50321,0.17684796,0.007988238,4.9505672,-5.319994,-106.076836,-205.89455,0.687777,-0.873466,59.829605,1240000
90
+ 111.42172,0.15093523,0.0075120195,4.883906,-3.505688,-112.37371,-202.62674,0.8096473,-0.91423005,48.873734,1245000
91
+ 107.45876,0.14982663,0.0066275736,5.6353793,6.1866417,-108.46757,-204.62291,3.431531,-3.3832383,64.15373,1250000
92
+ 107.624084,0.17485535,0.007557865,3.5827482,-3.215534,-108.4432,-205.70412,0.67623514,-0.83791107,44.987774,1255000
93
+ 106.940704,0.15981328,0.0067981067,5.5511703,10.077028,-107.44329,-206.15091,0.86434364,-0.7542088,54.14126,1260000
94
+ 108.88625,0.15048127,0.007554699,5.2630043,-1.1608475,-109.53536,-202.54436,0.953123,-0.9117453,61.267845,1265000
95
+ 105.68379,0.14430399,0.0073981285,5.836721,0.84424144,-106.40206,-203.31139,1.465935,-1.4168535,49.583805,1270000
96
+ 109.24959,0.19877642,0.008876696,4.7584662,1.9255707,-109.433044,-205.64334,1.2736892,-1.33052,60.573555,1275000
97
+ 107.65992,0.17859167,0.0074919723,5.3945427,2.2186937,-108.44796,-201.61934,1.5537128,-1.5533631,59.52887,1280000
98
+ 104.51854,0.16243227,0.006887507,12.036875,-1.6011493,-105.810295,-203.29726,1.5630424,-2.261839,91.22488,1285000
99
+ 104.80957,0.16135418,0.006165684,6.629422,-2.9380229,-105.241264,-204.68524,2.282403,-2.1268702,97.96749,1290000
100
+ 100.58086,0.17044768,0.006948799,5.5577416,-1.0663985,-101.45909,-203.55699,1.6017929,-1.5931822,71.03751,1295000
101
+ 100.46707,0.15911593,0.0067497515,4.331516,0.80087775,-101.52358,-203.13579,1.1351563,-1.0752224,52.208614,1300000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 165.94916,0.19220218,0.008821499,8.290423,-51.291126,-165.52391,-203.88777,2.6303725,-2.8633673,69.38124,805000
3
+ 160.52025,0.19856778,0.0075184917,5.6842246,-31.582855,-160.24405,-203.67157,1.0538582,-0.8785346,59.47021,810000
4
+ 159.94086,0.19715247,0.006898749,4.2486653,-42.350197,-160.32104,-203.56375,1.2570997,-1.3855804,62.890934,815000
5
+ 154.44083,0.16816002,0.008057651,6.31364,-33.507942,-155.21086,-204.39262,0.75263095,-0.7328983,52.542034,820000
6
+ 154.58711,0.16861342,0.00849723,5.9834924,-49.36386,-154.62512,-206.64568,0.91326153,-1.1097666,56.140114,825000
7
+ 150.42992,0.17648949,0.0067119855,8.786559,-29.69646,-151.27698,-204.0968,1.1677624,-1.3498764,80.08734,830000
8
+ 148.58722,0.18318821,0.009992071,7.331376,-26.944452,-149.10797,-203.99857,2.9292023,-3.0595114,83.68346,835000
9
+ 148.27496,0.18606454,0.008475147,6.14106,-33.39048,-149.38486,-204.77693,2.460623,-1.3962342,63.72415,840000
10
+ 146.26338,0.17207545,0.008946105,6.560231,-12.627028,-146.99345,-205.06725,0.9414781,-1.02624,59.209534,845000
11
+ 147.68811,0.17911208,0.0078436695,6.5400386,-35.449913,-147.98929,-205.04051,1.5505333,-1.3992028,63.25874,850000
12
+ 144.42937,0.18734269,0.007139745,5.6427684,-23.260338,-144.94595,-204.84871,0.7009237,-0.95371246,59.82173,855000
13
+ 141.38696,0.18870589,0.008889404,7.299225,-8.418949,-141.90779,-204.16833,1.6422588,-1.7173201,67.30147,860000
14
+ 142.54419,0.18281195,0.007416223,5.66791,-11.800163,-142.87486,-204.07089,1.1755475,-1.3799818,56.882973,865000
15
+ 138.68076,0.16002369,0.008880051,7.9106965,-9.667673,-139.04816,-205.47841,1.1198872,-1.0530244,74.9519,870000
16
+ 141.76353,0.1584831,0.009295257,8.211008,-28.120613,-142.23468,-206.26633,1.4573519,-1.5022671,92.48317,875000
17
+ 143.27043,0.16749263,0.008582355,5.9484186,-20.66303,-143.96284,-204.41641,2.3222246,-1.5330964,65.36554,880000
18
+ 141.58824,0.14298585,0.0076311743,5.9809666,1.9390942,-141.43596,-204.70366,2.5973742,-2.022761,78.48702,885000
19
+ 138.4323,0.17972443,0.0076904627,5.5925937,-23.839842,-139.08995,-206.69687,1.9034648,-1.8803254,72.58455,890000
20
+ 136.64816,0.15509908,0.008405525,8.01037,-4.9891725,-137.04565,-206.13745,1.388764,-1.1958457,74.49407,895000
21
+ 132.11246,0.20538938,0.008152055,6.0635924,-6.901685,-132.155,-207.38654,1.1667148,-1.3091934,68.97876,900000
22
+ 138.37624,0.17612407,0.0075702583,7.0116158,-7.917455,-139.36546,-206.06708,1.0769546,-1.2226399,71.19027,905000
23
+ 137.02834,0.16055012,0.008188193,5.512173,-21.541021,-137.53276,-205.18375,0.80734485,-1.0013565,58.816277,910000
24
+ 132.19661,0.20128673,0.009361631,8.0400305,0.85599923,-132.88797,-205.39253,2.2543619,-2.0640929,66.83952,915000
25
+ 132.52579,0.1715476,0.008822063,6.818364,-13.177557,-132.8474,-204.78217,1.6692353,-1.7582146,75.51861,920000
26
+ 137.21483,0.1808653,0.009060419,5.5434847,0.20207012,-136.93262,-204.72025,0.9896584,-0.9270447,70.398254,925000
27
+ 133.43236,0.16784263,0.0075010336,5.1997313,-3.6481256,-134.01646,-204.94348,0.787507,-0.72132224,57.982323,930000
28
+ 133.58086,0.18745762,0.010384915,6.1551337,5.037883,-134.72627,-205.41478,0.848086,-0.9285534,69.02502,935000
29
+ 128.7546,0.21316627,0.008468054,7.244269,-1.8419669,-130.16911,-204.83783,0.85187715,-0.80148154,55.28707,940000
30
+ 133.84161,0.1746731,0.008895,8.031392,-9.2382345,-134.29881,-204.9968,1.5049014,-1.5168611,94.661705,945000
31
+ 131.3171,0.19351244,0.007923281,4.9794335,-8.3188505,-132.24565,-205.88187,1.3856635,-1.5825607,53.995758,950000
32
+ 128.87009,0.17320783,0.008050034,8.19686,-2.2962713,-129.89714,-205.74829,0.9209784,-0.88482463,65.22101,955000
33
+ 130.01006,0.16688453,0.008108795,5.927852,-1.304389,-130.79256,-205.22359,1.2780644,-1.2972044,68.4635,960000
34
+ 129.21565,0.17989913,0.008367352,6.61328,0.38355362,-129.89671,-206.61165,0.68854535,-0.77945,56.576866,965000
35
+ 129.43326,0.17595664,0.0077537056,5.131687,-12.129506,-130.65018,-205.87715,0.4552427,-0.6557572,52.63449,970000
36
+ 130.53914,0.16437648,0.0077765295,5.966896,-2.2695227,-131.0007,-206.43019,0.9019813,-0.77989453,64.90492,975000
37
+ 129.33366,0.16875283,0.008251767,6.935899,1.7221506,-129.16766,-204.90408,1.0542189,-0.976832,64.396034,980000
38
+ 128.42839,0.16862388,0.0086214775,5.582151,1.0114627,-128.80981,-204.33093,1.5552778,-1.5707273,71.00809,985000
39
+ 123.75526,0.16982205,0.008266096,8.275441,-9.416346,-125.0412,-205.40904,0.94350266,-0.8645546,79.87608,990000
40
+ 126.13797,0.19981635,0.0077267266,5.7712836,3.7804542,-126.27317,-205.66545,5.567564,-4.9492655,93.988106,995000
41
+ 126.23371,0.14680552,0.009841313,5.4862947,0.38236427,-127.51829,-205.78638,1.5208943,-1.7703196,78.04884,1000000
42
+ 125.632065,0.15910974,0.0074706483,3.935521,4.68182,-126.39123,-205.58195,1.2994448,-1.0586004,59.846237,1005000
43
+ 124.701294,0.15596262,0.0075536403,6.9752045,2.8827085,-125.19933,-205.28671,0.9178224,-0.9600866,75.05773,1010000
44
+ 124.59049,0.17020847,0.009268334,6.364027,-0.92835236,-125.301285,-204.8009,1.3286438,-1.9681666,57.431393,1015000
45
+ 122.7424,0.18389456,0.008207897,6.305149,-6.3268948,-123.41054,-205.1389,0.6193223,-1.2298428,58.79794,1020000
46
+ 119.69115,0.18841374,0.0069601946,4.8886604,-2.9194465,-119.90188,-204.34747,1.1042267,-1.2867147,63.666275,1025000
47
+ 124.48084,0.1783503,0.0079333605,7.187286,-4.2016344,-124.86397,-204.44522,1.2179314,-1.0788733,75.68309,1030000
48
+ 120.356125,0.20006987,0.006095456,4.8867984,0.8985565,-120.51287,-205.53253,2.6143894,-2.2040935,62.552704,1035000
49
+ 121.08256,0.12956718,0.006904505,4.481767,2.0317664,-121.9201,-205.97516,1.0905318,-1.4351697,48.877197,1040000
50
+ 122.40426,0.17467004,0.007995511,6.1667953,-1.1883826,-123.31875,-205.34535,1.4863515,-1.3650583,56.77739,1045000
51
+ 114.53068,0.16160415,0.008101795,6.9494295,-3.3645456,-114.71812,-205.4817,0.8303708,-0.9407321,61.63012,1050000
52
+ 125.163,0.15524259,0.008071062,6.491343,-2.441509,-126.63867,-205.71558,0.9849137,-0.84998775,58.238808,1055000
53
+ 119.69333,0.17897147,0.010116518,8.138878,2.466087,-120.08333,-204.98666,1.693157,-1.7550731,73.51575,1060000
54
+ 122.033356,0.17476612,0.00786695,4.456556,0.14240876,-122.57871,-205.41997,0.96973187,-1.1816943,58.221767,1065000
55
+ 121.66176,0.19518714,0.007882548,5.6166534,-1.1929069,-122.298485,-205.07585,1.2549472,-1.1040386,55.80753,1070000
56
+ 117.19871,0.18059072,0.0066429484,5.9698696,1.058733,-117.42305,-204.83601,0.91558266,-0.8436406,53.223198,1075000
57
+ 121.72849,0.18207695,0.008072308,4.9727554,-3.815113,-123.036156,-204.60371,0.68673116,-0.9627115,64.95997,1080000
58
+ 118.64969,0.17189474,0.00850601,5.382267,4.0475154,-119.57841,-203.54228,0.8728439,-0.7976788,67.979904,1085000
59
+ 112.393425,0.14399691,0.008110014,6.6636214,0.75730586,-113.027855,-205.079,1.4320526,-1.4338815,74.77426,1090000
60
+ 115.21315,0.15417504,0.0068928604,5.398086,2.4884572,-116.06714,-204.09023,0.86733747,-0.8557687,50.790577,1095000
61
+ 116.7748,0.15896212,0.0064311624,6.023456,-0.7718896,-117.44509,-202.07509,0.7582587,-1.1629001,58.292175,1100000
62
+ 119.79914,0.17963345,0.008173429,4.306043,-1.3562726,-120.66416,-204.1364,0.87339026,-0.868292,50.615417,1105000
63
+ 117.08939,0.15317449,0.0087725455,7.4945946,-5.2351265,-117.55602,-205.18793,2.1818352,-2.2626808,63.753014,1110000
64
+ 116.12992,0.13636452,0.006904235,4.786905,2.8200214,-116.61489,-204.73573,0.94186765,-1.202125,50.606476,1115000
65
+ 115.90089,0.16965127,0.008496835,6.3898034,-0.33103627,-117.20083,-204.1852,1.3468211,-1.1753488,57.836517,1120000
66
+ 114.34761,0.19101258,0.0065548145,5.099271,-4.1653533,-115.46417,-204.53168,1.9140246,-1.9413083,56.049294,1125000
67
+ 116.341896,0.15376127,0.009542024,5.2838316,-4.629658,-116.79921,-199.9816,1.4185113,-1.4834372,69.70612,1130000
68
+ 116.65713,0.18474166,0.009406144,4.1285787,-0.80077195,-117.24761,-205.73653,1.2632558,-1.0932206,56.572372,1135000
69
+ 115.69002,0.18634446,0.0061526573,4.4752917,-2.0819263,-116.05088,-203.83507,0.83858746,-1.0862011,48.37677,1140000
70
+ 120.51609,0.173125,0.007760384,5.9965544,-1.246038,-121.694336,-204.88474,0.9719372,-0.8747356,52.604397,1145000
71
+ 110.144714,0.15462843,0.0074116704,6.192411,1.8371814,-110.88789,-205.47575,2.9704707,-3.156738,64.7457,1150000
72
+ 116.20422,0.17361496,0.007388244,6.6262984,3.8823435,-116.71743,-202.99893,0.96476406,-1.0391184,54.359806,1155000
73
+ 107.868484,0.18206777,0.0077585587,6.3598704,-3.274007,-108.44663,-203.37044,1.0767595,-1.100951,62.154808,1160000
74
+ 115.04954,0.18631339,0.008828803,5.604893,-2.765142,-115.36436,-203.68132,1.41614,-1.2496438,52.14547,1165000
75
+ 114.38623,0.1322573,0.007296554,7.019756,-1.6835718,-115.085655,-203.1055,1.8529601,-1.6374226,69.08356,1170000
76
+ 110.19382,0.13401252,0.00829246,5.221402,2.534111,-111.48042,-204.2084,0.94246817,-1.386095,54.879932,1175000
77
+ 111.4961,0.1710253,0.007463596,5.088102,0.12600261,-112.39446,-204.96445,1.0335574,-1.141461,61.663498,1180000
78
+ 113.9374,0.15945598,0.0076685273,6.6902328,-1.3366901,-114.80935,-206.33511,1.1537832,-1.0798306,62.557507,1185000
79
+ 115.794525,0.16188365,0.008815119,5.540385,-6.2568617,-115.77781,-203.98451,1.5125387,-1.3605133,62.530743,1190000
80
+ 113.34915,0.15848169,0.007472796,7.8162017,2.4646256,-114.41338,-203.9645,0.6216611,-0.8227062,62.624165,1195000
81
+ 110.26903,0.14777169,0.0066797724,4.520421,-2.836627,-110.97422,-200.28885,2.0973537,-2.288017,88.22222,1200000
82
+ 110.62465,0.14088058,0.006684949,4.752586,-1.9114203,-110.779884,-204.58266,1.0614887,-0.95672345,48.821808,1205000
83
+ 114.957886,0.16426066,0.007599554,6.364536,-1.6408579,-114.968704,-203.29164,1.7431694,-1.8149033,55.23766,1210000
84
+ 109.54023,0.17196585,0.007951109,6.1331134,4.156266,-110.60342,-201.9686,0.9479598,-0.9927247,61.73542,1215000
85
+ 112.6881,0.20435384,0.00997664,6.3727045,-0.2487312,-112.95233,-204.68027,0.942125,-0.8473665,66.80377,1220000
86
+ 108.26514,0.16816115,0.0071396474,8.0941305,0.08931691,-109.4306,-205.10344,1.231857,-1.3825514,92.324356,1225000
87
+ 108.41728,0.16194472,0.0069637466,4.4214754,-2.094327,-109.16477,-202.99193,0.7124436,-0.9245611,57.779507,1230000
88
+ 112.38797,0.18169802,0.007297529,5.1552773,-0.09032315,-112.83787,-204.37962,2.7747552,-3.0544617,92.36258,1235000
89
+ 105.50321,0.17684796,0.007988238,4.9505672,-5.319994,-106.076836,-205.89455,0.687777,-0.873466,59.829605,1240000
90
+ 111.42172,0.15093523,0.0075120195,4.883906,-3.505688,-112.37371,-202.62674,0.8096473,-0.91423005,48.873734,1245000
91
+ 107.45876,0.14982663,0.0066275736,5.6353793,6.1866417,-108.46757,-204.62291,3.431531,-3.3832383,64.15373,1250000
92
+ 107.624084,0.17485535,0.007557865,3.5827482,-3.215534,-108.4432,-205.70412,0.67623514,-0.83791107,44.987774,1255000
93
+ 106.940704,0.15981328,0.0067981067,5.5511703,10.077028,-107.44329,-206.15091,0.86434364,-0.7542088,54.14126,1260000
94
+ 108.88625,0.15048127,0.007554699,5.2630043,-1.1608475,-109.53536,-202.54436,0.953123,-0.9117453,61.267845,1265000
95
+ 105.68379,0.14430399,0.0073981285,5.836721,0.84424144,-106.40206,-203.31139,1.465935,-1.4168535,49.583805,1270000
96
+ 109.24959,0.19877642,0.008876696,4.7584662,1.9255707,-109.433044,-205.64334,1.2736892,-1.33052,60.573555,1275000
97
+ 107.65992,0.17859167,0.0074919723,5.3945427,2.2186937,-108.44796,-201.61934,1.5537128,-1.5533631,59.52887,1280000
98
+ 104.51854,0.16243227,0.006887507,12.036875,-1.6011493,-105.810295,-203.29726,1.5630424,-2.261839,91.22488,1285000
99
+ 104.80957,0.16135418,0.006165684,6.629422,-2.9380229,-105.241264,-204.68524,2.282403,-2.1268702,97.96749,1290000
100
+ 100.58086,0.17044768,0.006948799,5.5577416,-1.0663985,-101.45909,-203.55699,1.6017929,-1.5931822,71.03751,1295000
101
+ 100.46707,0.15911593,0.0067497515,4.331516,0.80087775,-101.52358,-203.13579,1.1351563,-1.0752224,52.208614,1300000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1000000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7833cce19b805c43389db797c1fd4a09bbb2226670b5dc74ae85bb343d1f6866
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1050000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85b56b27b618ee53cab97044dafdf305e9e22481c20dc190cfe3d16c733aa8c8
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1100000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:478c5dd8ddcd7a0776e0969cdd47c365baf70c35990acbc51aad5dd081ad24b5
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:679a87ed441c44148e02698ffb8c43f011cfa2482fcd3c1bacbc8b732c3f89ca
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a8bb6580aece907b67d146b4dd1ee7319b654b435d770260b5242a75a7cd370
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c90d324527d90e2bb84f309834eb1047e39e64d47c74985d1ae58ab75163de43
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_1300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8f6c5e9306e1ccbfc65209eb95ed81e819e411c65d31fc62553b03ff116de6e
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8d6d98ce88d8ee660a49e3f56803836c9d334ea3d473e633f5eef7f364a98c6
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:541db8e796ebeccf7b43ac151a1972f19fabda68e4deee0abece643c397ee56c
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/params_950000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e507de4622b8ac1d408dace1beee0a5b108d5758563bd0d42acc4173fc2311c
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_131529/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/lk315p2u