Tiredsheep commited on
Commit
50e278a
·
verified ·
1 Parent(s): c967bad

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1050000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1100000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1150000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1200000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1250000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1300000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1350000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1400000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1450000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1500000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.01486739938119046,-0.007423921492802676,-0.014823491189320857,-0.004815552470076898,35.111582112287905,8.710999999999752,1.0,4270.04,0.0,-241.04,172.22,0.5644462394714356,1050000
3
+ 0.0,0.0,-0.0303455207074162,0.005197132223327359,-0.03027222570636162,0.0004590901857191028,33.502480887522374,8.729999999999517,0.96,13552.14,-0.04,-244.94,172.6,0.5602327871322632,1100000
4
+ 0.0,0.0,-0.02543749708528784,0.008358332598337822,-0.025169425576195316,-0.0056659957702533716,35.50889108299261,6.9619999999995805,1.0,21340.52,0.0,-191.8,137.24,0.45554203510284424,1150000
5
+ 0.0,0.0,-0.03280233190957643,-0.002477716885651842,-0.032337943163637174,-0.001126092805777999,35.32180234667165,7.286999999999653,1.0,28504.8,0.0,-200.46,143.74,0.47033468723297117,1200000
6
+ 0.0,0.0,-0.028214466019529268,-0.0008682359294275169,-0.027581031359592733,-0.002664831360910472,35.45747368434129,6.282999999999532,0.98,35398.2,-0.02,-170.76,123.66,0.4080043601989746,1250000
7
+ 0.0,0.0,-0.023443167263652417,0.011831789767577892,-0.02237778653368213,0.007756937981092071,35.63972123040542,6.014999999999629,1.0,41930.4,0.0,-166.2,118.3,0.3918265438079834,1300000
8
+ 0.0,0.0,-0.03180874288769998,0.07202437446940343,-0.030197021088128984,0.02260723291022123,35.65422672294366,5.4779999999996685,1.0,47715.28,0.0,-147.26,107.56,0.3506324243545532,1350000
9
+ 0.0,0.0,-0.04375058829015286,0.03541982041985015,-0.041641109560134705,0.022009846446527634,35.46172293848521,4.890999999999683,1.0,53130.72,0.0,-131.14,95.82,0.3153611516952515,1400000
10
+ 0.0,0.0,-0.04665653577291752,0.04423798154541816,-0.04416073362437467,0.03267159865443028,35.69535679911387,4.761999999999715,1.0,58037.64,0.0,-125.58,93.24,0.3096184206008911,1450000
11
+ 0.0,0.0,-0.05968818574575715,0.0626929248159906,-0.056118084567758755,0.05441269530555327,35.81017219589457,5.020999999999721,1.0,63048.18,0.0,-139.68,98.42,0.32245368003845215,1500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.01486739938119046,-0.007423921492802676,-0.014823491189320857,-0.004815552470076898,35.111582112287905,8.710999999999752,1.0,4270.04,0.0,-241.04,172.22,0.5644462394714356,1050000
3
+ 0.0,0.0,-0.0303455207074162,0.005197132223327359,-0.03027222570636162,0.0004590901857191028,33.502480887522374,8.729999999999517,0.96,13552.14,-0.04,-244.94,172.6,0.5602327871322632,1100000
4
+ 0.0,0.0,-0.02543749708528784,0.008358332598337822,-0.025169425576195316,-0.0056659957702533716,35.50889108299261,6.9619999999995805,1.0,21340.52,0.0,-191.8,137.24,0.45554203510284424,1150000
5
+ 0.0,0.0,-0.03280233190957643,-0.002477716885651842,-0.032337943163637174,-0.001126092805777999,35.32180234667165,7.286999999999653,1.0,28504.8,0.0,-200.46,143.74,0.47033468723297117,1200000
6
+ 0.0,0.0,-0.028214466019529268,-0.0008682359294275169,-0.027581031359592733,-0.002664831360910472,35.45747368434129,6.282999999999532,0.98,35398.2,-0.02,-170.76,123.66,0.4080043601989746,1250000
7
+ 0.0,0.0,-0.023443167263652417,0.011831789767577892,-0.02237778653368213,0.007756937981092071,35.63972123040542,6.014999999999629,1.0,41930.4,0.0,-166.2,118.3,0.3918265438079834,1300000
8
+ 0.0,0.0,-0.03180874288769998,0.07202437446940343,-0.030197021088128984,0.02260723291022123,35.65422672294366,5.4779999999996685,1.0,47715.28,0.0,-147.26,107.56,0.3506324243545532,1350000
9
+ 0.0,0.0,-0.04375058829015286,0.03541982041985015,-0.041641109560134705,0.022009846446527634,35.46172293848521,4.890999999999683,1.0,53130.72,0.0,-131.14,95.82,0.3153611516952515,1400000
10
+ 0.0,0.0,-0.04665653577291752,0.04423798154541816,-0.04416073362437467,0.03267159865443028,35.69535679911387,4.761999999999715,1.0,58037.64,0.0,-125.58,93.24,0.3096184206008911,1450000
11
+ 0.0,0.0,-0.05968818574575715,0.0626929248159906,-0.056118084567758755,0.05441269530555327,35.81017219589457,5.020999999999721,1.0,63048.18,0.0,-139.68,98.42,0.32245368003845215,1500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 165.71036,0.17307585,0.0075569265,5.1738296,-55.142273,-165.87933,-203.9221,1.4671576,-1.540129,62.327446,1005000
3
+ 160.0284,0.16913897,0.006196486,5.2068734,-50.711933,-160.08621,-204.8742,2.0647225,-2.2819893,46.92933,1010000
4
+ 160.00772,0.18041171,0.007584412,5.6884966,-41.510357,-160.31819,-203.68896,2.2177658,-2.0569305,55.091763,1015000
5
+ 152.06429,0.18693909,0.008315922,8.042964,-32.561386,-152.95808,-203.45708,0.86879474,-1.0419067,61.943924,1020000
6
+ 151.30014,0.20755628,0.00644345,6.381181,-59.05737,-151.5826,-205.55083,0.87046176,-0.87307626,52.875042,1025000
7
+ 148.944,0.16427748,0.0085353935,7.0757785,-39.73715,-149.58139,-204.4799,1.2767617,-1.2689552,60.4748,1030000
8
+ 147.17282,0.19035524,0.008243441,5.828989,-47.62758,-147.81685,-203.36523,2.7970405,-2.4949458,68.10646,1035000
9
+ 148.21576,0.13817805,0.009179717,11.583496,-16.469782,-149.31267,-204.54143,2.1010914,-2.0794356,99.87376,1040000
10
+ 148.94691,0.17812805,0.010284772,8.646125,-55.549942,-149.07932,-204.09373,0.8609638,-0.84128785,63.157845,1045000
11
+ 149.54684,0.1980061,0.007849528,9.923751,-28.363472,-149.81775,-204.51097,0.89891547,-0.959749,63.80462,1050000
12
+ 143.65121,0.18182531,0.008812244,7.5049067,-32.717007,-144.37744,-205.51881,2.072872,-2.94072,71.23982,1055000
13
+ 139.551,0.17582634,0.008280634,9.614909,-5.505001,-140.46678,-205.0562,1.6609832,-2.410016,65.973526,1060000
14
+ 139.4577,0.17177549,0.0072339145,9.037575,-25.78911,-140.07825,-204.48523,0.61745006,-0.7223854,54.346672,1065000
15
+ 136.56793,0.19720663,0.00759297,11.307067,-22.275513,-136.85545,-205.2892,2.3687332,-2.45513,115.85127,1070000
16
+ 140.05908,0.1974659,0.009458769,7.0015464,-1.4904993,-140.29327,-205.33807,1.4471562,-1.2020954,75.385925,1075000
17
+ 138.51169,0.18049401,0.009441682,9.087483,-29.692816,-139.00275,-204.98868,1.2425953,-1.2501372,86.93852,1080000
18
+ 139.54257,0.18923058,0.0075250217,7.303032,-32.520348,-139.98158,-205.64459,1.6777635,-1.9048556,90.948235,1085000
19
+ 137.00858,0.16610764,0.0079428265,5.7546244,-16.090126,-137.60994,-205.59555,1.0912721,-1.1508859,62.09266,1090000
20
+ 134.14182,0.15920353,0.008814591,9.6023035,2.8507733,-134.94537,-204.98654,1.1577233,-1.0597589,71.95645,1095000
21
+ 130.96548,0.1884156,0.008026725,8.964839,6.135522,-131.55254,-205.08368,2.5706983,-1.5806845,124.62309,1100000
22
+ 136.28583,0.18757619,0.008329004,7.890812,-18.23137,-136.73521,-206.72925,1.0234339,-0.9141383,58.44951,1105000
23
+ 131.6095,0.16726455,0.009526978,6.5234833,-9.141151,-131.89262,-205.09105,1.0984849,-1.417765,65.41466,1110000
24
+ 127.85196,0.13797027,0.009532055,10.030955,0.5285305,-128.83955,-205.2291,1.2255989,-1.3275607,74.605255,1115000
25
+ 130.19453,0.1844208,0.007989071,5.3812423,-5.2507505,-130.5836,-204.16258,1.067622,-1.0858682,55.778625,1120000
26
+ 134.00534,0.20369962,0.008358074,8.020683,-6.9948506,-134.42136,-204.44603,1.4402368,-1.5731618,59.323326,1125000
27
+ 131.219,0.17214307,0.009955655,9.847293,-7.767254,-131.46045,-204.84212,1.2946599,-1.114071,70.09626,1130000
28
+ 132.01086,0.18917647,0.010240279,7.8633037,3.2814808,-133.52377,-205.49103,2.110766,-2.4397175,89.029434,1135000
29
+ 125.64913,0.19962075,0.008845084,5.900835,-2.835526,-126.711365,-204.09387,3.3325574,-3.2156377,88.41038,1140000
30
+ 129.191,0.17353192,0.008462937,7.848687,-3.7377398,-130.28177,-205.0785,1.376828,-1.4576687,67.69303,1145000
31
+ 132.07303,0.15825967,0.007865503,5.0124984,-5.5264845,-132.65929,-204.93501,2.1877663,-1.9534953,56.405983,1150000
32
+ 129.53526,0.18217763,0.00850342,7.4006076,-4.056307,-130.07823,-204.84909,1.0397879,-1.0755758,56.863342,1155000
33
+ 129.38098,0.19779287,0.007866315,6.346295,1.3230945,-129.88194,-204.88751,0.7190227,-0.6125448,53.87025,1160000
34
+ 128.70007,0.20729211,0.008190382,4.792479,-2.477955,-129.7777,-205.13089,1.2929449,-1.196859,59.63217,1165000
35
+ 129.75542,0.14899153,0.009740487,4.9541316,-7.5833826,-130.02539,-205.05359,1.0174975,-1.7720295,72.09686,1170000
36
+ 132.70763,0.17668974,0.00777185,5.216278,3.1477087,-132.90009,-206.0795,1.1624663,-1.1212296,55.667313,1175000
37
+ 130.60649,0.18903919,0.0069495677,4.322933,1.2432026,-130.83809,-204.49104,0.93349236,-1.3776332,47.916687,1180000
38
+ 126.16392,0.1815413,0.008465822,4.2117004,-1.7362936,-126.50576,-204.58919,1.5650655,-2.0762737,55.48748,1185000
39
+ 124.582016,0.14999068,0.0105680395,4.606962,3.2564583,-125.321,-205.70369,0.99927694,-1.4184502,70.52841,1190000
40
+ 127.65769,0.18156959,0.009004099,5.441826,-3.660462,-127.853294,-204.78204,1.2889132,-0.98092246,57.814613,1195000
41
+ 125.789734,0.15939301,0.00830114,4.630853,0.29366034,-126.81598,-205.46733,1.7876813,-2.106473,58.9141,1200000
42
+ 127.34004,0.14026494,0.0077390233,5.880654,-1.6497213,-127.90505,-203.81516,0.966439,-0.8981806,57.655933,1205000
43
+ 124.73788,0.1721107,0.007869112,4.9653497,-3.3806443,-125.20497,-204.89827,1.4602054,-1.9387814,56.77161,1210000
44
+ 127.77647,0.19506773,0.009942851,5.2495074,-4.9872475,-128.30412,-203.76491,1.5365211,-1.8136756,59.61758,1215000
45
+ 126.349686,0.2086468,0.0073945443,7.1904473,-6.437943,-126.96177,-204.19434,0.9904268,-1.0047256,71.118835,1220000
46
+ 121.72771,0.18207242,0.0077876267,7.5343094,3.4430814,-122.058426,-203.76614,1.5899658,-1.8316793,81.3901,1225000
47
+ 125.46732,0.19905858,0.009445356,7.647166,-4.0125604,-125.61812,-205.4222,0.870085,-1.0015781,59.98722,1230000
48
+ 122.06956,0.20348279,0.006889693,5.2245097,0.78821295,-121.96664,-204.70657,0.964592,-1.7838556,56.03837,1235000
49
+ 123.03483,0.18111536,0.005782583,6.235236,0.81554765,-123.57523,-205.02718,1.1655997,-1.0872425,59.06585,1240000
50
+ 126.92784,0.17333007,0.008884724,4.778095,-8.604665,-127.02264,-204.98332,1.3810421,-1.4076948,53.5533,1245000
51
+ 114.86347,0.16950178,0.008773966,6.8627334,-0.5348978,-115.50411,-204.71355,1.6234604,-2.0703955,66.46281,1250000
52
+ 123.12099,0.1902762,0.008645338,6.999124,-0.48804367,-123.7161,-203.61496,1.3061188,-1.2037396,63.294838,1255000
53
+ 121.67787,0.17371339,0.009301184,5.2103314,2.1496572,-122.6849,-206.99658,1.0462197,-1.1924579,52.696045,1260000
54
+ 121.299255,0.1579305,0.0087454,8.73548,0.37168258,-121.69551,-204.57347,1.0387769,-1.2694839,68.74339,1265000
55
+ 119.94853,0.16209325,0.007840997,7.6359468,0.4267254,-120.55569,-204.84778,3.735064,-3.288653,122.26133,1270000
56
+ 117.040436,0.21912858,0.00730139,8.156119,-5.2699447,-117.29641,-205.1521,1.0234823,-0.98142487,66.87633,1275000
57
+ 122.24303,0.1957971,0.009137187,5.08367,1.5228661,-123.15336,-204.54631,0.9133748,-0.86738443,53.54991,1280000
58
+ 117.73298,0.17111695,0.0076938574,4.811798,-6.8513556,-118.672874,-203.95834,1.0798751,-1.0420084,58.022377,1285000
59
+ 112.85035,0.17740062,0.007454747,5.171891,-1.3996239,-113.571526,-204.63763,1.5051556,-1.5599103,71.88539,1290000
60
+ 114.34713,0.20439604,0.007705548,13.248328,1.7339338,-115.15122,-206.27695,1.0586629,-1.1280568,101.41521,1295000
61
+ 118.72575,0.18224274,0.0060509103,6.345232,-5.231582,-119.29101,-203.88824,1.9939206,-2.2471957,73.557274,1300000
62
+ 121.58778,0.15938196,0.008036909,5.1388645,-1.1531781,-122.50061,-205.05084,2.343004,-2.4097533,67.942375,1305000
63
+ 116.64279,0.17319828,0.0081104105,8.216399,-3.7958214,-117.30242,-203.87462,1.5921979,-2.351327,104.36542,1310000
64
+ 119.1406,0.16488056,0.0073349588,6.599019,-0.73993105,-119.61611,-203.64093,1.3997117,-1.4642879,90.601364,1315000
65
+ 117.17459,0.14690605,0.007015856,7.2954774,5.060341,-118.51072,-204.3125,1.0468748,-0.9606438,61.730774,1320000
66
+ 120.083336,0.16388386,0.0075472733,4.6595387,1.7824181,-120.47166,-204.64122,0.6019351,-0.5736071,61.435787,1325000
67
+ 117.00885,0.18076748,0.008158969,4.93433,3.7352955,-117.29578,-203.50722,1.4863733,-1.266689,72.246086,1330000
68
+ 117.68429,0.20237139,0.009704951,5.254432,-2.546257,-118.06736,-204.74628,2.3805385,-2.0432107,64.07243,1335000
69
+ 119.296165,0.17429185,0.0074415193,4.098642,1.9077384,-119.32495,-204.57619,0.97143006,-0.84627557,49.241848,1340000
70
+ 122.16182,0.17073742,0.008347054,5.6910334,1.6567506,-123.139404,-205.32613,1.4383342,-2.1936002,74.27919,1345000
71
+ 111.043274,0.18183464,0.0068383585,5.2764125,7.968234,-111.89602,-205.71046,1.1966971,-1.2954459,49.534317,1350000
72
+ 119.737206,0.20218611,0.007554351,6.5934114,5.7562227,-120.245056,-204.35497,1.3731438,-1.3584522,80.55447,1355000
73
+ 115.44145,0.15986049,0.009418355,4.8212214,-2.615328,-115.51443,-204.87375,1.2402884,-1.1229734,74.8627,1360000
74
+ 115.50672,0.16858777,0.0070973826,7.306443,-1.9751806,-116.56753,-204.74307,1.6775205,-2.075348,71.042786,1365000
75
+ 116.934456,0.19096741,0.007869718,7.234544,3.056712,-117.646545,-205.2073,1.2262682,-1.2613565,68.53799,1370000
76
+ 110.32482,0.15222181,0.0076326537,6.131383,5.221502,-111.5837,-204.18591,2.208695,-2.3628075,52.82122,1375000
77
+ 111.39778,0.13073212,0.007974069,4.364493,0.79249424,-112.51542,-204.77744,0.7677316,-0.8570062,53.534046,1380000
78
+ 115.35373,0.15118955,0.0071975943,4.943206,5.205435,-116.41669,-205.37257,0.7955426,-1.5268672,43.440548,1385000
79
+ 117.454926,0.14592698,0.00762292,7.356302,-9.443297,-118.371635,-204.28793,4.0974035,-4.596805,115.330956,1390000
80
+ 113.76132,0.1662851,0.008180721,4.380405,-3.8463247,-114.71085,-203.16881,0.732404,-1.0797365,50.26922,1395000
81
+ 111.1558,0.14901909,0.007565817,4.4596825,1.1954253,-111.30349,-204.72939,2.4591177,-1.7167916,57.84591,1400000
82
+ 113.298645,0.1426121,0.006862541,4.4548907,2.4342208,-113.48474,-204.91718,0.9220734,-1.0424043,50.21064,1405000
83
+ 118.29645,0.17579442,0.007917837,5.5355697,-0.6277578,-118.65137,-203.60945,1.074315,-0.97051334,59.45766,1410000
84
+ 110.95303,0.17067304,0.009755396,5.37111,1.4643687,-111.69143,-203.69632,1.4797641,-1.2741693,78.828094,1415000
85
+ 114.28086,0.16725962,0.008976225,4.3760166,0.4084068,-114.66001,-203.44684,1.6433245,-1.9121938,59.37222,1420000
86
+ 111.10107,0.17037097,0.0076525914,5.0197663,4.599801,-111.801384,-204.34996,3.5720713,-3.1327846,87.45618,1425000
87
+ 108.71176,0.13735466,0.0069448003,7.505752,3.8907442,-109.02736,-204.65506,0.94682646,-1.0619509,64.051865,1430000
88
+ 114.66172,0.16067974,0.008943042,6.7486606,5.399002,-114.52355,-204.71648,1.5014017,-1.4781948,82.530045,1435000
89
+ 106.519295,0.17004308,0.0077346824,5.3144183,1.2255918,-107.72538,-204.86632,1.4667892,-1.4174924,55.770653,1440000
90
+ 114.64674,0.15955317,0.006824732,5.2632346,4.376355,-115.413284,-204.75493,1.1633816,-0.82694197,56.71602,1445000
91
+ 110.07178,0.15509135,0.0064432225,3.9543636,-3.758855,-110.69325,-204.2121,1.7983202,-1.3120855,47.241722,1450000
92
+ 109.93644,0.16248013,0.007826836,7.995216,-2.2948225,-110.65607,-205.30026,1.1658643,-0.9053957,76.72345,1455000
93
+ 107.97509,0.15665033,0.005951253,4.290899,0.963066,-109.15627,-204.2781,1.2266308,-1.419404,62.32586,1460000
94
+ 107.46649,0.1386271,0.007763624,3.5475693,1.1952665,-108.25059,-204.06812,1.235814,-2.0860457,55.360386,1465000
95
+ 106.43756,0.13774142,0.0075817774,4.279185,3.98627,-106.64141,-204.07765,1.6696097,-1.5089376,62.51242,1470000
96
+ 109.684975,0.14721316,0.006651299,3.1795788,-2.542635,-110.0427,-204.41142,2.0028455,-1.4814694,56.84195,1475000
97
+ 108.11439,0.15229039,0.009193145,5.730661,1.3553573,-108.457115,-203.70607,3.7182212,-3.1724248,124.91722,1480000
98
+ 108.50926,0.14276691,0.007290074,4.314696,0.39421666,-108.78074,-204.99638,0.90320605,-0.87408924,55.086716,1485000
99
+ 107.8694,0.16177867,0.00636993,6.275894,3.6713827,-108.74129,-204.57323,1.204977,-0.8980832,56.602783,1490000
100
+ 101.75121,0.1274986,0.0074778018,7.078491,-1.8577209,-102.07118,-204.53065,1.790219,-1.6914796,64.40872,1495000
101
+ 103.31247,0.17546469,0.007369807,4.7808146,4.828383,-104.11269,-203.98297,0.998746,-0.92574036,48.85293,1500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 165.71036,0.17307585,0.0075569265,5.1738296,-55.142273,-165.87933,-203.9221,1.4671576,-1.540129,62.327446,1005000
3
+ 160.0284,0.16913897,0.006196486,5.2068734,-50.711933,-160.08621,-204.8742,2.0647225,-2.2819893,46.92933,1010000
4
+ 160.00772,0.18041171,0.007584412,5.6884966,-41.510357,-160.31819,-203.68896,2.2177658,-2.0569305,55.091763,1015000
5
+ 152.06429,0.18693909,0.008315922,8.042964,-32.561386,-152.95808,-203.45708,0.86879474,-1.0419067,61.943924,1020000
6
+ 151.30014,0.20755628,0.00644345,6.381181,-59.05737,-151.5826,-205.55083,0.87046176,-0.87307626,52.875042,1025000
7
+ 148.944,0.16427748,0.0085353935,7.0757785,-39.73715,-149.58139,-204.4799,1.2767617,-1.2689552,60.4748,1030000
8
+ 147.17282,0.19035524,0.008243441,5.828989,-47.62758,-147.81685,-203.36523,2.7970405,-2.4949458,68.10646,1035000
9
+ 148.21576,0.13817805,0.009179717,11.583496,-16.469782,-149.31267,-204.54143,2.1010914,-2.0794356,99.87376,1040000
10
+ 148.94691,0.17812805,0.010284772,8.646125,-55.549942,-149.07932,-204.09373,0.8609638,-0.84128785,63.157845,1045000
11
+ 149.54684,0.1980061,0.007849528,9.923751,-28.363472,-149.81775,-204.51097,0.89891547,-0.959749,63.80462,1050000
12
+ 143.65121,0.18182531,0.008812244,7.5049067,-32.717007,-144.37744,-205.51881,2.072872,-2.94072,71.23982,1055000
13
+ 139.551,0.17582634,0.008280634,9.614909,-5.505001,-140.46678,-205.0562,1.6609832,-2.410016,65.973526,1060000
14
+ 139.4577,0.17177549,0.0072339145,9.037575,-25.78911,-140.07825,-204.48523,0.61745006,-0.7223854,54.346672,1065000
15
+ 136.56793,0.19720663,0.00759297,11.307067,-22.275513,-136.85545,-205.2892,2.3687332,-2.45513,115.85127,1070000
16
+ 140.05908,0.1974659,0.009458769,7.0015464,-1.4904993,-140.29327,-205.33807,1.4471562,-1.2020954,75.385925,1075000
17
+ 138.51169,0.18049401,0.009441682,9.087483,-29.692816,-139.00275,-204.98868,1.2425953,-1.2501372,86.93852,1080000
18
+ 139.54257,0.18923058,0.0075250217,7.303032,-32.520348,-139.98158,-205.64459,1.6777635,-1.9048556,90.948235,1085000
19
+ 137.00858,0.16610764,0.0079428265,5.7546244,-16.090126,-137.60994,-205.59555,1.0912721,-1.1508859,62.09266,1090000
20
+ 134.14182,0.15920353,0.008814591,9.6023035,2.8507733,-134.94537,-204.98654,1.1577233,-1.0597589,71.95645,1095000
21
+ 130.96548,0.1884156,0.008026725,8.964839,6.135522,-131.55254,-205.08368,2.5706983,-1.5806845,124.62309,1100000
22
+ 136.28583,0.18757619,0.008329004,7.890812,-18.23137,-136.73521,-206.72925,1.0234339,-0.9141383,58.44951,1105000
23
+ 131.6095,0.16726455,0.009526978,6.5234833,-9.141151,-131.89262,-205.09105,1.0984849,-1.417765,65.41466,1110000
24
+ 127.85196,0.13797027,0.009532055,10.030955,0.5285305,-128.83955,-205.2291,1.2255989,-1.3275607,74.605255,1115000
25
+ 130.19453,0.1844208,0.007989071,5.3812423,-5.2507505,-130.5836,-204.16258,1.067622,-1.0858682,55.778625,1120000
26
+ 134.00534,0.20369962,0.008358074,8.020683,-6.9948506,-134.42136,-204.44603,1.4402368,-1.5731618,59.323326,1125000
27
+ 131.219,0.17214307,0.009955655,9.847293,-7.767254,-131.46045,-204.84212,1.2946599,-1.114071,70.09626,1130000
28
+ 132.01086,0.18917647,0.010240279,7.8633037,3.2814808,-133.52377,-205.49103,2.110766,-2.4397175,89.029434,1135000
29
+ 125.64913,0.19962075,0.008845084,5.900835,-2.835526,-126.711365,-204.09387,3.3325574,-3.2156377,88.41038,1140000
30
+ 129.191,0.17353192,0.008462937,7.848687,-3.7377398,-130.28177,-205.0785,1.376828,-1.4576687,67.69303,1145000
31
+ 132.07303,0.15825967,0.007865503,5.0124984,-5.5264845,-132.65929,-204.93501,2.1877663,-1.9534953,56.405983,1150000
32
+ 129.53526,0.18217763,0.00850342,7.4006076,-4.056307,-130.07823,-204.84909,1.0397879,-1.0755758,56.863342,1155000
33
+ 129.38098,0.19779287,0.007866315,6.346295,1.3230945,-129.88194,-204.88751,0.7190227,-0.6125448,53.87025,1160000
34
+ 128.70007,0.20729211,0.008190382,4.792479,-2.477955,-129.7777,-205.13089,1.2929449,-1.196859,59.63217,1165000
35
+ 129.75542,0.14899153,0.009740487,4.9541316,-7.5833826,-130.02539,-205.05359,1.0174975,-1.7720295,72.09686,1170000
36
+ 132.70763,0.17668974,0.00777185,5.216278,3.1477087,-132.90009,-206.0795,1.1624663,-1.1212296,55.667313,1175000
37
+ 130.60649,0.18903919,0.0069495677,4.322933,1.2432026,-130.83809,-204.49104,0.93349236,-1.3776332,47.916687,1180000
38
+ 126.16392,0.1815413,0.008465822,4.2117004,-1.7362936,-126.50576,-204.58919,1.5650655,-2.0762737,55.48748,1185000
39
+ 124.582016,0.14999068,0.0105680395,4.606962,3.2564583,-125.321,-205.70369,0.99927694,-1.4184502,70.52841,1190000
40
+ 127.65769,0.18156959,0.009004099,5.441826,-3.660462,-127.853294,-204.78204,1.2889132,-0.98092246,57.814613,1195000
41
+ 125.789734,0.15939301,0.00830114,4.630853,0.29366034,-126.81598,-205.46733,1.7876813,-2.106473,58.9141,1200000
42
+ 127.34004,0.14026494,0.0077390233,5.880654,-1.6497213,-127.90505,-203.81516,0.966439,-0.8981806,57.655933,1205000
43
+ 124.73788,0.1721107,0.007869112,4.9653497,-3.3806443,-125.20497,-204.89827,1.4602054,-1.9387814,56.77161,1210000
44
+ 127.77647,0.19506773,0.009942851,5.2495074,-4.9872475,-128.30412,-203.76491,1.5365211,-1.8136756,59.61758,1215000
45
+ 126.349686,0.2086468,0.0073945443,7.1904473,-6.437943,-126.96177,-204.19434,0.9904268,-1.0047256,71.118835,1220000
46
+ 121.72771,0.18207242,0.0077876267,7.5343094,3.4430814,-122.058426,-203.76614,1.5899658,-1.8316793,81.3901,1225000
47
+ 125.46732,0.19905858,0.009445356,7.647166,-4.0125604,-125.61812,-205.4222,0.870085,-1.0015781,59.98722,1230000
48
+ 122.06956,0.20348279,0.006889693,5.2245097,0.78821295,-121.96664,-204.70657,0.964592,-1.7838556,56.03837,1235000
49
+ 123.03483,0.18111536,0.005782583,6.235236,0.81554765,-123.57523,-205.02718,1.1655997,-1.0872425,59.06585,1240000
50
+ 126.92784,0.17333007,0.008884724,4.778095,-8.604665,-127.02264,-204.98332,1.3810421,-1.4076948,53.5533,1245000
51
+ 114.86347,0.16950178,0.008773966,6.8627334,-0.5348978,-115.50411,-204.71355,1.6234604,-2.0703955,66.46281,1250000
52
+ 123.12099,0.1902762,0.008645338,6.999124,-0.48804367,-123.7161,-203.61496,1.3061188,-1.2037396,63.294838,1255000
53
+ 121.67787,0.17371339,0.009301184,5.2103314,2.1496572,-122.6849,-206.99658,1.0462197,-1.1924579,52.696045,1260000
54
+ 121.299255,0.1579305,0.0087454,8.73548,0.37168258,-121.69551,-204.57347,1.0387769,-1.2694839,68.74339,1265000
55
+ 119.94853,0.16209325,0.007840997,7.6359468,0.4267254,-120.55569,-204.84778,3.735064,-3.288653,122.26133,1270000
56
+ 117.040436,0.21912858,0.00730139,8.156119,-5.2699447,-117.29641,-205.1521,1.0234823,-0.98142487,66.87633,1275000
57
+ 122.24303,0.1957971,0.009137187,5.08367,1.5228661,-123.15336,-204.54631,0.9133748,-0.86738443,53.54991,1280000
58
+ 117.73298,0.17111695,0.0076938574,4.811798,-6.8513556,-118.672874,-203.95834,1.0798751,-1.0420084,58.022377,1285000
59
+ 112.85035,0.17740062,0.007454747,5.171891,-1.3996239,-113.571526,-204.63763,1.5051556,-1.5599103,71.88539,1290000
60
+ 114.34713,0.20439604,0.007705548,13.248328,1.7339338,-115.15122,-206.27695,1.0586629,-1.1280568,101.41521,1295000
61
+ 118.72575,0.18224274,0.0060509103,6.345232,-5.231582,-119.29101,-203.88824,1.9939206,-2.2471957,73.557274,1300000
62
+ 121.58778,0.15938196,0.008036909,5.1388645,-1.1531781,-122.50061,-205.05084,2.343004,-2.4097533,67.942375,1305000
63
+ 116.64279,0.17319828,0.0081104105,8.216399,-3.7958214,-117.30242,-203.87462,1.5921979,-2.351327,104.36542,1310000
64
+ 119.1406,0.16488056,0.0073349588,6.599019,-0.73993105,-119.61611,-203.64093,1.3997117,-1.4642879,90.601364,1315000
65
+ 117.17459,0.14690605,0.007015856,7.2954774,5.060341,-118.51072,-204.3125,1.0468748,-0.9606438,61.730774,1320000
66
+ 120.083336,0.16388386,0.0075472733,4.6595387,1.7824181,-120.47166,-204.64122,0.6019351,-0.5736071,61.435787,1325000
67
+ 117.00885,0.18076748,0.008158969,4.93433,3.7352955,-117.29578,-203.50722,1.4863733,-1.266689,72.246086,1330000
68
+ 117.68429,0.20237139,0.009704951,5.254432,-2.546257,-118.06736,-204.74628,2.3805385,-2.0432107,64.07243,1335000
69
+ 119.296165,0.17429185,0.0074415193,4.098642,1.9077384,-119.32495,-204.57619,0.97143006,-0.84627557,49.241848,1340000
70
+ 122.16182,0.17073742,0.008347054,5.6910334,1.6567506,-123.139404,-205.32613,1.4383342,-2.1936002,74.27919,1345000
71
+ 111.043274,0.18183464,0.0068383585,5.2764125,7.968234,-111.89602,-205.71046,1.1966971,-1.2954459,49.534317,1350000
72
+ 119.737206,0.20218611,0.007554351,6.5934114,5.7562227,-120.245056,-204.35497,1.3731438,-1.3584522,80.55447,1355000
73
+ 115.44145,0.15986049,0.009418355,4.8212214,-2.615328,-115.51443,-204.87375,1.2402884,-1.1229734,74.8627,1360000
74
+ 115.50672,0.16858777,0.0070973826,7.306443,-1.9751806,-116.56753,-204.74307,1.6775205,-2.075348,71.042786,1365000
75
+ 116.934456,0.19096741,0.007869718,7.234544,3.056712,-117.646545,-205.2073,1.2262682,-1.2613565,68.53799,1370000
76
+ 110.32482,0.15222181,0.0076326537,6.131383,5.221502,-111.5837,-204.18591,2.208695,-2.3628075,52.82122,1375000
77
+ 111.39778,0.13073212,0.007974069,4.364493,0.79249424,-112.51542,-204.77744,0.7677316,-0.8570062,53.534046,1380000
78
+ 115.35373,0.15118955,0.0071975943,4.943206,5.205435,-116.41669,-205.37257,0.7955426,-1.5268672,43.440548,1385000
79
+ 117.454926,0.14592698,0.00762292,7.356302,-9.443297,-118.371635,-204.28793,4.0974035,-4.596805,115.330956,1390000
80
+ 113.76132,0.1662851,0.008180721,4.380405,-3.8463247,-114.71085,-203.16881,0.732404,-1.0797365,50.26922,1395000
81
+ 111.1558,0.14901909,0.007565817,4.4596825,1.1954253,-111.30349,-204.72939,2.4591177,-1.7167916,57.84591,1400000
82
+ 113.298645,0.1426121,0.006862541,4.4548907,2.4342208,-113.48474,-204.91718,0.9220734,-1.0424043,50.21064,1405000
83
+ 118.29645,0.17579442,0.007917837,5.5355697,-0.6277578,-118.65137,-203.60945,1.074315,-0.97051334,59.45766,1410000
84
+ 110.95303,0.17067304,0.009755396,5.37111,1.4643687,-111.69143,-203.69632,1.4797641,-1.2741693,78.828094,1415000
85
+ 114.28086,0.16725962,0.008976225,4.3760166,0.4084068,-114.66001,-203.44684,1.6433245,-1.9121938,59.37222,1420000
86
+ 111.10107,0.17037097,0.0076525914,5.0197663,4.599801,-111.801384,-204.34996,3.5720713,-3.1327846,87.45618,1425000
87
+ 108.71176,0.13735466,0.0069448003,7.505752,3.8907442,-109.02736,-204.65506,0.94682646,-1.0619509,64.051865,1430000
88
+ 114.66172,0.16067974,0.008943042,6.7486606,5.399002,-114.52355,-204.71648,1.5014017,-1.4781948,82.530045,1435000
89
+ 106.519295,0.17004308,0.0077346824,5.3144183,1.2255918,-107.72538,-204.86632,1.4667892,-1.4174924,55.770653,1440000
90
+ 114.64674,0.15955317,0.006824732,5.2632346,4.376355,-115.413284,-204.75493,1.1633816,-0.82694197,56.71602,1445000
91
+ 110.07178,0.15509135,0.0064432225,3.9543636,-3.758855,-110.69325,-204.2121,1.7983202,-1.3120855,47.241722,1450000
92
+ 109.93644,0.16248013,0.007826836,7.995216,-2.2948225,-110.65607,-205.30026,1.1658643,-0.9053957,76.72345,1455000
93
+ 107.97509,0.15665033,0.005951253,4.290899,0.963066,-109.15627,-204.2781,1.2266308,-1.419404,62.32586,1460000
94
+ 107.46649,0.1386271,0.007763624,3.5475693,1.1952665,-108.25059,-204.06812,1.235814,-2.0860457,55.360386,1465000
95
+ 106.43756,0.13774142,0.0075817774,4.279185,3.98627,-106.64141,-204.07765,1.6696097,-1.5089376,62.51242,1470000
96
+ 109.684975,0.14721316,0.006651299,3.1795788,-2.542635,-110.0427,-204.41142,2.0028455,-1.4814694,56.84195,1475000
97
+ 108.11439,0.15229039,0.009193145,5.730661,1.3553573,-108.457115,-203.70607,3.7182212,-3.1724248,124.91722,1480000
98
+ 108.50926,0.14276691,0.007290074,4.314696,0.39421666,-108.78074,-204.99638,0.90320605,-0.87408924,55.086716,1485000
99
+ 107.8694,0.16177867,0.00636993,6.275894,3.6713827,-108.74129,-204.57323,1.204977,-0.8980832,56.602783,1490000
100
+ 101.75121,0.1274986,0.0074778018,7.078491,-1.8577209,-102.07118,-204.53065,1.790219,-1.6914796,64.40872,1495000
101
+ 103.31247,0.17546469,0.007369807,4.7808146,4.828383,-104.11269,-203.98297,0.998746,-0.92574036,48.85293,1500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1050000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d78cf3b2790168bd3bd45e68adeabd1ba846b0c8c81c563d2abefbf33d0fe84
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1100000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e219c701761b16c52e1563b7cb998a4e82b38be52395a394826abf6b4b89522
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4a30d6737a5b83e87d822aea3b77d75f3a2d6774033ba11d8ecd9ed6de56272
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71309235484c51a73ee1220763439b802380c31edbe2e6fa09917cb55cbcc007
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a34cb84e50b06b67d3d9f752e3601e508e4910710417cd9c0b97cd3e2ca1ae4
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1948762199439846165e663c661bb46e4ec28dac403be224e090d7fbdc41ec2
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dda28a584952649ac7541d8e937c531721f569d73178acfab06511c46bf417f2
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6e0e4f3a92336b64f40ecec58a5db2890e2085008fee1dbce7fbcb539b36d2f
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b438559a8d5a44fdc5606f2d471728067a94e678e40bc59eceacb42788cd175c
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/params_1500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25425d346c2d3be3ba7e6720f69cbd02605373a3e9187085ef4e65d26019334f
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260320_015949/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/kexdkkjq