Tiredsheep commited on
Commit
db275fd
·
verified ·
1 Parent(s): c5bb361

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_450000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_500000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_550000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_600000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_650000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_700000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_750000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_800000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_850000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_900000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.016475632075344148,0.002977121451604871,-0.016068768076845857,0.0002503927452825565,26.49808021494976,17.856999999998894,0.62,8928.76,-0.54,-560.06,355.14,1.0677370595932008,450000
3
+ 0.0,0.0,-0.023436599671771873,-0.002896199756283034,-0.022438446989312383,-0.005978597637347527,32.0903967601278,11.487999999999635,0.9,24756.48,-0.16,-348.56,227.76,0.7277789735794067,500000
4
+ 0.0,0.0,-0.04954256082778114,-0.00683176120900682,-0.047206124197445,0.01268190636604556,32.00142155637023,8.168999999999583,0.96,34458.02,-0.04,-245.34,161.38,0.5269394111633301,550000
5
+ 0.0,0.0,-0.042391380312044806,-0.0029621376282687275,-0.0401577569122364,0.001217209249413888,31.663929340510553,8.019999999999651,0.94,42611.16,-0.12,-255.38,158.4,0.5309604454040527,600000
6
+ 0.0,0.0,-0.042615019338182326,0.03408630843388969,-0.03997643376619276,0.013986440228204219,33.38039969138992,6.5219999999995215,0.96,50446.44,-0.06,-196.72,128.44,0.41683093547821043,650000
7
+ 0.0,0.0,-0.06128477557124821,0.044756028610810704,-0.056908491667224635,0.03584117116064402,34.997561310829454,5.834999999999622,0.96,56726.84,-0.06,-175.96,114.7,0.3670168161392212,700000
8
+ 0.0,0.0,-0.07184680492360658,0.03654070975743058,-0.06710455460926545,0.043228496657201104,35.30548512129382,5.414999999999723,1.0,62121.86,0.0,-158.8,106.3,0.34156057357788083,750000
9
+ 0.0,0.0,-0.07593666889676003,0.038917340853141816,-0.07106629392598088,0.04761771662622835,35.59710145785285,4.70399999999977,1.0,67211.14,0.0,-136.82,92.08,0.3112912607192993,800000
10
+ 0.0,0.0,-0.07847148225668013,0.04081899909629042,-0.0734218909830678,0.049104724760047666,35.71688861415067,4.296999999999803,1.0,71662.16,0.0,-124.76,83.94,0.2881143093109131,850000
11
+ 0.0,0.0,-0.07401733621020903,0.03569054651069593,-0.06885815368644488,0.07216982071203644,34.70416586319812,5.268999999999708,0.98,76591.9,-0.04,-152.08,103.38,0.33206178188323976,900000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.016475632075344148,0.002977121451604871,-0.016068768076845857,0.0002503927452825565,26.49808021494976,17.856999999998894,0.62,8928.76,-0.54,-560.06,355.14,1.0677370595932008,450000
3
+ 0.0,0.0,-0.023436599671771873,-0.002896199756283034,-0.022438446989312383,-0.005978597637347527,32.0903967601278,11.487999999999635,0.9,24756.48,-0.16,-348.56,227.76,0.7277789735794067,500000
4
+ 0.0,0.0,-0.04954256082778114,-0.00683176120900682,-0.047206124197445,0.01268190636604556,32.00142155637023,8.168999999999583,0.96,34458.02,-0.04,-245.34,161.38,0.5269394111633301,550000
5
+ 0.0,0.0,-0.042391380312044806,-0.0029621376282687275,-0.0401577569122364,0.001217209249413888,31.663929340510553,8.019999999999651,0.94,42611.16,-0.12,-255.38,158.4,0.5309604454040527,600000
6
+ 0.0,0.0,-0.042615019338182326,0.03408630843388969,-0.03997643376619276,0.013986440228204219,33.38039969138992,6.5219999999995215,0.96,50446.44,-0.06,-196.72,128.44,0.41683093547821043,650000
7
+ 0.0,0.0,-0.06128477557124821,0.044756028610810704,-0.056908491667224635,0.03584117116064402,34.997561310829454,5.834999999999622,0.96,56726.84,-0.06,-175.96,114.7,0.3670168161392212,700000
8
+ 0.0,0.0,-0.07184680492360658,0.03654070975743058,-0.06710455460926545,0.043228496657201104,35.30548512129382,5.414999999999723,1.0,62121.86,0.0,-158.8,106.3,0.34156057357788083,750000
9
+ 0.0,0.0,-0.07593666889676003,0.038917340853141816,-0.07106629392598088,0.04761771662622835,35.59710145785285,4.70399999999977,1.0,67211.14,0.0,-136.82,92.08,0.3112912607192993,800000
10
+ 0.0,0.0,-0.07847148225668013,0.04081899909629042,-0.0734218909830678,0.049104724760047666,35.71688861415067,4.296999999999803,1.0,71662.16,0.0,-124.76,83.94,0.2881143093109131,850000
11
+ 0.0,0.0,-0.07401733621020903,0.03569054651069593,-0.06885815368644488,0.07216982071203644,34.70416586319812,5.268999999999708,0.98,76591.9,-0.04,-152.08,103.38,0.33206178188323976,900000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
2
+ 0.643265,152.65453,0.0075980597,-0.005156799,-13.1786995,0.19453254,-152.55438,152.8439,1.6845665,6.2422547,-69.90439,-155.14688,-195.06387,7.926821,7.221267,-7.138418,127.3331,405000
3
+ 0.6443439,148.96472,0.007623238,-0.0039529493,-13.018539,0.195763,-148.86548,149.15654,1.1565669,6.592435,-55.016033,-151.66153,-193.22118,7.7490015,4.849304,-4.620331,103.49316,410000
4
+ 0.64733785,150.39694,0.007689698,0.0037162567,-12.016723,0.20818043,-150.30453,150.60884,1.3898687,3.6582024,-40.803207,-153.1081,-192.90053,5.048071,0.7240639,-0.83049333,53.08139,415000
5
+ 0.63025695,150.69656,0.007644919,-0.018109744,-14.86886,0.17575951,-150.58289,150.85422,3.5650995,6.2941794,-35.494335,-153.81473,-198.78122,9.859279,4.721145,-4.6399603,96.43646,420000
6
+ 0.6394948,148.69543,0.007879713,-0.010390713,-13.818666,0.19849652,-148.58656,148.88354,1.6594177,4.203403,-60.683037,-150.82204,-199.19528,5.8628206,0.4290268,-0.8757771,55.75992,425000
7
+ 0.64110625,146.80826,0.008117279,-0.0098519055,-13.713696,0.19555739,-146.69695,146.99396,2.7539022,5.460565,-67.055626,-149.05803,-197.10396,8.214467,1.2576982,-1.4600021,82.27845,430000
8
+ 0.6453779,147.9339,0.0083820885,0.0029202646,-12.151607,0.16857024,-147.83203,148.10538,1.9877169,5.955225,-53.18908,-150.20258,-197.16711,7.9429417,3.9273055,-3.6610806,97.29001,435000
9
+ 0.63677776,146.01132,0.008372984,-0.011563878,-13.881094,0.21518959,-145.8951,146.21495,1.8477007,7.36026,-62.01387,-149.57384,-196.66193,9.207961,2.836074,-3.1542444,99.97038,440000
10
+ 0.64508986,146.5398,0.008659959,0.004350907,-11.997583,0.17904796,-146.4359,146.72319,2.079761,4.893556,-76.04396,-148.96953,-198.40472,6.973317,0.7199221,-0.6550503,62.1195,445000
11
+ 0.6458272,146.02335,0.008711074,-0.005442377,-13.124765,0.17512862,-145.90903,146.19302,2.6926954,7.7760406,-49.00423,-148.6982,-195.84305,10.468736,1.7271746,-1.8109988,100.45282,450000
12
+ 0.63606185,141.1145,0.008721768,-0.016547816,-14.397301,0.19846252,-140.98892,141.29642,4.1386375,9.751056,-30.95133,-144.47643,-197.00487,13.889693,5.2832966,-5.7666063,134.73117,455000
13
+ 0.6304907,140.45709,0.008636576,-0.007640728,-13.384694,0.20934844,-140.3415,140.6588,2.560434,6.54695,-15.041662,-144.06982,-200.3571,9.107384,2.4911425,-2.2260344,90.06359,460000
14
+ 0.6461242,142.59235,0.009241166,-0.00742111,-13.303049,0.16549623,-142.46942,142.75043,2.8859153,6.678305,-37.393517,-145.73119,-199.4401,9.56422,3.588069,-3.8886454,131.529,465000
15
+ 0.63835174,137.17221,0.009153864,-0.00927492,-13.513225,0.19685173,-137.04852,137.35979,2.3040679,6.64704,-12.077508,-139.83035,-201.11758,8.951108,0.662961,-0.6118509,80.3447,470000
16
+ 0.636791,140.49677,0.008969372,0.0013449576,-12.35005,0.18450841,-140.386,140.68262,2.2069557,7.85164,-49.18793,-143.24821,-199.64223,10.058596,7.993062,-8.185585,155.33798,475000
17
+ 0.6409978,141.1199,0.009169036,-0.007687983,-13.338472,0.1909186,-140.99762,141.30313,3.6679192,8.048097,-24.145462,-144.12032,-197.68916,11.716016,2.9970076,-2.6262205,119.554115,480000
18
+ 0.6424893,137.79854,0.009290451,-0.00013378698,-12.5144005,0.14880964,-137.68228,137.9472,22.000315,11.174199,-15.819845,-140.59036,-199.06825,33.174515,3.3323183,-3.6682336,209.87292,485000
19
+ 0.6407904,139.0167,0.009304904,-0.0037474616,-12.9027405,0.1729816,-138.89664,139.18593,3.6505897,8.854815,-35.79149,-141.69661,-197.85912,12.505404,1.4219191,-1.1101617,115.42937,490000
20
+ 0.6489133,137.70428,0.009278906,0.011863679,-11.221436,0.16880465,-137.60016,137.88495,3.728275,6.526652,-40.970444,-139.835,-202.96701,10.254927,3.4157968,-3.0090754,113.16118,495000
21
+ 0.6348133,132.5325,0.009405187,-0.0060831946,-13.146791,0.17262039,-132.40887,132.69904,3.4102776,12.449433,-29.500406,-135.86003,-201.89275,15.859711,7.025614,-5.037615,165.11766,500000
22
+ 0.64744717,137.10468,0.009569492,0.010549205,-11.397621,0.20057473,-136.9956,137.3158,4.431602,8.602759,-14.177907,-140.24667,-204.22095,13.034361,3.6961584,-3.5097754,128.03806,505000
23
+ 0.63906175,133.45816,0.009788549,-0.007136525,-13.229069,0.21215679,-133.32866,133.66318,2.7197397,8.863651,-30.563284,-136.45238,-197.2954,11.583391,1.9749013,-1.8228719,112.54745,510000
24
+ 0.6284626,132.69055,0.009541794,-0.0037744364,-12.895569,0.16725533,-132.56749,132.85403,3.1126735,8.000861,0.85641015,-136.09488,-200.97098,11.113535,1.759632,-2.502218,139.16891,515000
25
+ 0.64500695,137.42258,0.00939177,-0.0070233345,-13.247818,0.16561514,-137.29816,137.58118,4.5604343,8.342742,-24.545494,-140.16081,-204.63425,12.903176,3.698126,-3.30907,130.29153,520000
26
+ 0.63528293,138.83827,0.009205186,-0.01626431,-14.266864,0.18647166,-138.70694,139.00848,6.4796076,9.556769,-17.410664,-141.93828,-198.71825,16.036377,2.0732527,-3.413546,191.44763,525000
27
+ 0.6441838,135.42743,0.00935569,0.011751502,-11.243919,0.179466,-135.32224,135.61864,3.7248764,11.231298,-35.06821,-139.19394,-197.76611,14.956175,1.125839,-1.181033,139.25243,530000
28
+ 0.6373442,135.46848,0.009383752,-0.005081249,-13.041494,0.2124522,-135.3461,135.67584,3.1229825,12.464222,2.3601658,-139.29008,-203.50812,15.587204,2.958001,-3.3280227,138.847,535000
29
+ 0.64509916,132.30405,0.009146708,0.0065777553,-11.780861,0.1513429,-132.19629,132.46196,3.3612955,12.199487,-21.834372,-135.75586,-201.94147,15.560782,4.513779,-5.4859815,161.33307,540000
30
+ 0.650798,132.16324,0.009553216,0.0072578774,-11.740269,0.18534383,-132.05109,132.35585,4.345029,11.460006,-9.838492,-134.74666,-202.94554,15.805035,6.2655725,-7.225169,179.4553,545000
31
+ 0.6387239,135.15762,0.009442728,-0.01627431,-14.223475,0.15254796,-135.02332,135.29388,3.4887524,11.294269,-18.863207,-136.90288,-200.91827,14.783021,2.2291398,-2.073104,166.8576,550000
32
+ 0.6460562,130.77686,0.009549049,0.0067690155,-11.791132,0.19001442,-130.66426,130.97365,6.5474167,12.459838,-6.917731,-133.65706,-195.06636,19.007256,2.5336194,-1.9291397,229.8836,555000
33
+ 0.648825,132.69962,0.009525128,0.015966173,-10.823784,0.16909772,-132.59653,132.88467,3.3722382,7.942862,-8.805404,-135.6614,-202.06053,11.3151,5.252202,-4.5160875,134.98666,560000
34
+ 0.63904476,133.41344,0.009537217,-0.0070215845,-13.23623,0.18797976,-133.2872,133.59439,2.488747,9.43185,-1.1263504,-136.4121,-203.5711,11.920597,6.5413623,-7.189885,145.79277,565000
35
+ 0.6539054,130.65945,0.009561684,0.02993047,-9.369749,0.17164996,-130.56987,130.86104,2.2678115,8.377403,-11.197053,-132.75105,-201.72568,10.645215,2.656642,-2.6378708,117.990875,570000
36
+ 0.6417743,133.6405,0.009319901,-0.0016464231,-12.676657,0.1904467,-133.52235,133.8293,3.7009828,11.98055,-16.672588,-136.88046,-202.71912,15.681533,7.3082747,-6.823574,199.46136,575000
37
+ 0.6474547,133.28178,0.009433002,0.0065887873,-11.8015175,0.15672144,-133.17047,133.4451,6.8757987,10.12779,2.168981,-135.93913,-203.05162,17.00359,8.111816,-6.1184196,325.20587,580000
38
+ 0.6362356,129.07503,0.00953307,-0.01410663,-13.979757,0.17374966,-128.94176,129.23468,4.0266347,21.329227,-2.899532,-132.77055,-198.16188,25.355862,7.3632646,-6.621008,191.59583,585000
39
+ 0.64266616,128.15894,0.009391232,-0.005018486,-13.03438,0.16655923,-128.03653,128.32048,2.7065365,9.222795,-11.34628,-131.02423,-205.41644,11.929331,2.8027027,-2.7968805,119.150246,590000
40
+ 0.6349283,130.84866,0.00927468,-0.0073326314,-13.290607,0.16503978,-130.7254,131.00636,3.491169,10.64731,-17.303635,-133.57108,-202.47365,14.138479,4.7184877,-5.0372243,144.67726,595000
41
+ 0.63584894,128.43484,0.009623543,-0.002680667,-12.778553,0.1638084,-128.31187,128.59596,6.234959,15.365386,-7.9687476,-132.39389,-200.77492,21.600346,2.8783817,-3.211027,194.56989,600000
42
+ 0.63393444,128.14713,0.009500139,-0.0056832717,-13.09823,0.16553152,-128.0227,128.30698,3.0246034,10.972584,-15.471093,-131.29556,-198.21265,13.997187,2.2656443,-2.9817133,128.55583,605000
43
+ 0.6371266,128.60109,0.009423305,0.0001453699,-12.484573,0.16543177,-128.48344,128.76668,2.694495,7.942016,-13.372177,-130.92525,-203.92157,10.636511,4.7059646,-2.7336006,163.26659,610000
44
+ 0.63748056,131.12636,0.009095032,-0.011593759,-13.774735,0.16338561,-131.0011,131.27815,3.3655014,11.176664,-13.467462,-133.55475,-201.98048,14.542166,6.525617,-4.7287097,159.42883,615000
45
+ 0.63954675,126.92883,0.009158885,-0.012469034,-13.861414,0.1675699,-126.80188,127.08394,3.5732179,11.863883,-6.740142,-130.08035,-197.03038,15.437101,1.2872832,-0.95074147,138.11382,620000
46
+ 0.633351,121.55235,0.009612724,0.011473011,-11.306477,0.16228493,-121.44367,121.72611,3.5356958,9.095477,-2.1091099,-124.54231,-202.15108,12.631173,3.021589,-2.7533305,113.058624,625000
47
+ 0.64548504,129.50552,0.009381985,0.011635914,-11.25976,0.1605006,-129.39987,129.67767,3.4521043,8.605102,-6.2098813,-132.73816,-202.84927,12.057206,2.121385,-2.27052,121.49571,630000
48
+ 0.6450627,124.29553,0.009672853,0.011927512,-11.266909,0.15590137,-124.18655,124.463356,3.6854446,8.587611,-2.6847208,-127.15493,-195.93513,12.273056,3.14279,-2.636501,117.09846,635000
49
+ 0.64918554,124.7937,0.00923872,-2.9991725e-05,-12.503246,0.16436242,-124.678185,124.95803,10.66199,14.948421,1.9969046,-128.32463,-200.02194,25.61041,3.2680602,-3.4829195,242.4981,640000
50
+ 0.6386839,125.597275,0.009541889,-0.0072116163,-13.255785,0.16297925,-125.47079,125.753044,4.1934776,10.757285,-3.7805688,-128.48434,-199.75212,14.950763,2.9411237,-2.7413871,160.30177,645000
51
+ 0.63721436,117.85981,0.009270427,0.0079568,-11.641701,0.17458336,-117.751884,118.04235,4.617673,14.593101,-7.1603174,-121.37764,-199.27422,19.210773,3.3791864,-4.535394,196.26782,650000
52
+ 0.6494256,127.7482,0.009223907,-0.005337682,-13.078679,0.19925213,-127.62756,127.94211,3.2569776,8.749644,0.2056885,-130.63356,-199.90045,12.006622,2.6632104,-2.655586,128.81789,655000
53
+ 0.6335176,124.98389,0.009340846,-0.004289966,-12.95927,0.19523033,-124.86284,125.17483,3.9020562,9.751259,3.8140016,-129.21977,-203.04486,13.653315,2.769002,-1.9850646,134.84763,660000
54
+ 0.64474857,126.51434,0.0092457235,-0.004354125,-12.970934,0.17572448,-126.3944,126.685715,3.6014366,8.822232,-0.7040361,-129.18776,-203.43045,12.423669,2.78757,-2.4116023,160.81085,665000
55
+ 0.6352337,125.87314,0.009141115,-0.0045954897,-13.0027275,0.1668117,-125.754265,126.035355,3.033558,10.398595,-4.497462,-128.51266,-196.36516,13.432153,6.107367,-7.9556923,181.35376,670000
56
+ 0.6364669,124.63878,0.009227295,-0.0057101864,-13.118836,0.18373421,-124.51773,124.8168,3.4580827,8.201751,-6.823029,-127.28357,-202.42708,11.659834,2.116748,-1.7428006,114.4395,675000
57
+ 0.6419362,125.406746,0.008967015,-0.008841272,-13.485977,0.17224248,-125.28581,125.570145,4.624267,9.031642,0.45204386,-128.87798,-196.7765,13.655909,1.8092209,-1.9410435,131.2236,680000
58
+ 0.642268,124.41244,0.009402487,0.0004180912,-12.455534,0.14879307,-124.29533,124.56165,6.2579203,12.939467,-1.5782851,-126.7949,-205.16028,19.197388,3.218024,-3.178508,229.50018,685000
59
+ 0.63574,118.316345,0.009377664,0.0073611606,-11.715033,0.16071549,-118.20648,118.48442,4.733924,9.49133,-3.3331695,-121.30088,-199.16705,14.225254,2.3889635,-2.4697561,167.38612,690000
60
+ 0.64572394,121.1819,0.009449038,0.0022357227,-12.2633915,0.18953314,-121.06602,121.373665,3.089759,10.628699,0.7910089,-123.732376,-206.0269,13.718458,1.0945746,-1.8655409,127.30032,695000
61
+ 0.6394597,124.94179,0.009276237,0.007050845,-11.7399025,0.17944793,-124.832886,125.12829,5.9589577,10.643054,-7.523777,-128.24303,-195.33495,16.602013,3.4796684,-3.5831091,199.13051,700000
62
+ 0.64227253,125.389305,0.009305858,0.0020012935,-12.284943,0.16592014,-125.27498,125.55722,3.1559978,18.720625,-6.481528,-128.17175,-204.28676,21.876623,14.048868,-12.048524,269.30795,705000
63
+ 0.6450062,119.41735,0.009276985,0.01539691,-10.840311,0.15294713,-119.31679,119.58569,4.3090243,12.949997,-2.818257,-122.638916,-198.23016,17.259022,6.58518,-6.8227367,192.06497,710000
64
+ 0.64688414,120.88283,0.009127499,0.021968266,-10.093178,0.14522363,-120.790695,121.05002,7.219116,12.08845,-0.22937278,-123.73197,-199.53816,19.307568,2.5650172,-1.8943522,215.87827,715000
65
+ 0.6389473,120.87054,0.009416742,0.0007322165,-12.422243,0.16971326,-120.75356,121.040985,3.6115067,9.3124695,-8.808804,-124.28387,-204.89542,12.923976,1.8779569,-2.5592303,116.596146,720000
66
+ 0.6449081,117.651054,0.009131734,0.01631124,-10.713785,0.13547035,-117.553215,117.80283,3.024733,10.618087,-6.8079863,-120.34341,-202.31041,13.64282,4.2206645,-4.2433844,147.37453,725000
67
+ 0.63218564,118.748,0.009264143,0.003912525,-12.07767,0.17135462,-118.636116,118.92327,3.8917577,14.469614,-9.792186,-121.82711,-202.38464,18.361372,6.9457483,-8.318788,187.83588,730000
68
+ 0.6423114,120.315414,0.009265565,-0.002635542,-12.784445,0.17469488,-120.19696,120.48748,4.164972,15.098724,-3.504759,-123.14922,-204.88583,19.263697,10.951202,-12.485553,225.47067,735000
69
+ 0.6485815,120.038895,0.009010245,0.00090772175,-12.399257,0.13647863,-119.92717,120.176285,3.3326423,9.648496,-11.413003,-123.197075,-195.85461,12.981138,2.5207741,-1.9144294,126.85292,740000
70
+ 0.6394123,124.859024,0.009174975,-0.010756701,-13.672396,0.13940638,-124.73358,124.98767,3.112807,9.732345,-1.1056793,-127.836235,-199.87358,12.845152,1.4719777,-1.4302796,123.803955,745000
71
+ 0.6417158,120.19875,0.009221682,-0.0016091791,-12.6744995,0.124537796,-120.08188,120.32168,3.6768677,12.938231,-6.9607916,-122.4162,-202.30157,16.615099,4.316939,-4.1554875,146.16086,750000
72
+ 0.64967287,119.35918,0.0093156835,0.014997332,-10.890099,0.15917838,-119.25773,119.533356,4.3555527,14.610578,-2.8076622,-121.58125,-199.56772,18.96613,1.8485432,-1.715724,173.39322,755000
73
+ 0.6412961,118.90997,0.009125584,0.012455324,-11.13512,0.1743328,-118.80836,119.09676,3.6195588,10.187041,-3.2310953,-121.186356,-203.16371,13.806601,3.0795486,-3.121655,176.3368,760000
74
+ 0.636049,119.80622,0.009219453,-0.008402573,-13.411396,0.16099207,-119.68257,119.95882,2.601303,11.837916,-3.8428798,-122.22278,-203.71954,14.439219,4.012319,-6.16646,129.2957,765000
75
+ 0.64039207,118.56178,0.009344838,-0.0036664933,-12.892355,0.15855229,-118.441315,118.71667,4.3053765,10.677342,-6.3896403,-121.41499,-199.83684,14.982719,5.5326524,-5.4297724,159.89355,770000
76
+ 0.6394213,113.8176,0.009247138,-0.0033746036,-12.864935,0.1467784,-113.69863,113.961006,5.4096575,13.256627,0.47826475,-117.06482,-200.73756,18.666285,5.517737,-5.0085163,206.72226,775000
77
+ 0.64525956,114.99387,0.008928722,0.0056562354,-11.866512,0.16207427,-114.887924,115.1616,4.045584,14.729464,-3.9274597,-118.078545,-199.33803,18.775047,6.6305823,-6.785177,218.12198,780000
78
+ 0.6446402,114.338455,0.009297281,-0.0011017432,-12.618502,0.17109822,-114.22113,114.50845,3.524936,9.275496,3.1658447,-118.17931,-201.28346,12.800431,2.2261078,-2.184962,138.99338,785000
79
+ 0.6370356,120.61284,0.0089479955,-0.017739743,-14.482538,0.15710838,-120.483246,120.75221,6.147721,9.121507,-9.082663,-123.458046,-197.76074,15.269228,2.288703,-2.032179,174.33551,790000
80
+ 0.6429846,117.905106,0.009375071,-0.0011138852,-12.6188135,0.16107337,-117.7868,118.06506,4.1211476,12.273775,-5.1462407,-121.359474,-202.5615,16.394922,2.1706064,-2.0880418,158.39401,795000
81
+ 0.64650136,114.83568,0.008848266,0.013271352,-11.000118,0.15032743,-114.73834,114.99928,3.0729408,8.159675,-6.132368,-118.179565,-203.69879,11.232615,2.5788658,-2.6245677,136.17926,800000
82
+ 0.6431491,116.67439,0.009088537,0.00928756,-11.478102,0.16518313,-116.57007,116.84886,7.557817,13.721298,-2.3196435,-119.51354,-196.93135,21.279116,3.4324453,-3.624996,247.61003,805000
83
+ 0.6455818,119.77748,0.009094914,0.009117223,-11.497547,0.16878155,-119.67291,119.95538,3.68769,6.9453483,-6.4024734,-122.07129,-194.99864,10.6330385,0.734258,-1.1429008,97.99921,810000
84
+ 0.6502924,115.26128,0.009075126,-0.0053802636,-13.092858,0.1640602,-115.14246,115.41996,3.413379,8.987651,-2.6419368,-118.12062,-201.1917,12.40103,1.9453199,-2.2579122,139.81699,815000
85
+ 0.637968,119.7455,0.009303941,-0.001784843,-12.691837,0.15588452,-119.62741,119.8996,3.6945565,11.071761,-11.536994,-122.28511,-200.62825,14.766317,5.409694,-5.3333964,168.48067,820000
86
+ 0.6484833,113.85289,0.009408035,0.00025082688,-12.473339,0.15514737,-113.735535,114.008286,4.9894166,16.582642,-0.3767514,-117.593315,-203.68202,21.572058,6.0679865,-7.4515443,221.52097,825000
87
+ 0.65072936,115.83453,0.009066216,0.023843033,-9.870123,0.16931984,-115.745056,116.027695,3.7486634,9.806767,-1.1834062,-118.62182,-198.53664,13.555431,0.7567306,-0.6383513,113.47882,830000
88
+ 0.64777327,116.38169,0.009046122,0.01368225,-10.987501,0.16020906,-116.2823,116.55558,3.235555,12.214309,-5.447961,-119.20636,-203.40427,15.449863,4.7035165,-4.5906734,171.67317,835000
89
+ 0.6372964,114.535164,0.009109437,-0.022106595,-14.92678,0.1674165,-114.3992,114.68047,3.6357872,11.278679,-8.995079,-117.29949,-204.10211,14.914466,3.880208,-4.1821175,155.23216,840000
90
+ 0.6389389,120.69818,0.0090827625,-0.008840088,-13.473282,0.14349116,-120.575806,120.83283,2.8732355,12.640123,-1.6545792,-123.93166,-199.67021,15.513359,1.8889868,-2.1146142,137.2093,845000
91
+ 0.64560276,114.25324,0.008988986,0.00854155,-11.549776,0.14942276,-114.14942,114.41121,3.956786,11.900589,-4.4078064,-117.89207,-203.58093,15.857375,1.6342654,-1.4599236,152.61195,850000
92
+ 0.6423073,116.030426,0.008984615,-0.00065417995,-12.572811,0.15660065,-115.917465,116.18637,4.3575244,10.090316,-3.6139567,-119.073265,-198.6808,14.44784,2.4314835,-2.4375744,145.46875,855000
93
+ 0.64501417,111.97113,0.008995396,0.0016631999,-12.315105,0.1638041,-111.86036,112.1366,5.148681,11.325249,-5.577162,-114.586205,-195.34927,16.47393,3.304754,-3.6494427,148.78964,860000
94
+ 0.641198,113.05025,0.008996571,0.0014754767,-12.335996,0.14870684,-112.93926,113.200424,3.5794506,13.1505575,-1.1891043,-116.04822,-198.64372,16.730007,3.2186806,-4.32603,139.86899,865000
95
+ 0.64886314,111.066284,0.009020278,0.0044897944,-12.002255,0.13822092,-110.95802,111.20899,5.0043845,10.871202,11.923709,-114.20818,-199.5469,15.875587,4.5049605,-4.001946,180.2392,870000
96
+ 0.6479572,110.74069,0.009058282,0.0033148404,-12.134054,0.12534943,-110.63079,110.869354,3.6635785,11.246657,1.836301,-114.64297,-200.82486,14.910236,5.0740104,-5.175359,164.79837,875000
97
+ 0.63383955,113.76301,0.00899682,-0.010783535,-13.698594,0.16139245,-113.639755,113.91362,4.357194,10.0087,0.6138143,-116.99766,-202.1591,14.365894,1.2654829,-1.2759504,129.03535,880000
98
+ 0.6416048,113.553925,0.0091427965,-0.0008181185,-12.589482,0.13064691,-113.43882,113.683754,4.1266036,8.992571,1.6297456,-116.12827,-201.60596,13.119175,2.0314193,-1.9348761,137.30453,885000
99
+ 0.64291275,111.4379,0.009079064,0.005191203,-11.928223,0.1510078,-111.329605,111.59409,4.097607,17.816105,4.458632,-114.123924,-201.8971,21.913712,8.962136,-9.274958,253.3046,890000
100
+ 0.635887,104.33165,0.008916115,-0.014020458,-14.072485,0.118818596,-104.20618,104.43645,4.02766,12.573307,-5.001734,-107.91937,-199.74426,16.600967,5.827271,-5.1061497,225.48383,895000
101
+ 0.6362478,109.10452,0.009049487,-0.010963438,-13.711498,0.15623471,-108.980446,109.249794,4.942483,11.649042,7.6461205,-112.06869,-200.46214,16.591526,1.757865,-1.8579618,141.35522,900000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
2
+ 0.643265,152.65453,0.0075980597,-0.005156799,-13.1786995,0.19453254,-152.55438,152.8439,1.6845665,6.2422547,-69.90439,-155.14688,-195.06387,7.926821,7.221267,-7.138418,127.3331,405000
3
+ 0.6443439,148.96472,0.007623238,-0.0039529493,-13.018539,0.195763,-148.86548,149.15654,1.1565669,6.592435,-55.016033,-151.66153,-193.22118,7.7490015,4.849304,-4.620331,103.49316,410000
4
+ 0.64733785,150.39694,0.007689698,0.0037162567,-12.016723,0.20818043,-150.30453,150.60884,1.3898687,3.6582024,-40.803207,-153.1081,-192.90053,5.048071,0.7240639,-0.83049333,53.08139,415000
5
+ 0.63025695,150.69656,0.007644919,-0.018109744,-14.86886,0.17575951,-150.58289,150.85422,3.5650995,6.2941794,-35.494335,-153.81473,-198.78122,9.859279,4.721145,-4.6399603,96.43646,420000
6
+ 0.6394948,148.69543,0.007879713,-0.010390713,-13.818666,0.19849652,-148.58656,148.88354,1.6594177,4.203403,-60.683037,-150.82204,-199.19528,5.8628206,0.4290268,-0.8757771,55.75992,425000
7
+ 0.64110625,146.80826,0.008117279,-0.0098519055,-13.713696,0.19555739,-146.69695,146.99396,2.7539022,5.460565,-67.055626,-149.05803,-197.10396,8.214467,1.2576982,-1.4600021,82.27845,430000
8
+ 0.6453779,147.9339,0.0083820885,0.0029202646,-12.151607,0.16857024,-147.83203,148.10538,1.9877169,5.955225,-53.18908,-150.20258,-197.16711,7.9429417,3.9273055,-3.6610806,97.29001,435000
9
+ 0.63677776,146.01132,0.008372984,-0.011563878,-13.881094,0.21518959,-145.8951,146.21495,1.8477007,7.36026,-62.01387,-149.57384,-196.66193,9.207961,2.836074,-3.1542444,99.97038,440000
10
+ 0.64508986,146.5398,0.008659959,0.004350907,-11.997583,0.17904796,-146.4359,146.72319,2.079761,4.893556,-76.04396,-148.96953,-198.40472,6.973317,0.7199221,-0.6550503,62.1195,445000
11
+ 0.6458272,146.02335,0.008711074,-0.005442377,-13.124765,0.17512862,-145.90903,146.19302,2.6926954,7.7760406,-49.00423,-148.6982,-195.84305,10.468736,1.7271746,-1.8109988,100.45282,450000
12
+ 0.63606185,141.1145,0.008721768,-0.016547816,-14.397301,0.19846252,-140.98892,141.29642,4.1386375,9.751056,-30.95133,-144.47643,-197.00487,13.889693,5.2832966,-5.7666063,134.73117,455000
13
+ 0.6304907,140.45709,0.008636576,-0.007640728,-13.384694,0.20934844,-140.3415,140.6588,2.560434,6.54695,-15.041662,-144.06982,-200.3571,9.107384,2.4911425,-2.2260344,90.06359,460000
14
+ 0.6461242,142.59235,0.009241166,-0.00742111,-13.303049,0.16549623,-142.46942,142.75043,2.8859153,6.678305,-37.393517,-145.73119,-199.4401,9.56422,3.588069,-3.8886454,131.529,465000
15
+ 0.63835174,137.17221,0.009153864,-0.00927492,-13.513225,0.19685173,-137.04852,137.35979,2.3040679,6.64704,-12.077508,-139.83035,-201.11758,8.951108,0.662961,-0.6118509,80.3447,470000
16
+ 0.636791,140.49677,0.008969372,0.0013449576,-12.35005,0.18450841,-140.386,140.68262,2.2069557,7.85164,-49.18793,-143.24821,-199.64223,10.058596,7.993062,-8.185585,155.33798,475000
17
+ 0.6409978,141.1199,0.009169036,-0.007687983,-13.338472,0.1909186,-140.99762,141.30313,3.6679192,8.048097,-24.145462,-144.12032,-197.68916,11.716016,2.9970076,-2.6262205,119.554115,480000
18
+ 0.6424893,137.79854,0.009290451,-0.00013378698,-12.5144005,0.14880964,-137.68228,137.9472,22.000315,11.174199,-15.819845,-140.59036,-199.06825,33.174515,3.3323183,-3.6682336,209.87292,485000
19
+ 0.6407904,139.0167,0.009304904,-0.0037474616,-12.9027405,0.1729816,-138.89664,139.18593,3.6505897,8.854815,-35.79149,-141.69661,-197.85912,12.505404,1.4219191,-1.1101617,115.42937,490000
20
+ 0.6489133,137.70428,0.009278906,0.011863679,-11.221436,0.16880465,-137.60016,137.88495,3.728275,6.526652,-40.970444,-139.835,-202.96701,10.254927,3.4157968,-3.0090754,113.16118,495000
21
+ 0.6348133,132.5325,0.009405187,-0.0060831946,-13.146791,0.17262039,-132.40887,132.69904,3.4102776,12.449433,-29.500406,-135.86003,-201.89275,15.859711,7.025614,-5.037615,165.11766,500000
22
+ 0.64744717,137.10468,0.009569492,0.010549205,-11.397621,0.20057473,-136.9956,137.3158,4.431602,8.602759,-14.177907,-140.24667,-204.22095,13.034361,3.6961584,-3.5097754,128.03806,505000
23
+ 0.63906175,133.45816,0.009788549,-0.007136525,-13.229069,0.21215679,-133.32866,133.66318,2.7197397,8.863651,-30.563284,-136.45238,-197.2954,11.583391,1.9749013,-1.8228719,112.54745,510000
24
+ 0.6284626,132.69055,0.009541794,-0.0037744364,-12.895569,0.16725533,-132.56749,132.85403,3.1126735,8.000861,0.85641015,-136.09488,-200.97098,11.113535,1.759632,-2.502218,139.16891,515000
25
+ 0.64500695,137.42258,0.00939177,-0.0070233345,-13.247818,0.16561514,-137.29816,137.58118,4.5604343,8.342742,-24.545494,-140.16081,-204.63425,12.903176,3.698126,-3.30907,130.29153,520000
26
+ 0.63528293,138.83827,0.009205186,-0.01626431,-14.266864,0.18647166,-138.70694,139.00848,6.4796076,9.556769,-17.410664,-141.93828,-198.71825,16.036377,2.0732527,-3.413546,191.44763,525000
27
+ 0.6441838,135.42743,0.00935569,0.011751502,-11.243919,0.179466,-135.32224,135.61864,3.7248764,11.231298,-35.06821,-139.19394,-197.76611,14.956175,1.125839,-1.181033,139.25243,530000
28
+ 0.6373442,135.46848,0.009383752,-0.005081249,-13.041494,0.2124522,-135.3461,135.67584,3.1229825,12.464222,2.3601658,-139.29008,-203.50812,15.587204,2.958001,-3.3280227,138.847,535000
29
+ 0.64509916,132.30405,0.009146708,0.0065777553,-11.780861,0.1513429,-132.19629,132.46196,3.3612955,12.199487,-21.834372,-135.75586,-201.94147,15.560782,4.513779,-5.4859815,161.33307,540000
30
+ 0.650798,132.16324,0.009553216,0.0072578774,-11.740269,0.18534383,-132.05109,132.35585,4.345029,11.460006,-9.838492,-134.74666,-202.94554,15.805035,6.2655725,-7.225169,179.4553,545000
31
+ 0.6387239,135.15762,0.009442728,-0.01627431,-14.223475,0.15254796,-135.02332,135.29388,3.4887524,11.294269,-18.863207,-136.90288,-200.91827,14.783021,2.2291398,-2.073104,166.8576,550000
32
+ 0.6460562,130.77686,0.009549049,0.0067690155,-11.791132,0.19001442,-130.66426,130.97365,6.5474167,12.459838,-6.917731,-133.65706,-195.06636,19.007256,2.5336194,-1.9291397,229.8836,555000
33
+ 0.648825,132.69962,0.009525128,0.015966173,-10.823784,0.16909772,-132.59653,132.88467,3.3722382,7.942862,-8.805404,-135.6614,-202.06053,11.3151,5.252202,-4.5160875,134.98666,560000
34
+ 0.63904476,133.41344,0.009537217,-0.0070215845,-13.23623,0.18797976,-133.2872,133.59439,2.488747,9.43185,-1.1263504,-136.4121,-203.5711,11.920597,6.5413623,-7.189885,145.79277,565000
35
+ 0.6539054,130.65945,0.009561684,0.02993047,-9.369749,0.17164996,-130.56987,130.86104,2.2678115,8.377403,-11.197053,-132.75105,-201.72568,10.645215,2.656642,-2.6378708,117.990875,570000
36
+ 0.6417743,133.6405,0.009319901,-0.0016464231,-12.676657,0.1904467,-133.52235,133.8293,3.7009828,11.98055,-16.672588,-136.88046,-202.71912,15.681533,7.3082747,-6.823574,199.46136,575000
37
+ 0.6474547,133.28178,0.009433002,0.0065887873,-11.8015175,0.15672144,-133.17047,133.4451,6.8757987,10.12779,2.168981,-135.93913,-203.05162,17.00359,8.111816,-6.1184196,325.20587,580000
38
+ 0.6362356,129.07503,0.00953307,-0.01410663,-13.979757,0.17374966,-128.94176,129.23468,4.0266347,21.329227,-2.899532,-132.77055,-198.16188,25.355862,7.3632646,-6.621008,191.59583,585000
39
+ 0.64266616,128.15894,0.009391232,-0.005018486,-13.03438,0.16655923,-128.03653,128.32048,2.7065365,9.222795,-11.34628,-131.02423,-205.41644,11.929331,2.8027027,-2.7968805,119.150246,590000
40
+ 0.6349283,130.84866,0.00927468,-0.0073326314,-13.290607,0.16503978,-130.7254,131.00636,3.491169,10.64731,-17.303635,-133.57108,-202.47365,14.138479,4.7184877,-5.0372243,144.67726,595000
41
+ 0.63584894,128.43484,0.009623543,-0.002680667,-12.778553,0.1638084,-128.31187,128.59596,6.234959,15.365386,-7.9687476,-132.39389,-200.77492,21.600346,2.8783817,-3.211027,194.56989,600000
42
+ 0.63393444,128.14713,0.009500139,-0.0056832717,-13.09823,0.16553152,-128.0227,128.30698,3.0246034,10.972584,-15.471093,-131.29556,-198.21265,13.997187,2.2656443,-2.9817133,128.55583,605000
43
+ 0.6371266,128.60109,0.009423305,0.0001453699,-12.484573,0.16543177,-128.48344,128.76668,2.694495,7.942016,-13.372177,-130.92525,-203.92157,10.636511,4.7059646,-2.7336006,163.26659,610000
44
+ 0.63748056,131.12636,0.009095032,-0.011593759,-13.774735,0.16338561,-131.0011,131.27815,3.3655014,11.176664,-13.467462,-133.55475,-201.98048,14.542166,6.525617,-4.7287097,159.42883,615000
45
+ 0.63954675,126.92883,0.009158885,-0.012469034,-13.861414,0.1675699,-126.80188,127.08394,3.5732179,11.863883,-6.740142,-130.08035,-197.03038,15.437101,1.2872832,-0.95074147,138.11382,620000
46
+ 0.633351,121.55235,0.009612724,0.011473011,-11.306477,0.16228493,-121.44367,121.72611,3.5356958,9.095477,-2.1091099,-124.54231,-202.15108,12.631173,3.021589,-2.7533305,113.058624,625000
47
+ 0.64548504,129.50552,0.009381985,0.011635914,-11.25976,0.1605006,-129.39987,129.67767,3.4521043,8.605102,-6.2098813,-132.73816,-202.84927,12.057206,2.121385,-2.27052,121.49571,630000
48
+ 0.6450627,124.29553,0.009672853,0.011927512,-11.266909,0.15590137,-124.18655,124.463356,3.6854446,8.587611,-2.6847208,-127.15493,-195.93513,12.273056,3.14279,-2.636501,117.09846,635000
49
+ 0.64918554,124.7937,0.00923872,-2.9991725e-05,-12.503246,0.16436242,-124.678185,124.95803,10.66199,14.948421,1.9969046,-128.32463,-200.02194,25.61041,3.2680602,-3.4829195,242.4981,640000
50
+ 0.6386839,125.597275,0.009541889,-0.0072116163,-13.255785,0.16297925,-125.47079,125.753044,4.1934776,10.757285,-3.7805688,-128.48434,-199.75212,14.950763,2.9411237,-2.7413871,160.30177,645000
51
+ 0.63721436,117.85981,0.009270427,0.0079568,-11.641701,0.17458336,-117.751884,118.04235,4.617673,14.593101,-7.1603174,-121.37764,-199.27422,19.210773,3.3791864,-4.535394,196.26782,650000
52
+ 0.6494256,127.7482,0.009223907,-0.005337682,-13.078679,0.19925213,-127.62756,127.94211,3.2569776,8.749644,0.2056885,-130.63356,-199.90045,12.006622,2.6632104,-2.655586,128.81789,655000
53
+ 0.6335176,124.98389,0.009340846,-0.004289966,-12.95927,0.19523033,-124.86284,125.17483,3.9020562,9.751259,3.8140016,-129.21977,-203.04486,13.653315,2.769002,-1.9850646,134.84763,660000
54
+ 0.64474857,126.51434,0.0092457235,-0.004354125,-12.970934,0.17572448,-126.3944,126.685715,3.6014366,8.822232,-0.7040361,-129.18776,-203.43045,12.423669,2.78757,-2.4116023,160.81085,665000
55
+ 0.6352337,125.87314,0.009141115,-0.0045954897,-13.0027275,0.1668117,-125.754265,126.035355,3.033558,10.398595,-4.497462,-128.51266,-196.36516,13.432153,6.107367,-7.9556923,181.35376,670000
56
+ 0.6364669,124.63878,0.009227295,-0.0057101864,-13.118836,0.18373421,-124.51773,124.8168,3.4580827,8.201751,-6.823029,-127.28357,-202.42708,11.659834,2.116748,-1.7428006,114.4395,675000
57
+ 0.6419362,125.406746,0.008967015,-0.008841272,-13.485977,0.17224248,-125.28581,125.570145,4.624267,9.031642,0.45204386,-128.87798,-196.7765,13.655909,1.8092209,-1.9410435,131.2236,680000
58
+ 0.642268,124.41244,0.009402487,0.0004180912,-12.455534,0.14879307,-124.29533,124.56165,6.2579203,12.939467,-1.5782851,-126.7949,-205.16028,19.197388,3.218024,-3.178508,229.50018,685000
59
+ 0.63574,118.316345,0.009377664,0.0073611606,-11.715033,0.16071549,-118.20648,118.48442,4.733924,9.49133,-3.3331695,-121.30088,-199.16705,14.225254,2.3889635,-2.4697561,167.38612,690000
60
+ 0.64572394,121.1819,0.009449038,0.0022357227,-12.2633915,0.18953314,-121.06602,121.373665,3.089759,10.628699,0.7910089,-123.732376,-206.0269,13.718458,1.0945746,-1.8655409,127.30032,695000
61
+ 0.6394597,124.94179,0.009276237,0.007050845,-11.7399025,0.17944793,-124.832886,125.12829,5.9589577,10.643054,-7.523777,-128.24303,-195.33495,16.602013,3.4796684,-3.5831091,199.13051,700000
62
+ 0.64227253,125.389305,0.009305858,0.0020012935,-12.284943,0.16592014,-125.27498,125.55722,3.1559978,18.720625,-6.481528,-128.17175,-204.28676,21.876623,14.048868,-12.048524,269.30795,705000
63
+ 0.6450062,119.41735,0.009276985,0.01539691,-10.840311,0.15294713,-119.31679,119.58569,4.3090243,12.949997,-2.818257,-122.638916,-198.23016,17.259022,6.58518,-6.8227367,192.06497,710000
64
+ 0.64688414,120.88283,0.009127499,0.021968266,-10.093178,0.14522363,-120.790695,121.05002,7.219116,12.08845,-0.22937278,-123.73197,-199.53816,19.307568,2.5650172,-1.8943522,215.87827,715000
65
+ 0.6389473,120.87054,0.009416742,0.0007322165,-12.422243,0.16971326,-120.75356,121.040985,3.6115067,9.3124695,-8.808804,-124.28387,-204.89542,12.923976,1.8779569,-2.5592303,116.596146,720000
66
+ 0.6449081,117.651054,0.009131734,0.01631124,-10.713785,0.13547035,-117.553215,117.80283,3.024733,10.618087,-6.8079863,-120.34341,-202.31041,13.64282,4.2206645,-4.2433844,147.37453,725000
67
+ 0.63218564,118.748,0.009264143,0.003912525,-12.07767,0.17135462,-118.636116,118.92327,3.8917577,14.469614,-9.792186,-121.82711,-202.38464,18.361372,6.9457483,-8.318788,187.83588,730000
68
+ 0.6423114,120.315414,0.009265565,-0.002635542,-12.784445,0.17469488,-120.19696,120.48748,4.164972,15.098724,-3.504759,-123.14922,-204.88583,19.263697,10.951202,-12.485553,225.47067,735000
69
+ 0.6485815,120.038895,0.009010245,0.00090772175,-12.399257,0.13647863,-119.92717,120.176285,3.3326423,9.648496,-11.413003,-123.197075,-195.85461,12.981138,2.5207741,-1.9144294,126.85292,740000
70
+ 0.6394123,124.859024,0.009174975,-0.010756701,-13.672396,0.13940638,-124.73358,124.98767,3.112807,9.732345,-1.1056793,-127.836235,-199.87358,12.845152,1.4719777,-1.4302796,123.803955,745000
71
+ 0.6417158,120.19875,0.009221682,-0.0016091791,-12.6744995,0.124537796,-120.08188,120.32168,3.6768677,12.938231,-6.9607916,-122.4162,-202.30157,16.615099,4.316939,-4.1554875,146.16086,750000
72
+ 0.64967287,119.35918,0.0093156835,0.014997332,-10.890099,0.15917838,-119.25773,119.533356,4.3555527,14.610578,-2.8076622,-121.58125,-199.56772,18.96613,1.8485432,-1.715724,173.39322,755000
73
+ 0.6412961,118.90997,0.009125584,0.012455324,-11.13512,0.1743328,-118.80836,119.09676,3.6195588,10.187041,-3.2310953,-121.186356,-203.16371,13.806601,3.0795486,-3.121655,176.3368,760000
74
+ 0.636049,119.80622,0.009219453,-0.008402573,-13.411396,0.16099207,-119.68257,119.95882,2.601303,11.837916,-3.8428798,-122.22278,-203.71954,14.439219,4.012319,-6.16646,129.2957,765000
75
+ 0.64039207,118.56178,0.009344838,-0.0036664933,-12.892355,0.15855229,-118.441315,118.71667,4.3053765,10.677342,-6.3896403,-121.41499,-199.83684,14.982719,5.5326524,-5.4297724,159.89355,770000
76
+ 0.6394213,113.8176,0.009247138,-0.0033746036,-12.864935,0.1467784,-113.69863,113.961006,5.4096575,13.256627,0.47826475,-117.06482,-200.73756,18.666285,5.517737,-5.0085163,206.72226,775000
77
+ 0.64525956,114.99387,0.008928722,0.0056562354,-11.866512,0.16207427,-114.887924,115.1616,4.045584,14.729464,-3.9274597,-118.078545,-199.33803,18.775047,6.6305823,-6.785177,218.12198,780000
78
+ 0.6446402,114.338455,0.009297281,-0.0011017432,-12.618502,0.17109822,-114.22113,114.50845,3.524936,9.275496,3.1658447,-118.17931,-201.28346,12.800431,2.2261078,-2.184962,138.99338,785000
79
+ 0.6370356,120.61284,0.0089479955,-0.017739743,-14.482538,0.15710838,-120.483246,120.75221,6.147721,9.121507,-9.082663,-123.458046,-197.76074,15.269228,2.288703,-2.032179,174.33551,790000
80
+ 0.6429846,117.905106,0.009375071,-0.0011138852,-12.6188135,0.16107337,-117.7868,118.06506,4.1211476,12.273775,-5.1462407,-121.359474,-202.5615,16.394922,2.1706064,-2.0880418,158.39401,795000
81
+ 0.64650136,114.83568,0.008848266,0.013271352,-11.000118,0.15032743,-114.73834,114.99928,3.0729408,8.159675,-6.132368,-118.179565,-203.69879,11.232615,2.5788658,-2.6245677,136.17926,800000
82
+ 0.6431491,116.67439,0.009088537,0.00928756,-11.478102,0.16518313,-116.57007,116.84886,7.557817,13.721298,-2.3196435,-119.51354,-196.93135,21.279116,3.4324453,-3.624996,247.61003,805000
83
+ 0.6455818,119.77748,0.009094914,0.009117223,-11.497547,0.16878155,-119.67291,119.95538,3.68769,6.9453483,-6.4024734,-122.07129,-194.99864,10.6330385,0.734258,-1.1429008,97.99921,810000
84
+ 0.6502924,115.26128,0.009075126,-0.0053802636,-13.092858,0.1640602,-115.14246,115.41996,3.413379,8.987651,-2.6419368,-118.12062,-201.1917,12.40103,1.9453199,-2.2579122,139.81699,815000
85
+ 0.637968,119.7455,0.009303941,-0.001784843,-12.691837,0.15588452,-119.62741,119.8996,3.6945565,11.071761,-11.536994,-122.28511,-200.62825,14.766317,5.409694,-5.3333964,168.48067,820000
86
+ 0.6484833,113.85289,0.009408035,0.00025082688,-12.473339,0.15514737,-113.735535,114.008286,4.9894166,16.582642,-0.3767514,-117.593315,-203.68202,21.572058,6.0679865,-7.4515443,221.52097,825000
87
+ 0.65072936,115.83453,0.009066216,0.023843033,-9.870123,0.16931984,-115.745056,116.027695,3.7486634,9.806767,-1.1834062,-118.62182,-198.53664,13.555431,0.7567306,-0.6383513,113.47882,830000
88
+ 0.64777327,116.38169,0.009046122,0.01368225,-10.987501,0.16020906,-116.2823,116.55558,3.235555,12.214309,-5.447961,-119.20636,-203.40427,15.449863,4.7035165,-4.5906734,171.67317,835000
89
+ 0.6372964,114.535164,0.009109437,-0.022106595,-14.92678,0.1674165,-114.3992,114.68047,3.6357872,11.278679,-8.995079,-117.29949,-204.10211,14.914466,3.880208,-4.1821175,155.23216,840000
90
+ 0.6389389,120.69818,0.0090827625,-0.008840088,-13.473282,0.14349116,-120.575806,120.83283,2.8732355,12.640123,-1.6545792,-123.93166,-199.67021,15.513359,1.8889868,-2.1146142,137.2093,845000
91
+ 0.64560276,114.25324,0.008988986,0.00854155,-11.549776,0.14942276,-114.14942,114.41121,3.956786,11.900589,-4.4078064,-117.89207,-203.58093,15.857375,1.6342654,-1.4599236,152.61195,850000
92
+ 0.6423073,116.030426,0.008984615,-0.00065417995,-12.572811,0.15660065,-115.917465,116.18637,4.3575244,10.090316,-3.6139567,-119.073265,-198.6808,14.44784,2.4314835,-2.4375744,145.46875,855000
93
+ 0.64501417,111.97113,0.008995396,0.0016631999,-12.315105,0.1638041,-111.86036,112.1366,5.148681,11.325249,-5.577162,-114.586205,-195.34927,16.47393,3.304754,-3.6494427,148.78964,860000
94
+ 0.641198,113.05025,0.008996571,0.0014754767,-12.335996,0.14870684,-112.93926,113.200424,3.5794506,13.1505575,-1.1891043,-116.04822,-198.64372,16.730007,3.2186806,-4.32603,139.86899,865000
95
+ 0.64886314,111.066284,0.009020278,0.0044897944,-12.002255,0.13822092,-110.95802,111.20899,5.0043845,10.871202,11.923709,-114.20818,-199.5469,15.875587,4.5049605,-4.001946,180.2392,870000
96
+ 0.6479572,110.74069,0.009058282,0.0033148404,-12.134054,0.12534943,-110.63079,110.869354,3.6635785,11.246657,1.836301,-114.64297,-200.82486,14.910236,5.0740104,-5.175359,164.79837,875000
97
+ 0.63383955,113.76301,0.00899682,-0.010783535,-13.698594,0.16139245,-113.639755,113.91362,4.357194,10.0087,0.6138143,-116.99766,-202.1591,14.365894,1.2654829,-1.2759504,129.03535,880000
98
+ 0.6416048,113.553925,0.0091427965,-0.0008181185,-12.589482,0.13064691,-113.43882,113.683754,4.1266036,8.992571,1.6297456,-116.12827,-201.60596,13.119175,2.0314193,-1.9348761,137.30453,885000
99
+ 0.64291275,111.4379,0.009079064,0.005191203,-11.928223,0.1510078,-111.329605,111.59409,4.097607,17.816105,4.458632,-114.123924,-201.8971,21.913712,8.962136,-9.274958,253.3046,890000
100
+ 0.635887,104.33165,0.008916115,-0.014020458,-14.072485,0.118818596,-104.20618,104.43645,4.02766,12.573307,-5.001734,-107.91937,-199.74426,16.600967,5.827271,-5.1061497,225.48383,895000
101
+ 0.6362478,109.10452,0.009049487,-0.010963438,-13.711498,0.15623471,-108.980446,109.249794,4.942483,11.649042,7.6461205,-112.06869,-200.46214,16.591526,1.757865,-1.8579618,141.35522,900000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19f2dfd2d6577293eebf0748a704d3803ca4760ed98251ed59d64c6bbe8936af
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f2ff1a4fae88d87ece49b5af75463a748881a1a266b1cd6b08190870d3be48b
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b8bb35d27d799b8783d7bfaaced7e3fb9e7939534307badcae55497ab0e9222
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4634a336634f04065a93e1f4971acc73779805b804a72275aed246bcd51a30d3
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb9448125721fb12acf73471db82cb489f349f52b43d90ecd7d302120958a69c
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a9a278ed7a7c75a0e7e11b45304036203e87e868dc45edca37ec1f7db58d7f8
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1818b5f69625d4c0a8297399da97eab7475de24d396ca36dc9b5ca0926de163a
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd230066c9fb3255a91a21799ebc0115efcfa4ff37be47db9161992260ec404d
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aa6399d0f17893fd4522edc6dc15922e798555e989e5b9c2dbd424c99cc656b
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7566b9646b44d6b330007467846822c428e114beb51e583e0a240faab809f4f
3
+ size 326957888
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_042444/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/mcdblpoi