Tiredsheep commited on
Commit
5058f26
·
verified ·
1 Parent(s): bab73cd

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_1000000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_550000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_600000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_650000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_700000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_750000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_800000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_850000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_900000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_950000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.017761307720437252,0.006935031885831305,-0.017360439940886672,0.004243976454457025,35.400051599173715,8.75399999999974,0.98,4223.0,-0.02,-238.72,173.08,0.5412278461456299,550000
3
+ 0.0,0.0,-0.015338114277839727,0.012971487047636752,-0.01429004795755625,0.009382590544909055,35.03147312002952,6.288999999999687,1.0,12295.92,0.0,-178.32,123.78,0.4121164035797119,600000
4
+ 0.0,0.0,-0.012447754744037216,0.04509496682186848,-0.009891532431114852,0.039267257269662965,35.77028012429479,5.460999999999821,1.0,17971.52,0.0,-150.02,107.22,0.34993260860443115,650000
5
+ 0.0,0.0,-0.010525698099156442,0.0416234097328709,-0.008314819973883253,0.03070922295547465,35.7001506378387,4.722999999999846,1.0,23282.16,0.0,-128.58,92.46,0.29866036891937253,700000
6
+ 0.0,0.0,-0.015696150941556714,0.05507102058986734,-0.01278345135040973,0.05577984157965653,35.68858745994591,3.778999999999812,1.0,27550.64,0.0,-105.96,73.58,0.24709057807922363,750000
7
+ 0.0,0.0,-0.013047293336454904,0.06943399962152856,-0.009468601769854269,0.06982167019969485,35.48529848323828,3.671999999999807,0.98,31068.76,-0.02,-106.44,71.44,0.2314702844619751,800000
8
+ 0.0,0.0,-0.014592307484209779,0.06129269632741553,-0.011098929032941468,0.06804169027399969,35.94497211158509,3.527999999999896,1.0,34745.26,0.0,-100.24,68.56,0.22135836124420166,850000
9
+ 0.0,0.0,-0.011773218523533413,0.058652554258213585,-0.007920590820251325,0.07750903128342747,34.85885149593953,3.7099999999998254,0.98,38654.3,-0.02,-106.18,72.2,0.23081892013549804,900000
10
+ 0.0,0.0,-0.012012686676858059,0.06165579842664264,-0.009069641610377193,0.06079959816693065,35.92789089903954,2.8149999999999125,1.0,41893.6,0.0,-79.7,54.3,0.17691574573516847,950000
11
+ 0.0,0.0,-0.008033427151279958,0.05029643602633587,-0.005457885086103609,0.0439714691200799,35.42565099415617,3.6429999999998457,0.98,45210.56,-0.02,-99.72,70.86,0.22782538414001466,1000000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.017761307720437252,0.006935031885831305,-0.017360439940886672,0.004243976454457025,35.400051599173715,8.75399999999974,0.98,4223.0,-0.02,-238.72,173.08,0.5412278461456299,550000
3
+ 0.0,0.0,-0.015338114277839727,0.012971487047636752,-0.01429004795755625,0.009382590544909055,35.03147312002952,6.288999999999687,1.0,12295.92,0.0,-178.32,123.78,0.4121164035797119,600000
4
+ 0.0,0.0,-0.012447754744037216,0.04509496682186848,-0.009891532431114852,0.039267257269662965,35.77028012429479,5.460999999999821,1.0,17971.52,0.0,-150.02,107.22,0.34993260860443115,650000
5
+ 0.0,0.0,-0.010525698099156442,0.0416234097328709,-0.008314819973883253,0.03070922295547465,35.7001506378387,4.722999999999846,1.0,23282.16,0.0,-128.58,92.46,0.29866036891937253,700000
6
+ 0.0,0.0,-0.015696150941556714,0.05507102058986734,-0.01278345135040973,0.05577984157965653,35.68858745994591,3.778999999999812,1.0,27550.64,0.0,-105.96,73.58,0.24709057807922363,750000
7
+ 0.0,0.0,-0.013047293336454904,0.06943399962152856,-0.009468601769854269,0.06982167019969485,35.48529848323828,3.671999999999807,0.98,31068.76,-0.02,-106.44,71.44,0.2314702844619751,800000
8
+ 0.0,0.0,-0.014592307484209779,0.06129269632741553,-0.011098929032941468,0.06804169027399969,35.94497211158509,3.527999999999896,1.0,34745.26,0.0,-100.24,68.56,0.22135836124420166,850000
9
+ 0.0,0.0,-0.011773218523533413,0.058652554258213585,-0.007920590820251325,0.07750903128342747,34.85885149593953,3.7099999999998254,0.98,38654.3,-0.02,-106.18,72.2,0.23081892013549804,900000
10
+ 0.0,0.0,-0.012012686676858059,0.06165579842664264,-0.009069641610377193,0.06079959816693065,35.92789089903954,2.8149999999999125,1.0,41893.6,0.0,-79.7,54.3,0.17691574573516847,950000
11
+ 0.0,0.0,-0.008033427151279958,0.05029643602633587,-0.005457885086103609,0.0439714691200799,35.42565099415617,3.6429999999998457,0.98,45210.56,-0.02,-99.72,70.86,0.22782538414001466,1000000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/edit_alpha_loss,actor/edit_entropy,actor/edit_entropy_loss,actor/edit_q_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 143.28134,0.2074565,-0.0025529228,-12.694628,0.16651481,142.90991,9.316321,-50.9161,-146.63748,-195.41913,0.3111859,-0.28514525,29.722538,505000
3
+ 140.49663,0.22984435,-0.011546782,-13.37108,0.17724305,140.10109,9.41867,-44.74355,-143.6895,-192.5832,1.3567142,-1.2677691,33.708652,510000
4
+ 140.56345,0.17253858,0.0030506134,-12.277097,0.16802211,140.21985,10.488258,-50.64672,-143.7935,-194.3493,0.4831032,-0.3968043,30.94076,515000
5
+ 136.83255,0.18390474,-0.028798576,-14.45815,0.2126365,136.46481,8.91912,-42.979824,-139.99092,-199.65364,0.41007784,-0.75128967,56.776943,520000
6
+ 133.78099,0.17691657,-0.019748585,-13.821551,0.20654216,133.41728,13.207109,-12.251732,-137.38335,-195.73451,0.36287335,-0.42551216,35.464684,525000
7
+ 130.17819,0.1910195,0.015712151,-11.446091,0.17064343,129.80081,17.589113,-13.926538,-133.71684,-196.21234,1.7514133,-1.355492,72.66823,530000
8
+ 127.86701,0.2061052,0.009346896,-11.8914795,0.18265352,127.4689,12.421901,-9.035285,-130.68991,-195.61353,0.41609913,-0.4582787,36.195976,535000
9
+ 127.336075,0.17742792,-0.022320185,-13.92115,0.21864167,126.962326,15.339812,-4.881917,-131.74625,-199.48753,0.63216877,-1.261208,58.528908,540000
10
+ 126.76497,0.19925883,0.029424287,-10.663227,0.17082016,126.36546,13.180686,-51.135044,-130.21802,-199.8461,0.7183905,-0.85056454,53.262093,545000
11
+ 123.378075,0.16572994,-0.0010348824,-12.561926,0.20993023,123.00345,12.081664,-7.0752783,-126.93786,-191.4067,1.0592283,-1.1364542,53.38198,550000
12
+ 121.453,0.20059574,-0.011835846,-13.219204,0.21754672,121.0467,20.52559,-4.264087,-125.38012,-191.37811,1.5241061,-1.4840485,59.614353,555000
13
+ 119.2317,0.19860837,0.0044943765,-12.2294655,0.2031675,118.825424,12.461173,-18.213417,-123.555374,-199.41025,0.8033452,-0.6652883,51.894768,560000
14
+ 118.47855,0.19551593,-0.021564493,-13.813639,0.2267626,118.07784,14.925422,-4.1972847,-122.01565,-197.64742,0.8010683,-0.8042778,60.332188,565000
15
+ 116.18288,0.1851126,-0.004394296,-12.75555,0.21933708,115.78282,23.418785,-30.660824,-120.28631,-198.73735,6.050345,-5.850951,113.54823,570000
16
+ 119.427475,0.20549375,-0.026934236,-14.067468,0.24172524,119.007195,14.260225,-1.003351,-123.44425,-198.85677,0.38879472,-0.5952026,49.0007,575000
17
+ 118.596634,0.18349192,0.0040113092,-12.265689,0.20998353,118.19914,14.145413,-18.329174,-122.80481,-195.15927,0.8494228,-0.97713614,60.47061,580000
18
+ 116.27683,0.18927048,0.013320849,-11.71828,0.19968455,115.87456,12.478149,-6.2035403,-120.23226,-196.13051,0.68641263,-0.41161114,54.213913,585000
19
+ 115.211,0.18066815,-0.033843506,-14.415256,0.25472462,114.80945,13.864821,-2.6901007,-119.37892,-186.07059,0.5529682,-0.54145455,53.305977,590000
20
+ 117.35937,0.17244548,0.009747631,-11.940727,0.20811635,116.969055,24.2144,-17.568432,-121.04639,-187.8859,1.6100451,-1.6406834,58.067493,595000
21
+ 111.50509,0.20499197,-0.0050944476,-12.784477,0.22894573,111.07625,16.517408,0.16977923,-114.95528,-185.1184,0.69595104,-0.7105099,43.706535,600000
22
+ 117.622025,0.18935427,-0.008532342,-12.9875555,0.22728543,117.21391,15.551246,-10.030614,-121.70974,-188.67764,0.8320119,-0.8346562,46.986565,605000
23
+ 114.41078,0.19858794,0.008523939,-12.006012,0.20716798,113.996506,18.05403,-5.8314953,-117.56339,-184.16844,0.8445085,-0.62474054,46.36718,610000
24
+ 110.3147,0.16883245,-0.0029703232,-12.666981,0.22532552,109.92351,18.11525,1.0797985,-114.36116,-180.88683,0.6851795,-0.85139275,54.24986,615000
25
+ 110.77624,0.1897478,-0.018583372,-13.572601,0.23515233,110.36992,13.728828,-6.96214,-114.80763,-187.46362,1.846469,-2.7234883,53.82022,620000
26
+ 114.840034,0.18055174,-0.014202491,-13.297607,0.2367821,114.436905,11.819624,-5.1231227,-118.93782,-182.7845,0.5773835,-0.46185708,39.26306,625000
27
+ 115.2894,0.16872224,-0.0053803576,-12.802316,0.22784472,114.89821,13.775658,-2.300442,-119.35519,-192.58142,1.0553025,-0.9396106,54.76763,630000
28
+ 112.71203,0.17923519,0.01085341,-11.873869,0.20582268,112.31611,10.871242,1.2118145,-116.47267,-188.06485,0.53224915,-0.75603026,50.151775,635000
29
+ 107.27183,0.19011155,-0.004511553,-12.751862,0.2284219,106.8578,16.130346,-9.075312,-111.80066,-187.44319,1.3294531,-1.4003769,72.56583,640000
30
+ 109.93601,0.1703023,0.006871534,-12.11958,0.21891636,109.53992,13.555606,-5.065763,-113.58923,-188.16502,0.74043876,-0.9976974,53.07661,645000
31
+ 111.88157,0.20644012,-0.01441718,-13.319183,0.23441033,111.45513,14.317459,-6.855903,-115.41392,-193.60707,0.96495855,-1.0128125,45.113632,650000
32
+ 109.958916,0.23624866,0.031211946,-10.776234,0.19512343,109.49633,12.549822,-6.955402,-113.17443,-183.12227,1.4634131,-1.5424864,66.22249,655000
33
+ 112.757095,0.20465562,0.030309854,-10.80677,0.19344783,112.328674,15.875626,-12.435663,-115.986305,-189.25113,0.49548393,-0.4951202,45.733917,660000
34
+ 107.38421,0.19932896,-0.013992351,-13.278299,0.23871872,106.96016,16.92983,-1.3386868,-111.87239,-188.17871,1.3252736,-1.6357639,78.12554,665000
35
+ 108.60941,0.19607729,-0.010303839,-13.07732,0.23340014,108.19025,14.1644125,-0.6105876,-112.352905,-185.45375,0.82048386,-0.6544065,43.22842,670000
36
+ 110.37937,0.21693479,0.045152523,-9.992525,0.1799371,109.93735,11.197814,-5.640813,-113.970276,-193.27817,0.7445872,-0.6516749,47.067165,675000
37
+ 108.6799,0.18846025,0.030077737,-10.832828,0.19543687,108.26593,10.8405,3.1691837,-112.00917,-183.65334,0.54612106,-0.4839947,38.445618,680000
38
+ 105.79221,0.18828481,0.0010955161,-12.439453,0.22507557,105.377754,12.8331785,0.55582917,-109.95359,-184.63109,0.38948628,-0.3895249,39.50709,685000
39
+ 103.282776,0.1773283,-0.022576705,-13.753536,0.24770686,102.88032,10.675292,-0.73179466,-107.31248,-197.55547,1.0039047,-1.1587648,48.53447,690000
40
+ 107.62855,0.22850604,-0.003291909,-12.679919,0.23199931,107.171326,12.150802,-2.3041818,-110.962685,-193.48119,0.9044064,-0.99638957,49.365906,695000
41
+ 106.53814,0.2210866,-0.0038857001,-12.714422,0.23040725,106.09053,12.166196,-1.9838437,-110.293846,-192.0081,0.61162156,-0.6175407,43.214836,700000
42
+ 106.945816,0.19681974,0.005096055,-12.212406,0.21639925,106.5275,10.460186,-2.6234,-110.6079,-177.44191,1.11167,-1.339971,46.380444,705000
43
+ 102.4805,0.18438736,-0.011703598,-13.1581335,0.2339913,102.07382,15.750922,-2.545451,-106.52651,-176.43634,0.76915205,-0.6033859,63.131744,710000
44
+ 106.94846,0.19644488,0.0062645674,-12.153122,0.21948363,106.526276,7.358129,-5.9444184,-110.567375,-199.22948,0.60625905,-0.50507,42.809444,715000
45
+ 106.21344,0.19751033,0.02121782,-11.314495,0.20250352,105.792206,12.381358,-4.78306,-109.87494,-182.46965,0.68496305,-0.72429156,51.477707,720000
46
+ 99.23157,0.18730806,0.030273255,-10.82225,0.1952763,98.81871,15.450419,-0.4019777,-103.020096,-179.09052,0.85119265,-0.8195476,56.0327,725000
47
+ 104.96097,0.21989709,0.043049138,-10.132208,0.18421501,104.51381,12.630412,-5.527227,-108.64056,-187.4598,0.49613625,-0.56362015,43.206123,730000
48
+ 101.26231,0.20941108,0.06762458,-8.758447,0.15829957,100.826965,8.764976,-1.9525692,-104.420364,-181.78157,1.0781181,-0.6549449,52.775024,735000
49
+ 101.67419,0.16680336,0.020026444,-11.378108,0.20310602,101.28425,14.041684,1.9539287,-106.01375,-187.79153,0.62365365,-0.48937526,48.33013,740000
50
+ 104.70706,0.17516641,-0.01775539,-13.491887,0.24151309,104.308136,15.620135,-1.9256938,-108.84143,-191.3666,0.90966,-0.85861003,64.849785,745000
51
+ 95.136375,0.18335038,0.008861065,-12.002774,0.21390156,94.73026,12.838347,-5.499854,-99.384995,-184.14594,1.0916309,-1.0820476,54.3518,750000
52
+ 105.12762,0.20378208,0.04061434,-10.191557,0.17930846,104.70392,9.798882,-3.192951,-108.87144,-189.6246,0.64739823,-0.6190205,38.078976,755000
53
+ 101.56124,0.21794939,0.006463703,-12.129636,0.21168989,101.12514,14.573952,1.4679776,-105.42034,-184.03635,0.3801586,-0.42723027,39.692043,760000
54
+ 104.38467,0.20436284,0.0028443874,-12.338682,0.21755804,103.9599,11.768947,-1.0563667,-107.46883,-193.92847,1.1621745,-0.9333603,40.258297,765000
55
+ 100.92495,0.20546843,0.0069654677,-12.097976,0.20960939,100.50291,14.008814,-5.148627,-104.78528,-183.5098,0.48842108,-1.1954346,51.550903,770000
56
+ 99.50052,0.21021092,0.007124086,-12.100387,0.21571898,99.06746,15.314357,-3.7557726,-103.31524,-196.4251,0.7227153,-0.73592716,57.675125,775000
57
+ 103.02482,0.2117524,-0.011561627,-13.156497,0.23170024,102.592926,13.934567,-2.280092,-107.320694,-183.68738,0.54075694,-0.93361485,47.214752,780000
58
+ 99.81062,0.20865318,0.0019991691,-12.386383,0.21794702,99.38202,9.919845,-0.04033518,-103.29061,-179.33658,0.4602139,-0.49157473,49.107178,785000
59
+ 94.037,0.20589133,-0.017903341,-13.498072,0.24212748,93.60689,16.8196,3.263402,-97.48563,-175.24086,0.3708986,-0.37513432,46.890755,790000
60
+ 96.762764,0.1840908,-0.00076614117,-12.54341,0.22137654,96.35806,10.791041,2.3885713,-100.380394,-187.28035,0.43563354,-0.78119695,46.512424,795000
61
+ 100.33066,0.18128683,0.009837057,-11.940399,0.20989674,99.929634,14.388959,-2.429053,-104.01763,-178.60919,0.87346315,-0.6187741,53.49596,800000
62
+ 102.07604,0.19400024,0.0164363,-11.557859,0.20163491,101.66397,10.866092,-3.6030772,-105.302444,-181.6873,0.5323407,-0.5128098,38.083977,805000
63
+ 96.19748,0.19979444,-0.008855054,-13.012401,0.22487389,95.78167,12.099505,-1.7353034,-100.7822,-190.74075,0.78096443,-0.74305815,41.19976,810000
64
+ 98.92273,0.21227217,0.0011052735,-12.437563,0.22017226,98.48918,16.061747,0.32370943,-102.585304,-170.30208,0.65727484,-0.732301,47.849823,815000
65
+ 98.318855,0.19008447,0.0018152316,-12.39736,0.2192522,97.9077,15.381424,-4.818655,-103.06144,-172.39253,4.897967,-4.1216245,75.48785,820000
66
+ 96.39677,0.18664584,-0.02661841,-14.012941,0.2465411,95.9902,11.373713,3.0548887,-99.82141,-192.3847,0.5061254,-0.49521273,38.719276,825000
67
+ 95.43077,0.22312069,-0.0034564293,-12.69672,0.22308505,94.98802,14.3322525,1.3723985,-98.23535,-169.55203,0.62691844,-0.6039887,53.411827,830000
68
+ 97.530365,0.2006694,0.023587404,-11.129559,0.19155681,97.11455,10.799409,-4.7336164,-101.04186,-193.41998,5.3865204,-5.49838,82.52021,835000
69
+ 99.762794,0.21362165,0.0015068346,-12.413559,0.21639234,99.33127,10.514197,0.5481265,-102.13665,-179.98036,0.730736,-0.42417258,41.89944,840000
70
+ 102.39086,0.18893941,-0.024652917,-13.938573,0.23886625,101.9877,11.918812,-7.6445074,-106.48533,-183.06197,1.3667907,-0.67511916,57.347908,845000
71
+ 93.47847,0.19202492,0.0314432,-10.69392,0.1861773,93.068825,15.260833,1.4615631,-97.08424,-197.96346,0.84850925,-0.8607774,49.826027,850000
72
+ 99.95417,0.17260161,0.0308767,-10.680044,0.1811937,99.5695,11.481384,-3.431851,-103.32737,-186.31487,0.8899065,-0.7311534,55.547226,855000
73
+ 92.08329,0.20038465,0.0086122565,-12.002272,0.2076768,91.66661,10.842435,5.8111544,-95.79257,-193.62558,0.7240982,-0.5072635,43.897003,860000
74
+ 96.09557,0.19808018,-0.030110706,-14.248758,0.24533989,95.68227,12.326125,-2.1874714,-99.71722,-195.99644,2.2378604,-2.3889785,70.7862,865000
75
+ 98.50836,0.17216727,-0.0049271053,-12.786895,0.21960096,98.12152,10.775673,-0.7766226,-102.25012,-185.01295,0.3585944,-0.5547222,40.352455,870000
76
+ 93.29035,0.17668462,-0.0060299253,-12.850176,0.22127625,92.89842,12.0880995,5.3435607,-97.580956,-192.457,0.6366362,-0.736269,44.250328,875000
77
+ 95.30548,0.20265165,0.02105032,-11.272928,0.1933862,94.88839,7.468141,0.7133583,-98.4749,-177.10962,0.3623149,-0.37001067,35.472973,880000
78
+ 94.873726,0.16044478,-0.01106581,-13.145679,0.22529383,94.49905,11.050774,-2.6184871,-99.10365,-189.6799,0.73250693,-1.5452986,69.03618,885000
79
+ 98.51533,0.20595711,-0.015820853,-13.4317255,0.22807291,98.09712,12.77639,1.0855849,-102.63445,-185.3464,0.57546073,-0.6558097,41.84166,890000
80
+ 94.84017,0.16955897,0.006953887,-12.089358,0.2047236,94.45894,12.031837,0.6388613,-99.11548,-174.90367,1.0648155,-0.5677331,55.433178,895000
81
+ 92.03733,0.20978716,0.01668249,-11.521991,0.19653752,91.61432,8.652842,-0.83793724,-96.13047,-177.71643,1.0046022,-1.1338224,50.437393,900000
82
+ 94.5209,0.20532152,-0.002858163,-12.6693735,0.21379454,94.104645,16.277624,0.66834164,-98.46619,-189.76414,0.7536841,-0.7091196,51.673027,905000
83
+ 98.53721,0.18032044,-0.00046023482,-12.527096,0.21277863,98.14457,14.940971,-0.24935955,-102.63738,-177.48494,1.3501858,-1.2678592,54.870964,910000
84
+ 93.616806,0.22180752,0.002724678,-12.339718,0.2097661,93.18251,13.707852,-2.062208,-96.933495,-171.51181,0.9051575,-0.9654511,54.16887,915000
85
+ 94.81344,0.1887914,-0.0025715407,-12.652018,0.21402243,94.4132,13.440305,5.9115543,-98.74627,-187.50964,2.9177287,-2.639011,54.18236,920000
86
+ 90.66438,0.20717482,0.013963499,-11.670534,0.19646555,90.24678,13.02455,4.756097,-94.6847,-199.78918,0.8614155,-0.87014055,48.999657,925000
87
+ 90.80637,0.20050684,0.014234671,-11.653895,0.19606249,90.39557,15.864596,-0.88662803,-94.42836,-177.22446,1.1330739,-1.0196549,62.584953,930000
88
+ 96.008316,0.20857956,-0.0015738413,-12.593717,0.21149409,95.58981,16.17364,1.5694735,-99.09359,-196.30994,2.2676992,-2.400387,78.81749,935000
89
+ 88.467705,0.24962774,-0.017898964,-13.569872,0.22702405,88.00896,12.044021,-2.9109201,-92.40949,-193.21893,0.6130933,-1.0790389,47.79709,940000
90
+ 95.24579,0.19155142,0.02259317,-11.13906,0.1849212,94.846725,10.789941,1.6077822,-99.47339,-188.5205,0.56352854,-0.44025236,38.11975,945000
91
+ 89.41094,0.22787817,-0.005854207,-12.853474,0.21287836,88.97604,10.407176,4.3054833,-93.07433,-181.25731,0.62454194,-0.6865873,42.69156,950000
92
+ 92.89728,0.20038888,0.010546105,-11.868765,0.19829258,92.48805,10.158963,3.8109756,-96.3856,-184.1995,0.60009205,-1.3980138,64.179245,955000
93
+ 89.50167,0.2005289,0.029215148,-10.743776,0.17872497,89.0932,9.6608925,6.038699,-93.75545,-181.23245,0.27111265,-0.593644,33.17884,960000
94
+ 91.922066,0.22138971,-0.020178163,-13.72952,0.2253209,91.49554,12.068652,-4.355765,-95.36116,-177.2659,1.0716534,-0.7113674,54.222054,965000
95
+ 90.7362,0.21463248,0.024024563,-11.054947,0.18379274,90.31375,12.566284,1.5850345,-94.65212,-170.45358,1.7687554,-1.5632093,52.237564,970000
96
+ 92.33838,0.18754368,0.016330132,-11.508223,0.18948886,91.945015,11.293811,0.8942128,-95.31115,-191.78177,0.718212,-0.5153837,48.416203,975000
97
+ 92.792404,0.19519423,-0.0020403473,-12.624706,0.20655565,92.39269,14.375905,6.9290423,-96.230675,-181.41475,1.3034657,-1.301806,58.084724,980000
98
+ 90.19091,0.19014041,0.008366122,-11.985236,0.19478826,89.797615,13.506091,-1.222187,-93.52101,-196.17212,1.2621632,-1.1718347,52.9068,985000
99
+ 91.16707,0.20492041,0.0013689526,-12.415189,0.20039572,90.76039,13.395502,0.25452286,-94.325905,-184.42511,0.45585656,-0.42546767,40.288948,990000
100
+ 86.30011,0.21332037,0.0150342,-11.585442,0.19045022,85.8813,12.000015,-6.2405267,-89.86362,-188.09366,0.68649715,-0.75325453,62.000465,995000
101
+ 84.99937,0.18300462,0.022419706,-11.090125,0.1763542,84.617584,9.439723,-0.10208471,-88.099915,-195.51335,0.4621565,-0.35102898,34.082207,1000000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/edit_alpha_loss,actor/edit_entropy,actor/edit_entropy_loss,actor/edit_q_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 143.28134,0.2074565,-0.0025529228,-12.694628,0.16651481,142.90991,9.316321,-50.9161,-146.63748,-195.41913,0.3111859,-0.28514525,29.722538,505000
3
+ 140.49663,0.22984435,-0.011546782,-13.37108,0.17724305,140.10109,9.41867,-44.74355,-143.6895,-192.5832,1.3567142,-1.2677691,33.708652,510000
4
+ 140.56345,0.17253858,0.0030506134,-12.277097,0.16802211,140.21985,10.488258,-50.64672,-143.7935,-194.3493,0.4831032,-0.3968043,30.94076,515000
5
+ 136.83255,0.18390474,-0.028798576,-14.45815,0.2126365,136.46481,8.91912,-42.979824,-139.99092,-199.65364,0.41007784,-0.75128967,56.776943,520000
6
+ 133.78099,0.17691657,-0.019748585,-13.821551,0.20654216,133.41728,13.207109,-12.251732,-137.38335,-195.73451,0.36287335,-0.42551216,35.464684,525000
7
+ 130.17819,0.1910195,0.015712151,-11.446091,0.17064343,129.80081,17.589113,-13.926538,-133.71684,-196.21234,1.7514133,-1.355492,72.66823,530000
8
+ 127.86701,0.2061052,0.009346896,-11.8914795,0.18265352,127.4689,12.421901,-9.035285,-130.68991,-195.61353,0.41609913,-0.4582787,36.195976,535000
9
+ 127.336075,0.17742792,-0.022320185,-13.92115,0.21864167,126.962326,15.339812,-4.881917,-131.74625,-199.48753,0.63216877,-1.261208,58.528908,540000
10
+ 126.76497,0.19925883,0.029424287,-10.663227,0.17082016,126.36546,13.180686,-51.135044,-130.21802,-199.8461,0.7183905,-0.85056454,53.262093,545000
11
+ 123.378075,0.16572994,-0.0010348824,-12.561926,0.20993023,123.00345,12.081664,-7.0752783,-126.93786,-191.4067,1.0592283,-1.1364542,53.38198,550000
12
+ 121.453,0.20059574,-0.011835846,-13.219204,0.21754672,121.0467,20.52559,-4.264087,-125.38012,-191.37811,1.5241061,-1.4840485,59.614353,555000
13
+ 119.2317,0.19860837,0.0044943765,-12.2294655,0.2031675,118.825424,12.461173,-18.213417,-123.555374,-199.41025,0.8033452,-0.6652883,51.894768,560000
14
+ 118.47855,0.19551593,-0.021564493,-13.813639,0.2267626,118.07784,14.925422,-4.1972847,-122.01565,-197.64742,0.8010683,-0.8042778,60.332188,565000
15
+ 116.18288,0.1851126,-0.004394296,-12.75555,0.21933708,115.78282,23.418785,-30.660824,-120.28631,-198.73735,6.050345,-5.850951,113.54823,570000
16
+ 119.427475,0.20549375,-0.026934236,-14.067468,0.24172524,119.007195,14.260225,-1.003351,-123.44425,-198.85677,0.38879472,-0.5952026,49.0007,575000
17
+ 118.596634,0.18349192,0.0040113092,-12.265689,0.20998353,118.19914,14.145413,-18.329174,-122.80481,-195.15927,0.8494228,-0.97713614,60.47061,580000
18
+ 116.27683,0.18927048,0.013320849,-11.71828,0.19968455,115.87456,12.478149,-6.2035403,-120.23226,-196.13051,0.68641263,-0.41161114,54.213913,585000
19
+ 115.211,0.18066815,-0.033843506,-14.415256,0.25472462,114.80945,13.864821,-2.6901007,-119.37892,-186.07059,0.5529682,-0.54145455,53.305977,590000
20
+ 117.35937,0.17244548,0.009747631,-11.940727,0.20811635,116.969055,24.2144,-17.568432,-121.04639,-187.8859,1.6100451,-1.6406834,58.067493,595000
21
+ 111.50509,0.20499197,-0.0050944476,-12.784477,0.22894573,111.07625,16.517408,0.16977923,-114.95528,-185.1184,0.69595104,-0.7105099,43.706535,600000
22
+ 117.622025,0.18935427,-0.008532342,-12.9875555,0.22728543,117.21391,15.551246,-10.030614,-121.70974,-188.67764,0.8320119,-0.8346562,46.986565,605000
23
+ 114.41078,0.19858794,0.008523939,-12.006012,0.20716798,113.996506,18.05403,-5.8314953,-117.56339,-184.16844,0.8445085,-0.62474054,46.36718,610000
24
+ 110.3147,0.16883245,-0.0029703232,-12.666981,0.22532552,109.92351,18.11525,1.0797985,-114.36116,-180.88683,0.6851795,-0.85139275,54.24986,615000
25
+ 110.77624,0.1897478,-0.018583372,-13.572601,0.23515233,110.36992,13.728828,-6.96214,-114.80763,-187.46362,1.846469,-2.7234883,53.82022,620000
26
+ 114.840034,0.18055174,-0.014202491,-13.297607,0.2367821,114.436905,11.819624,-5.1231227,-118.93782,-182.7845,0.5773835,-0.46185708,39.26306,625000
27
+ 115.2894,0.16872224,-0.0053803576,-12.802316,0.22784472,114.89821,13.775658,-2.300442,-119.35519,-192.58142,1.0553025,-0.9396106,54.76763,630000
28
+ 112.71203,0.17923519,0.01085341,-11.873869,0.20582268,112.31611,10.871242,1.2118145,-116.47267,-188.06485,0.53224915,-0.75603026,50.151775,635000
29
+ 107.27183,0.19011155,-0.004511553,-12.751862,0.2284219,106.8578,16.130346,-9.075312,-111.80066,-187.44319,1.3294531,-1.4003769,72.56583,640000
30
+ 109.93601,0.1703023,0.006871534,-12.11958,0.21891636,109.53992,13.555606,-5.065763,-113.58923,-188.16502,0.74043876,-0.9976974,53.07661,645000
31
+ 111.88157,0.20644012,-0.01441718,-13.319183,0.23441033,111.45513,14.317459,-6.855903,-115.41392,-193.60707,0.96495855,-1.0128125,45.113632,650000
32
+ 109.958916,0.23624866,0.031211946,-10.776234,0.19512343,109.49633,12.549822,-6.955402,-113.17443,-183.12227,1.4634131,-1.5424864,66.22249,655000
33
+ 112.757095,0.20465562,0.030309854,-10.80677,0.19344783,112.328674,15.875626,-12.435663,-115.986305,-189.25113,0.49548393,-0.4951202,45.733917,660000
34
+ 107.38421,0.19932896,-0.013992351,-13.278299,0.23871872,106.96016,16.92983,-1.3386868,-111.87239,-188.17871,1.3252736,-1.6357639,78.12554,665000
35
+ 108.60941,0.19607729,-0.010303839,-13.07732,0.23340014,108.19025,14.1644125,-0.6105876,-112.352905,-185.45375,0.82048386,-0.6544065,43.22842,670000
36
+ 110.37937,0.21693479,0.045152523,-9.992525,0.1799371,109.93735,11.197814,-5.640813,-113.970276,-193.27817,0.7445872,-0.6516749,47.067165,675000
37
+ 108.6799,0.18846025,0.030077737,-10.832828,0.19543687,108.26593,10.8405,3.1691837,-112.00917,-183.65334,0.54612106,-0.4839947,38.445618,680000
38
+ 105.79221,0.18828481,0.0010955161,-12.439453,0.22507557,105.377754,12.8331785,0.55582917,-109.95359,-184.63109,0.38948628,-0.3895249,39.50709,685000
39
+ 103.282776,0.1773283,-0.022576705,-13.753536,0.24770686,102.88032,10.675292,-0.73179466,-107.31248,-197.55547,1.0039047,-1.1587648,48.53447,690000
40
+ 107.62855,0.22850604,-0.003291909,-12.679919,0.23199931,107.171326,12.150802,-2.3041818,-110.962685,-193.48119,0.9044064,-0.99638957,49.365906,695000
41
+ 106.53814,0.2210866,-0.0038857001,-12.714422,0.23040725,106.09053,12.166196,-1.9838437,-110.293846,-192.0081,0.61162156,-0.6175407,43.214836,700000
42
+ 106.945816,0.19681974,0.005096055,-12.212406,0.21639925,106.5275,10.460186,-2.6234,-110.6079,-177.44191,1.11167,-1.339971,46.380444,705000
43
+ 102.4805,0.18438736,-0.011703598,-13.1581335,0.2339913,102.07382,15.750922,-2.545451,-106.52651,-176.43634,0.76915205,-0.6033859,63.131744,710000
44
+ 106.94846,0.19644488,0.0062645674,-12.153122,0.21948363,106.526276,7.358129,-5.9444184,-110.567375,-199.22948,0.60625905,-0.50507,42.809444,715000
45
+ 106.21344,0.19751033,0.02121782,-11.314495,0.20250352,105.792206,12.381358,-4.78306,-109.87494,-182.46965,0.68496305,-0.72429156,51.477707,720000
46
+ 99.23157,0.18730806,0.030273255,-10.82225,0.1952763,98.81871,15.450419,-0.4019777,-103.020096,-179.09052,0.85119265,-0.8195476,56.0327,725000
47
+ 104.96097,0.21989709,0.043049138,-10.132208,0.18421501,104.51381,12.630412,-5.527227,-108.64056,-187.4598,0.49613625,-0.56362015,43.206123,730000
48
+ 101.26231,0.20941108,0.06762458,-8.758447,0.15829957,100.826965,8.764976,-1.9525692,-104.420364,-181.78157,1.0781181,-0.6549449,52.775024,735000
49
+ 101.67419,0.16680336,0.020026444,-11.378108,0.20310602,101.28425,14.041684,1.9539287,-106.01375,-187.79153,0.62365365,-0.48937526,48.33013,740000
50
+ 104.70706,0.17516641,-0.01775539,-13.491887,0.24151309,104.308136,15.620135,-1.9256938,-108.84143,-191.3666,0.90966,-0.85861003,64.849785,745000
51
+ 95.136375,0.18335038,0.008861065,-12.002774,0.21390156,94.73026,12.838347,-5.499854,-99.384995,-184.14594,1.0916309,-1.0820476,54.3518,750000
52
+ 105.12762,0.20378208,0.04061434,-10.191557,0.17930846,104.70392,9.798882,-3.192951,-108.87144,-189.6246,0.64739823,-0.6190205,38.078976,755000
53
+ 101.56124,0.21794939,0.006463703,-12.129636,0.21168989,101.12514,14.573952,1.4679776,-105.42034,-184.03635,0.3801586,-0.42723027,39.692043,760000
54
+ 104.38467,0.20436284,0.0028443874,-12.338682,0.21755804,103.9599,11.768947,-1.0563667,-107.46883,-193.92847,1.1621745,-0.9333603,40.258297,765000
55
+ 100.92495,0.20546843,0.0069654677,-12.097976,0.20960939,100.50291,14.008814,-5.148627,-104.78528,-183.5098,0.48842108,-1.1954346,51.550903,770000
56
+ 99.50052,0.21021092,0.007124086,-12.100387,0.21571898,99.06746,15.314357,-3.7557726,-103.31524,-196.4251,0.7227153,-0.73592716,57.675125,775000
57
+ 103.02482,0.2117524,-0.011561627,-13.156497,0.23170024,102.592926,13.934567,-2.280092,-107.320694,-183.68738,0.54075694,-0.93361485,47.214752,780000
58
+ 99.81062,0.20865318,0.0019991691,-12.386383,0.21794702,99.38202,9.919845,-0.04033518,-103.29061,-179.33658,0.4602139,-0.49157473,49.107178,785000
59
+ 94.037,0.20589133,-0.017903341,-13.498072,0.24212748,93.60689,16.8196,3.263402,-97.48563,-175.24086,0.3708986,-0.37513432,46.890755,790000
60
+ 96.762764,0.1840908,-0.00076614117,-12.54341,0.22137654,96.35806,10.791041,2.3885713,-100.380394,-187.28035,0.43563354,-0.78119695,46.512424,795000
61
+ 100.33066,0.18128683,0.009837057,-11.940399,0.20989674,99.929634,14.388959,-2.429053,-104.01763,-178.60919,0.87346315,-0.6187741,53.49596,800000
62
+ 102.07604,0.19400024,0.0164363,-11.557859,0.20163491,101.66397,10.866092,-3.6030772,-105.302444,-181.6873,0.5323407,-0.5128098,38.083977,805000
63
+ 96.19748,0.19979444,-0.008855054,-13.012401,0.22487389,95.78167,12.099505,-1.7353034,-100.7822,-190.74075,0.78096443,-0.74305815,41.19976,810000
64
+ 98.92273,0.21227217,0.0011052735,-12.437563,0.22017226,98.48918,16.061747,0.32370943,-102.585304,-170.30208,0.65727484,-0.732301,47.849823,815000
65
+ 98.318855,0.19008447,0.0018152316,-12.39736,0.2192522,97.9077,15.381424,-4.818655,-103.06144,-172.39253,4.897967,-4.1216245,75.48785,820000
66
+ 96.39677,0.18664584,-0.02661841,-14.012941,0.2465411,95.9902,11.373713,3.0548887,-99.82141,-192.3847,0.5061254,-0.49521273,38.719276,825000
67
+ 95.43077,0.22312069,-0.0034564293,-12.69672,0.22308505,94.98802,14.3322525,1.3723985,-98.23535,-169.55203,0.62691844,-0.6039887,53.411827,830000
68
+ 97.530365,0.2006694,0.023587404,-11.129559,0.19155681,97.11455,10.799409,-4.7336164,-101.04186,-193.41998,5.3865204,-5.49838,82.52021,835000
69
+ 99.762794,0.21362165,0.0015068346,-12.413559,0.21639234,99.33127,10.514197,0.5481265,-102.13665,-179.98036,0.730736,-0.42417258,41.89944,840000
70
+ 102.39086,0.18893941,-0.024652917,-13.938573,0.23886625,101.9877,11.918812,-7.6445074,-106.48533,-183.06197,1.3667907,-0.67511916,57.347908,845000
71
+ 93.47847,0.19202492,0.0314432,-10.69392,0.1861773,93.068825,15.260833,1.4615631,-97.08424,-197.96346,0.84850925,-0.8607774,49.826027,850000
72
+ 99.95417,0.17260161,0.0308767,-10.680044,0.1811937,99.5695,11.481384,-3.431851,-103.32737,-186.31487,0.8899065,-0.7311534,55.547226,855000
73
+ 92.08329,0.20038465,0.0086122565,-12.002272,0.2076768,91.66661,10.842435,5.8111544,-95.79257,-193.62558,0.7240982,-0.5072635,43.897003,860000
74
+ 96.09557,0.19808018,-0.030110706,-14.248758,0.24533989,95.68227,12.326125,-2.1874714,-99.71722,-195.99644,2.2378604,-2.3889785,70.7862,865000
75
+ 98.50836,0.17216727,-0.0049271053,-12.786895,0.21960096,98.12152,10.775673,-0.7766226,-102.25012,-185.01295,0.3585944,-0.5547222,40.352455,870000
76
+ 93.29035,0.17668462,-0.0060299253,-12.850176,0.22127625,92.89842,12.0880995,5.3435607,-97.580956,-192.457,0.6366362,-0.736269,44.250328,875000
77
+ 95.30548,0.20265165,0.02105032,-11.272928,0.1933862,94.88839,7.468141,0.7133583,-98.4749,-177.10962,0.3623149,-0.37001067,35.472973,880000
78
+ 94.873726,0.16044478,-0.01106581,-13.145679,0.22529383,94.49905,11.050774,-2.6184871,-99.10365,-189.6799,0.73250693,-1.5452986,69.03618,885000
79
+ 98.51533,0.20595711,-0.015820853,-13.4317255,0.22807291,98.09712,12.77639,1.0855849,-102.63445,-185.3464,0.57546073,-0.6558097,41.84166,890000
80
+ 94.84017,0.16955897,0.006953887,-12.089358,0.2047236,94.45894,12.031837,0.6388613,-99.11548,-174.90367,1.0648155,-0.5677331,55.433178,895000
81
+ 92.03733,0.20978716,0.01668249,-11.521991,0.19653752,91.61432,8.652842,-0.83793724,-96.13047,-177.71643,1.0046022,-1.1338224,50.437393,900000
82
+ 94.5209,0.20532152,-0.002858163,-12.6693735,0.21379454,94.104645,16.277624,0.66834164,-98.46619,-189.76414,0.7536841,-0.7091196,51.673027,905000
83
+ 98.53721,0.18032044,-0.00046023482,-12.527096,0.21277863,98.14457,14.940971,-0.24935955,-102.63738,-177.48494,1.3501858,-1.2678592,54.870964,910000
84
+ 93.616806,0.22180752,0.002724678,-12.339718,0.2097661,93.18251,13.707852,-2.062208,-96.933495,-171.51181,0.9051575,-0.9654511,54.16887,915000
85
+ 94.81344,0.1887914,-0.0025715407,-12.652018,0.21402243,94.4132,13.440305,5.9115543,-98.74627,-187.50964,2.9177287,-2.639011,54.18236,920000
86
+ 90.66438,0.20717482,0.013963499,-11.670534,0.19646555,90.24678,13.02455,4.756097,-94.6847,-199.78918,0.8614155,-0.87014055,48.999657,925000
87
+ 90.80637,0.20050684,0.014234671,-11.653895,0.19606249,90.39557,15.864596,-0.88662803,-94.42836,-177.22446,1.1330739,-1.0196549,62.584953,930000
88
+ 96.008316,0.20857956,-0.0015738413,-12.593717,0.21149409,95.58981,16.17364,1.5694735,-99.09359,-196.30994,2.2676992,-2.400387,78.81749,935000
89
+ 88.467705,0.24962774,-0.017898964,-13.569872,0.22702405,88.00896,12.044021,-2.9109201,-92.40949,-193.21893,0.6130933,-1.0790389,47.79709,940000
90
+ 95.24579,0.19155142,0.02259317,-11.13906,0.1849212,94.846725,10.789941,1.6077822,-99.47339,-188.5205,0.56352854,-0.44025236,38.11975,945000
91
+ 89.41094,0.22787817,-0.005854207,-12.853474,0.21287836,88.97604,10.407176,4.3054833,-93.07433,-181.25731,0.62454194,-0.6865873,42.69156,950000
92
+ 92.89728,0.20038888,0.010546105,-11.868765,0.19829258,92.48805,10.158963,3.8109756,-96.3856,-184.1995,0.60009205,-1.3980138,64.179245,955000
93
+ 89.50167,0.2005289,0.029215148,-10.743776,0.17872497,89.0932,9.6608925,6.038699,-93.75545,-181.23245,0.27111265,-0.593644,33.17884,960000
94
+ 91.922066,0.22138971,-0.020178163,-13.72952,0.2253209,91.49554,12.068652,-4.355765,-95.36116,-177.2659,1.0716534,-0.7113674,54.222054,965000
95
+ 90.7362,0.21463248,0.024024563,-11.054947,0.18379274,90.31375,12.566284,1.5850345,-94.65212,-170.45358,1.7687554,-1.5632093,52.237564,970000
96
+ 92.33838,0.18754368,0.016330132,-11.508223,0.18948886,91.945015,11.293811,0.8942128,-95.31115,-191.78177,0.718212,-0.5153837,48.416203,975000
97
+ 92.792404,0.19519423,-0.0020403473,-12.624706,0.20655565,92.39269,14.375905,6.9290423,-96.230675,-181.41475,1.3034657,-1.301806,58.084724,980000
98
+ 90.19091,0.19014041,0.008366122,-11.985236,0.19478826,89.797615,13.506091,-1.222187,-93.52101,-196.17212,1.2621632,-1.1718347,52.9068,985000
99
+ 91.16707,0.20492041,0.0013689526,-12.415189,0.20039572,90.76039,13.395502,0.25452286,-94.325905,-184.42511,0.45585656,-0.42546767,40.288948,990000
100
+ 86.30011,0.21332037,0.0150342,-11.585442,0.19045022,85.8813,12.000015,-6.2405267,-89.86362,-188.09366,0.68649715,-0.75325453,62.000465,995000
101
+ 84.99937,0.18300462,0.022419706,-11.090125,0.1763542,84.617584,9.439723,-0.10208471,-88.099915,-195.51335,0.4621565,-0.35102898,34.082207,1000000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_1000000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c322d33179b9c1d5f6f93011ed6bbe397981fed80855aaa75908f58f6d96175d
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45d14b126a58f5da7c6c1256fc88ed27d24062da609629435dca5dc8cc96e1a9
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c413aef867046a59e9a501097f85a4e6af3e07d6d8a31b131e405b5bc4058e4
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:191e8b3d96b71fe888fd07cbb1f7083570702c6677dda80677ae1b2493c43cb6
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e310ccfc0956717c5afc46ca78a0e09253fbda6f487c6f7ff0ad258ca29af8ce
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a373209e3098b3e1904597c999551917bfbe97c097dd4b5ad55efa3847c486b1
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f1cf0680d1bdbbe39fde1e8a87f105fabf97b8be8571a090c1cfe4e58fca492
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75628e3a2ee62e2e59dd30d0dc79cc50061c4bcfe2914429eb0e68e02380a64b
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e9236e99a180ebd823f04a23c4e579922154139f19fbe45a45ed3f17afee44c
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/params_950000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e21a8b6690abb251a13e2a081e6f06c1c608c17999d9d45032267747316eb12
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_121017/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/8nmhqutu