Tiredsheep commited on
Commit
fdd9346
·
verified ·
1 Parent(s): 50e278a

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_1000000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_1050000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_1100000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_650000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_700000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_750000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_800000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_850000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_900000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_950000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.012530847482369111,0.00211016480014507,-0.012196095170996122,0.005523157956878134,34.96458670685257,8.43099999999951,0.96,4225.62,-0.04,-236.14,166.62,0.5552746534347535,650000
3
+ 0.0,0.0,-0.020382143506866526,-0.0020835428076890904,-0.020751281482070165,-0.0012612579265024026,35.10373245457576,6.615999999999541,1.0,11943.62,0.0,-183.8,130.32,0.44670964241027833,700000
4
+ 0.0,0.0,-0.038631110090896946,-0.004932662685366565,-0.038448170073837204,0.019332280944099587,34.80421445018674,6.476999999999504,0.98,18652.82,-0.02,-175.42,127.54,0.42549746990203857,750000
5
+ 0.0,0.0,-0.030021940631428184,0.0015243961227822912,-0.02984308132415255,0.002655304036861395,35.18002268956399,5.828999999999621,1.0,24957.84,0.0,-159.7,114.58,0.389252986907959,800000
6
+ 0.0,0.0,-0.04120596300481973,0.0007980002912566975,-0.04059567754420482,-0.0024828323801204303,35.404174730955404,5.5699999999996415,1.0,30737.16,0.0,-152.72,109.4,0.41987047672271727,850000
7
+ 0.0,0.0,-0.03426596992406049,0.003431203831582834,-0.03389569826766943,-0.0007551110939447213,35.49408752685764,5.1939999999996544,1.0,36191.4,0.0,-141.7,101.88,0.389050817489624,900000
8
+ 0.0,0.0,-0.05415425347763557,0.012873892068553746,-0.053622257554132295,0.005932367856799072,35.524903174496174,4.872999999999686,1.0,41311.34,0.0,-132.42,95.46,0.34719096660614013,950000
9
+ 0.0,0.0,-0.043657865585037633,0.017256349500712097,-0.04238563271958754,0.019515170980352454,35.46930721581628,4.664999999999723,1.0,46175.1,0.0,-127.46,91.3,0.30618971824645996,1000000
10
+ 0.0,0.0,-0.06504249884662074,0.0256964570108936,-0.06372126731936979,0.01391925074367882,35.45251021670721,4.480999999999728,1.0,50775.22,0.0,-121.56,87.62,0.2968000602722168,1050000
11
+ 0.0,0.0,-0.052970506575293175,0.049512676665101896,-0.05037912831481214,0.04633109903511026,35.55552303136791,4.364999999999743,1.0,55309.26,0.0,-119.12,85.3,0.28368688583374024,1100000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.012530847482369111,0.00211016480014507,-0.012196095170996122,0.005523157956878134,34.96458670685257,8.43099999999951,0.96,4225.62,-0.04,-236.14,166.62,0.5552746534347535,650000
3
+ 0.0,0.0,-0.020382143506866526,-0.0020835428076890904,-0.020751281482070165,-0.0012612579265024026,35.10373245457576,6.615999999999541,1.0,11943.62,0.0,-183.8,130.32,0.44670964241027833,700000
4
+ 0.0,0.0,-0.038631110090896946,-0.004932662685366565,-0.038448170073837204,0.019332280944099587,34.80421445018674,6.476999999999504,0.98,18652.82,-0.02,-175.42,127.54,0.42549746990203857,750000
5
+ 0.0,0.0,-0.030021940631428184,0.0015243961227822912,-0.02984308132415255,0.002655304036861395,35.18002268956399,5.828999999999621,1.0,24957.84,0.0,-159.7,114.58,0.389252986907959,800000
6
+ 0.0,0.0,-0.04120596300481973,0.0007980002912566975,-0.04059567754420482,-0.0024828323801204303,35.404174730955404,5.5699999999996415,1.0,30737.16,0.0,-152.72,109.4,0.41987047672271727,850000
7
+ 0.0,0.0,-0.03426596992406049,0.003431203831582834,-0.03389569826766943,-0.0007551110939447213,35.49408752685764,5.1939999999996544,1.0,36191.4,0.0,-141.7,101.88,0.389050817489624,900000
8
+ 0.0,0.0,-0.05415425347763557,0.012873892068553746,-0.053622257554132295,0.005932367856799072,35.524903174496174,4.872999999999686,1.0,41311.34,0.0,-132.42,95.46,0.34719096660614013,950000
9
+ 0.0,0.0,-0.043657865585037633,0.017256349500712097,-0.04238563271958754,0.019515170980352454,35.46930721581628,4.664999999999723,1.0,46175.1,0.0,-127.46,91.3,0.30618971824645996,1000000
10
+ 0.0,0.0,-0.06504249884662074,0.0256964570108936,-0.06372126731936979,0.01391925074367882,35.45251021670721,4.480999999999728,1.0,50775.22,0.0,-121.56,87.62,0.2968000602722168,1050000
11
+ 0.0,0.0,-0.052970506575293175,0.049512676665101896,-0.05037912831481214,0.04633109903511026,35.55552303136791,4.364999999999743,1.0,55309.26,0.0,-119.12,85.3,0.28368688583374024,1100000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/adj_loss,actor/adj_max,actor/adj_mean,actor/adj_std,actor/fast_loss,actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 199.9452,40.387928,0.784004,1.9907235,199.9452,0.18456106,9.789141,-48.24457,-155.0192,-202.92654,18.753033,-20.040485,512.9637,605000
3
+ 116.61518,76.023476,0.7756999,2.1610308,116.61518,0.19118792,10.710723,-31.602434,-152.65742,-196.55383,30.901573,-34.457214,427.11722,610000
4
+ 123.781876,42.380543,0.76387495,1.8013104,123.781876,0.16581784,10.629007,-41.65633,-150.19908,-204.0876,17.527462,-21.115095,588.7106,615000
5
+ 126.296555,47.299377,0.8715922,2.1562126,126.296555,0.17368104,6.710561,-24.64588,-148.40184,-204.58134,24.954351,-24.559948,481.87296,620000
6
+ 129.43523,33.162483,0.752738,1.5978246,129.43523,0.16912347,9.427962,-25.941093,-145.83899,-204.0547,8.526857,-8.940613,369.40637,625000
7
+ 111.862564,41.78308,0.83676744,1.9711531,111.862564,0.15047869,13.8391905,-21.66732,-141.5124,-203.0897,26.301693,-22.825474,534.88043,630000
8
+ 104.13173,40.529427,0.8204109,1.7225348,104.13173,0.17023334,14.389226,-39.606255,-141.25247,-202.2208,14.787575,-13.9938755,426.6805,635000
9
+ 131.6036,52.286327,0.847556,1.9634862,131.6036,0.17375723,13.920952,-2.7657866,-141.09807,-204.06955,19.698586,-16.091839,477.73407,640000
10
+ 91.90368,50.28231,0.8099301,1.7287381,91.90368,0.17538387,11.356357,-40.17901,-140.19829,-204.84181,10.244707,-10.184441,417.59134,645000
11
+ 209.56439,57.43921,0.83225065,2.236933,209.56439,0.21041459,10.708069,-26.784262,-140.56198,-203.79431,44.524418,-37.72982,902.8129,650000
12
+ 168.63562,30.233467,0.8479335,1.9812382,168.63562,0.2137897,14.312476,-3.9299257,-136.78337,-204.65732,23.018185,-17.73902,473.94485,655000
13
+ 119.6393,43.89304,0.814312,1.8169782,119.6393,0.21176249,16.045227,-3.5037966,-134.97952,-204.49083,15.293551,-15.447435,510.64334,660000
14
+ 97.36774,47.736557,0.8690089,1.9909066,97.36774,0.1880507,26.232605,-22.47203,-136.72437,-203.87105,25.014175,-25.230215,567.2256,665000
15
+ 300.46686,47.25294,0.7873778,1.7117751,300.46686,0.18350059,13.702174,-26.004904,-131.40787,-203.97539,16.951471,-14.361353,568.48566,670000
16
+ 1997.1726,50.71185,0.863642,2.2799623,1997.1726,0.1950092,8.840729,-37.72877,-136.6257,-204.78084,57.850414,-58.382507,1080.0751,675000
17
+ 117.445755,62.28786,0.8712573,2.1182458,117.445755,0.16657123,18.221767,-9.812429,-134.77232,-204.84421,21.814888,-21.745071,496.65433,680000
18
+ 304.38632,65.79671,0.9701635,2.7779725,304.38632,0.1761184,12.634371,-24.50457,-132.9669,-204.63765,62.749634,-70.703545,793.28,685000
19
+ 1633.2151,39.2109,0.84747195,1.8220631,1633.2151,0.18004072,14.869568,-7.9100046,-131.68681,-202.72878,35.712627,-39.46608,1077.104,690000
20
+ 74.48916,45.940987,0.8379964,2.196661,74.48916,0.19597974,12.5992985,-12.750108,-129.84406,-203.72578,42.086716,-31.80778,585.71344,695000
21
+ 236.81572,97.12334,0.9493601,3.0759294,236.81572,0.20628096,12.649602,-3.852098,-125.93261,-204.17636,25.189638,-24.137638,657.55493,700000
22
+ 110.40292,60.14348,0.86570007,1.895994,110.40292,0.19373718,14.011779,-7.248346,-130.97884,-204.80545,19.129957,-20.074875,469.14957,705000
23
+ 72.49425,30.535435,0.7542267,1.5890441,72.49425,0.18179429,9.890281,-0.44828638,-127.03965,-204.66855,12.742153,-11.920443,366.6977,710000
24
+ 156.06422,61.575825,0.7841343,1.7070885,156.06422,0.17184922,17.927404,0.12177783,-125.4343,-200.45535,12.616613,-12.226535,466.5873,715000
25
+ 858.8645,44.070778,0.8632446,2.1876543,858.8645,0.18218645,11.245328,-7.802379,-127.460815,-204.4561,21.323828,-22.761868,658.31494,720000
26
+ 99.98372,34.436348,0.8387096,1.900291,99.98372,0.15597677,9.790974,-6.845425,-131.5822,-205.12852,14.775505,-17.549631,453.32623,725000
27
+ 83.85759,31.245663,0.71451443,1.3745557,83.85759,0.18178865,11.536487,-2.7173047,-126.4156,-201.80025,28.175737,-21.50115,525.6182,730000
28
+ 84.70981,35.586876,0.83791447,1.9721576,84.70981,0.17996073,11.937095,4.8811407,-125.93778,-204.02756,13.099748,-12.63358,448.15125,735000
29
+ 99.702126,46.34567,0.8103316,1.5999976,99.702126,0.1428495,12.179325,-5.7280674,-122.15767,-192.97789,10.100585,-17.692085,455.85052,740000
30
+ 115.676315,51.08859,0.73316145,1.4774945,115.676315,0.15099597,13.225687,-11.864153,-125.622856,-204.49962,17.288893,-15.632038,512.95996,745000
31
+ 296.72595,40.276123,0.8414267,1.8307264,296.72595,0.14819518,9.244667,-12.657666,-126.04624,-203.6618,99.23802,-117.90273,1549.6028,750000
32
+ 75.31554,36.25149,0.7524312,1.5554774,75.31554,0.17218861,7.299953,-7.9652524,-124.77616,-203.99142,18.319195,-17.847937,428.06653,755000
33
+ 407.96024,48.242172,0.7840212,1.9501708,407.96024,0.1994437,15.865409,-4.1825147,-125.52351,-204.85384,20.60463,-22.563837,546.30597,760000
34
+ 297.12958,47.15028,0.8961228,2.200447,297.12958,0.19139022,13.47677,-2.0243084,-125.15696,-205.78304,42.369514,-29.418852,673.3399,765000
35
+ 134.61575,34.066273,0.71541274,1.4078795,134.61575,0.16459785,11.217406,4.6263833,-121.335915,-202.97942,25.3999,-21.273922,542.90686,770000
36
+ 86.78943,30.026144,0.7256012,1.4463723,86.78943,0.1731465,7.500441,-7.0219727,-123.620094,-205.91135,35.474716,-30.04348,519.3639,775000
37
+ 88.62467,69.54186,0.82238936,2.269766,88.62467,0.1766764,7.996998,1.6654927,-122.06277,-205.23578,23.381142,-27.346006,501.26358,780000
38
+ 258.0734,29.775005,0.82372147,1.5895425,258.0734,0.2005885,9.005185,0.66965634,-119.82251,-200.8203,37.73816,-35.82729,615.8845,785000
39
+ 79.11119,40.703876,0.84424543,1.818032,79.11119,0.16544735,8.460082,-2.2207017,-118.06835,-199.8282,32.461025,-31.901474,549.75415,790000
40
+ 121.9729,65.02798,0.8087415,2.113574,121.9729,0.16744576,8.028681,-3.2627184,-119.072975,-201.68086,16.555471,-21.597622,540.55005,795000
41
+ 64.40347,26.755758,0.76965475,1.4884417,64.40347,0.18077958,6.5515084,-0.16252185,-116.631676,-200.90225,20.470827,-21.329819,405.01788,800000
42
+ 76.90129,39.606064,0.79431194,1.6711079,76.90129,0.18487331,10.952805,-7.3467655,-120.43005,-200.0963,15.991554,-16.00049,447.18756,805000
43
+ 112.36836,41.272713,0.84486526,1.77354,112.36836,0.17275488,7.27037,-1.7278196,-117.81675,-200.34712,12.098246,-16.009174,451.49622,810000
44
+ 106.1145,45.15208,0.8163102,2.0301812,106.1145,0.19018981,8.623454,-8.787646,-119.49883,-204.05316,28.805677,-28.304516,467.5287,815000
45
+ 2398.619,80.21301,0.90760803,2.6960726,2398.619,0.17378718,9.32073,-8.874034,-119.12284,-203.55849,200.98038,-223.27432,1972.8844,820000
46
+ 62.67148,44.96986,0.795956,1.7212942,62.67148,0.1761771,16.717821,1.5251267,-113.08595,-198.53874,30.790401,-35.109234,513.5674,825000
47
+ 105.3577,45.45462,0.7925446,1.7962278,105.3577,0.18302529,6.366277,0.6178402,-119.69485,-199.3134,73.16652,-67.8741,730.08875,830000
48
+ 88.46961,53.23252,0.81713635,2.0402372,88.46961,0.17440906,6.387101,1.3297371,-114.77099,-200.9658,11.157689,-11.150724,405.27087,835000
49
+ 90.19444,34.6702,0.8193252,1.6806889,90.19444,0.18953502,12.497539,1.9220384,-116.73303,-203.97699,25.213224,-28.640495,477.07385,840000
50
+ 77.54814,28.131372,0.8158769,1.570888,77.54814,0.15820101,10.664752,-3.1312263,-117.37615,-201.99115,19.274866,-16.214056,465.75928,845000
51
+ 130.55583,74.17273,0.9245645,2.5407798,130.55583,0.15266714,7.0372806,-0.6423221,-109.07824,-204.27013,19.014631,-19.575254,600.4907,850000
52
+ 166.2614,41.734287,0.75466245,1.5426668,166.2614,0.1583428,8.894167,-2.1361284,-116.467285,-203.4683,35.967358,-39.374733,561.6554,855000
53
+ 66.68222,48.689423,0.8618977,2.0638297,66.68222,0.16559076,15.348536,3.7843833,-115.192116,-200.4728,9.027011,-9.840338,482.99847,860000
54
+ 174.76144,175.44623,0.9156026,3.477205,174.76144,0.16508558,9.351112,-5.5988984,-118.16953,-201.73517,34.035553,-38.656048,767.9825,865000
55
+ 63.467735,38.426514,0.76798284,1.6370564,63.467735,0.14187573,11.918647,1.5144751,-114.601295,-200.94809,35.83301,-39.680664,507.22577,870000
56
+ 284.4484,127.49327,0.885101,2.8271816,284.4484,0.16142745,10.902999,-4.0976644,-114.53332,-202.05414,73.8676,-98.94892,1041.4829,875000
57
+ 141.00276,54.18634,0.820929,1.9147552,141.00276,0.17173484,11.624194,-2.4935193,-116.96824,-202.66867,37.200706,-36.220406,694.43884,880000
58
+ 92.75488,58.041317,0.83708024,2.0786572,92.75488,0.12274319,8.187236,-2.2109857,-109.037575,-199.68143,18.314575,-18.216719,499.87036,885000
59
+ 115.22918,38.509007,0.80864227,1.8648466,115.22918,0.15855105,13.574714,-4.231057,-107.70778,-203.82166,41.324097,-48.76467,697.32214,890000
60
+ 265.05573,69.21505,0.8279326,2.1597712,265.05573,0.15720709,5.4897337,1.4719595,-109.89431,-200.55508,20.894363,-19.97661,622.89355,895000
61
+ 166.33757,170.01439,0.9331838,3.2310634,166.33757,0.1831056,9.544947,-4.72836,-112.59954,-197.87367,107.82995,-106.79586,1437.8136,900000
62
+ 126.573074,69.69075,0.7746323,1.9566298,126.573074,0.17245159,8.363074,-3.6770697,-114.56907,-197.50694,28.831131,-19.827318,565.7504,905000
63
+ 1280.8712,74.60937,0.9264285,2.3851745,1280.8712,0.14989658,10.843258,-10.177735,-111.87858,-201.73686,42.93881,-43.420914,1128.0752,910000
64
+ 62.542957,34.076195,0.79469055,1.6123196,62.542957,0.1940282,7.5075235,0.45209748,-111.62914,-192.04414,18.724487,-18.606592,447.19473,915000
65
+ 146.88736,67.42063,0.9241974,2.746955,146.88736,0.16450295,8.26858,-4.5153604,-112.13989,-199.9198,19.422316,-19.031672,534.25507,920000
66
+ 355.48178,41.502285,0.93326205,2.2749908,355.48178,0.1553685,10.377059,-6.840589,-112.314064,-202.40341,33.55652,-38.263256,695.0165,925000
67
+ 85.944786,57.16048,0.8441956,1.8133733,85.944786,0.16007003,13.826093,-1.7819649,-107.97915,-199.35509,15.694579,-15.3992,453.78253,930000
68
+ 216.51486,51.092186,0.87328947,2.0597308,216.51486,0.1641078,9.76714,-1.6427402,-107.532486,-200.56189,17.03799,-18.986279,614.08826,935000
69
+ 117.030914,58.393505,0.8291531,1.8996494,117.030914,0.20449492,13.284592,-3.1901727,-112.06089,-191.27219,17.99918,-20.01054,532.7954,940000
70
+ 297.34613,114.967964,1.0161694,2.915463,297.34613,0.16584441,16.819418,-1.2586844,-115.75478,-201.42812,32.33982,-33.728127,776.9388,945000
71
+ 129.27637,83.92449,0.80734557,2.0713916,129.27637,0.17430839,11.794312,-1.6997619,-105.1416,-203.32286,17.097288,-16.430264,536.853,950000
72
+ 69.11769,60.095345,0.8200682,2.0209315,69.11769,0.16763392,8.644808,-1.0685079,-112.03896,-199.64368,39.185688,-40.821087,580.83185,955000
73
+ 821.9196,52.82723,0.8376874,2.0522065,821.9196,0.15373653,8.5947695,-2.3623211,-106.79146,-197.07117,70.24335,-75.03521,1013.6673,960000
74
+ 202.7137,56.48558,0.8770984,2.0862458,202.7137,0.16340709,17.999537,-0.8744426,-110.71029,-204.48079,67.792404,-76.65341,747.3883,965000
75
+ 94.14429,52.37113,0.8782801,1.993793,94.14429,0.16736406,5.5091844,-1.6583217,-109.598564,-203.3768,14.122066,-13.850578,469.75266,970000
76
+ 154.9466,83.45781,0.8896866,2.2318673,154.9466,0.14044331,13.062606,0.97417766,-106.31301,-194.48235,84.79022,-74.67646,1180.2909,975000
77
+ 71.0815,24.588028,0.76788616,1.5342438,71.0815,0.15407658,6.1259003,1.5550385,-106.5093,-202.06496,12.102496,-10.367851,382.7012,980000
78
+ 164.92126,73.11133,0.8730957,2.1343384,164.92126,0.15865943,16.426413,-2.8187873,-107.89237,-200.62706,34.533833,-45.392677,682.5751,985000
79
+ 130.82394,74.16406,0.8916479,2.62436,130.82394,0.16075987,7.023771,4.0799756,-109.8811,-203.0204,24.615273,-24.303646,604.153,990000
80
+ 80.26304,64.75675,0.80413014,1.8435382,80.26304,0.17246653,12.8868685,0.30688313,-109.1404,-194.55438,19.525543,-15.607178,449.79388,995000
81
+ 123.401764,66.34313,0.81568813,1.885455,123.401764,0.13740584,9.396936,-1.2801621,-105.67364,-201.23892,15.659647,-15.973287,512.97766,1000000
82
+ 69.14002,26.22055,0.71178067,1.3023082,69.14002,0.15613303,9.344432,0.2596136,-106.42743,-202.83096,20.38771,-21.02886,505.3443,1005000
83
+ 91.97873,33.146122,0.7846219,1.5416555,91.97873,0.15625207,10.645762,-8.168058,-111.9563,-200.09962,22.622398,-20.38896,586.61804,1010000
84
+ 181.26971,173.29984,0.8503919,2.91175,181.26971,0.15434423,9.009997,-1.1300106,-105.63971,-195.59328,63.03491,-72.65394,1231.7085,1015000
85
+ 15300.095,96.43712,0.9846521,3.2236278,15300.095,0.16769443,12.890714,0.16133317,-107.28279,-196.81927,166.86398,-173.32443,2141.3328,1020000
86
+ 61.621574,40.748653,0.7695305,1.5941527,61.621574,0.1724328,7.943975,-0.8669249,-103.43816,-204.28217,14.790212,-14.001775,400.68524,1025000
87
+ 96.61952,40.595093,0.88738155,2.1880867,96.61952,0.13918656,5.94731,-1.562173,-103.82969,-193.37045,25.40706,-26.564425,581.48645,1030000
88
+ 352.0761,86.9424,0.8131036,1.9839637,352.0761,0.16944647,7.945401,-0.7606796,-107.70794,-203.92319,45.156063,-48.56829,696.2001,1035000
89
+ 104.24572,82.99218,0.8169589,1.9926178,104.24572,0.12588346,13.67954,0.025616318,-100.08654,-203.04732,17.61375,-19.124722,534.149,1040000
90
+ 96.631,56.5016,0.80682576,1.9428357,96.631,0.15573333,7.8939257,-4.551935,-109.68579,-199.13771,21.3883,-16.988707,520.76904,1045000
91
+ 61.765343,38.34787,0.81095153,1.8212272,61.765343,0.15991107,9.2953205,-4.0365095,-100.757286,-190.88661,18.667572,-24.599667,489.51608,1050000
92
+ 132.57271,46.263367,0.7939622,1.7203248,132.57271,0.1555515,5.8343515,-2.8343046,-105.04922,-198.34929,17.406176,-17.154215,497.0741,1055000
93
+ 111.18706,57.76947,0.7670149,1.8662574,111.18706,0.14340937,14.324576,-3.6935694,-103.45711,-190.11461,18.121563,-16.330654,503.72333,1060000
94
+ 152.0599,67.84329,0.864278,2.0463395,152.0599,0.1488274,12.442489,0.11306816,-102.563835,-194.33258,16.24041,-18.117676,535.98047,1065000
95
+ 77.008484,56.465633,0.71490324,1.7902718,77.008484,0.16292518,11.351893,-1.5257083,-101.4096,-197.98996,62.28985,-71.82328,1040.186,1070000
96
+ 1661.9811,44.92079,0.75329834,1.7453952,1661.9811,0.15642813,10.620486,0.23484376,-102.23683,-203.10156,35.96415,-40.727848,891.6581,1075000
97
+ 113.96086,42.16313,0.85966843,1.8897458,113.96086,0.17036521,7.991859,1.1724658,-101.96935,-191.13919,9.874797,-9.831017,395.47815,1080000
98
+ 169.31976,57.798428,0.85721177,1.8759164,169.31976,0.15252313,5.9271617,0.63266104,-103.00437,-199.11816,29.646618,-25.018135,514.8704,1085000
99
+ 99.649414,125.30438,0.84761786,2.698416,99.649414,0.13272819,5.187229,-1.4829121,-102.29288,-202.05945,30.709936,-28.06792,650.7717,1090000
100
+ 125.41076,75.08093,0.92823607,2.6344483,125.41076,0.1279184,6.3107924,0.34163475,-97.12932,-204.65622,33.973812,-31.995897,605.9402,1095000
101
+ 98.8253,98.859726,0.9146226,2.359048,98.8253,0.14653623,12.0077305,2.5657792,-97.70174,-203.70912,79.49923,-89.67711,782.53046,1100000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/adj_loss,actor/adj_max,actor/adj_mean,actor/adj_std,actor/fast_loss,actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 199.9452,40.387928,0.784004,1.9907235,199.9452,0.18456106,9.789141,-48.24457,-155.0192,-202.92654,18.753033,-20.040485,512.9637,605000
3
+ 116.61518,76.023476,0.7756999,2.1610308,116.61518,0.19118792,10.710723,-31.602434,-152.65742,-196.55383,30.901573,-34.457214,427.11722,610000
4
+ 123.781876,42.380543,0.76387495,1.8013104,123.781876,0.16581784,10.629007,-41.65633,-150.19908,-204.0876,17.527462,-21.115095,588.7106,615000
5
+ 126.296555,47.299377,0.8715922,2.1562126,126.296555,0.17368104,6.710561,-24.64588,-148.40184,-204.58134,24.954351,-24.559948,481.87296,620000
6
+ 129.43523,33.162483,0.752738,1.5978246,129.43523,0.16912347,9.427962,-25.941093,-145.83899,-204.0547,8.526857,-8.940613,369.40637,625000
7
+ 111.862564,41.78308,0.83676744,1.9711531,111.862564,0.15047869,13.8391905,-21.66732,-141.5124,-203.0897,26.301693,-22.825474,534.88043,630000
8
+ 104.13173,40.529427,0.8204109,1.7225348,104.13173,0.17023334,14.389226,-39.606255,-141.25247,-202.2208,14.787575,-13.9938755,426.6805,635000
9
+ 131.6036,52.286327,0.847556,1.9634862,131.6036,0.17375723,13.920952,-2.7657866,-141.09807,-204.06955,19.698586,-16.091839,477.73407,640000
10
+ 91.90368,50.28231,0.8099301,1.7287381,91.90368,0.17538387,11.356357,-40.17901,-140.19829,-204.84181,10.244707,-10.184441,417.59134,645000
11
+ 209.56439,57.43921,0.83225065,2.236933,209.56439,0.21041459,10.708069,-26.784262,-140.56198,-203.79431,44.524418,-37.72982,902.8129,650000
12
+ 168.63562,30.233467,0.8479335,1.9812382,168.63562,0.2137897,14.312476,-3.9299257,-136.78337,-204.65732,23.018185,-17.73902,473.94485,655000
13
+ 119.6393,43.89304,0.814312,1.8169782,119.6393,0.21176249,16.045227,-3.5037966,-134.97952,-204.49083,15.293551,-15.447435,510.64334,660000
14
+ 97.36774,47.736557,0.8690089,1.9909066,97.36774,0.1880507,26.232605,-22.47203,-136.72437,-203.87105,25.014175,-25.230215,567.2256,665000
15
+ 300.46686,47.25294,0.7873778,1.7117751,300.46686,0.18350059,13.702174,-26.004904,-131.40787,-203.97539,16.951471,-14.361353,568.48566,670000
16
+ 1997.1726,50.71185,0.863642,2.2799623,1997.1726,0.1950092,8.840729,-37.72877,-136.6257,-204.78084,57.850414,-58.382507,1080.0751,675000
17
+ 117.445755,62.28786,0.8712573,2.1182458,117.445755,0.16657123,18.221767,-9.812429,-134.77232,-204.84421,21.814888,-21.745071,496.65433,680000
18
+ 304.38632,65.79671,0.9701635,2.7779725,304.38632,0.1761184,12.634371,-24.50457,-132.9669,-204.63765,62.749634,-70.703545,793.28,685000
19
+ 1633.2151,39.2109,0.84747195,1.8220631,1633.2151,0.18004072,14.869568,-7.9100046,-131.68681,-202.72878,35.712627,-39.46608,1077.104,690000
20
+ 74.48916,45.940987,0.8379964,2.196661,74.48916,0.19597974,12.5992985,-12.750108,-129.84406,-203.72578,42.086716,-31.80778,585.71344,695000
21
+ 236.81572,97.12334,0.9493601,3.0759294,236.81572,0.20628096,12.649602,-3.852098,-125.93261,-204.17636,25.189638,-24.137638,657.55493,700000
22
+ 110.40292,60.14348,0.86570007,1.895994,110.40292,0.19373718,14.011779,-7.248346,-130.97884,-204.80545,19.129957,-20.074875,469.14957,705000
23
+ 72.49425,30.535435,0.7542267,1.5890441,72.49425,0.18179429,9.890281,-0.44828638,-127.03965,-204.66855,12.742153,-11.920443,366.6977,710000
24
+ 156.06422,61.575825,0.7841343,1.7070885,156.06422,0.17184922,17.927404,0.12177783,-125.4343,-200.45535,12.616613,-12.226535,466.5873,715000
25
+ 858.8645,44.070778,0.8632446,2.1876543,858.8645,0.18218645,11.245328,-7.802379,-127.460815,-204.4561,21.323828,-22.761868,658.31494,720000
26
+ 99.98372,34.436348,0.8387096,1.900291,99.98372,0.15597677,9.790974,-6.845425,-131.5822,-205.12852,14.775505,-17.549631,453.32623,725000
27
+ 83.85759,31.245663,0.71451443,1.3745557,83.85759,0.18178865,11.536487,-2.7173047,-126.4156,-201.80025,28.175737,-21.50115,525.6182,730000
28
+ 84.70981,35.586876,0.83791447,1.9721576,84.70981,0.17996073,11.937095,4.8811407,-125.93778,-204.02756,13.099748,-12.63358,448.15125,735000
29
+ 99.702126,46.34567,0.8103316,1.5999976,99.702126,0.1428495,12.179325,-5.7280674,-122.15767,-192.97789,10.100585,-17.692085,455.85052,740000
30
+ 115.676315,51.08859,0.73316145,1.4774945,115.676315,0.15099597,13.225687,-11.864153,-125.622856,-204.49962,17.288893,-15.632038,512.95996,745000
31
+ 296.72595,40.276123,0.8414267,1.8307264,296.72595,0.14819518,9.244667,-12.657666,-126.04624,-203.6618,99.23802,-117.90273,1549.6028,750000
32
+ 75.31554,36.25149,0.7524312,1.5554774,75.31554,0.17218861,7.299953,-7.9652524,-124.77616,-203.99142,18.319195,-17.847937,428.06653,755000
33
+ 407.96024,48.242172,0.7840212,1.9501708,407.96024,0.1994437,15.865409,-4.1825147,-125.52351,-204.85384,20.60463,-22.563837,546.30597,760000
34
+ 297.12958,47.15028,0.8961228,2.200447,297.12958,0.19139022,13.47677,-2.0243084,-125.15696,-205.78304,42.369514,-29.418852,673.3399,765000
35
+ 134.61575,34.066273,0.71541274,1.4078795,134.61575,0.16459785,11.217406,4.6263833,-121.335915,-202.97942,25.3999,-21.273922,542.90686,770000
36
+ 86.78943,30.026144,0.7256012,1.4463723,86.78943,0.1731465,7.500441,-7.0219727,-123.620094,-205.91135,35.474716,-30.04348,519.3639,775000
37
+ 88.62467,69.54186,0.82238936,2.269766,88.62467,0.1766764,7.996998,1.6654927,-122.06277,-205.23578,23.381142,-27.346006,501.26358,780000
38
+ 258.0734,29.775005,0.82372147,1.5895425,258.0734,0.2005885,9.005185,0.66965634,-119.82251,-200.8203,37.73816,-35.82729,615.8845,785000
39
+ 79.11119,40.703876,0.84424543,1.818032,79.11119,0.16544735,8.460082,-2.2207017,-118.06835,-199.8282,32.461025,-31.901474,549.75415,790000
40
+ 121.9729,65.02798,0.8087415,2.113574,121.9729,0.16744576,8.028681,-3.2627184,-119.072975,-201.68086,16.555471,-21.597622,540.55005,795000
41
+ 64.40347,26.755758,0.76965475,1.4884417,64.40347,0.18077958,6.5515084,-0.16252185,-116.631676,-200.90225,20.470827,-21.329819,405.01788,800000
42
+ 76.90129,39.606064,0.79431194,1.6711079,76.90129,0.18487331,10.952805,-7.3467655,-120.43005,-200.0963,15.991554,-16.00049,447.18756,805000
43
+ 112.36836,41.272713,0.84486526,1.77354,112.36836,0.17275488,7.27037,-1.7278196,-117.81675,-200.34712,12.098246,-16.009174,451.49622,810000
44
+ 106.1145,45.15208,0.8163102,2.0301812,106.1145,0.19018981,8.623454,-8.787646,-119.49883,-204.05316,28.805677,-28.304516,467.5287,815000
45
+ 2398.619,80.21301,0.90760803,2.6960726,2398.619,0.17378718,9.32073,-8.874034,-119.12284,-203.55849,200.98038,-223.27432,1972.8844,820000
46
+ 62.67148,44.96986,0.795956,1.7212942,62.67148,0.1761771,16.717821,1.5251267,-113.08595,-198.53874,30.790401,-35.109234,513.5674,825000
47
+ 105.3577,45.45462,0.7925446,1.7962278,105.3577,0.18302529,6.366277,0.6178402,-119.69485,-199.3134,73.16652,-67.8741,730.08875,830000
48
+ 88.46961,53.23252,0.81713635,2.0402372,88.46961,0.17440906,6.387101,1.3297371,-114.77099,-200.9658,11.157689,-11.150724,405.27087,835000
49
+ 90.19444,34.6702,0.8193252,1.6806889,90.19444,0.18953502,12.497539,1.9220384,-116.73303,-203.97699,25.213224,-28.640495,477.07385,840000
50
+ 77.54814,28.131372,0.8158769,1.570888,77.54814,0.15820101,10.664752,-3.1312263,-117.37615,-201.99115,19.274866,-16.214056,465.75928,845000
51
+ 130.55583,74.17273,0.9245645,2.5407798,130.55583,0.15266714,7.0372806,-0.6423221,-109.07824,-204.27013,19.014631,-19.575254,600.4907,850000
52
+ 166.2614,41.734287,0.75466245,1.5426668,166.2614,0.1583428,8.894167,-2.1361284,-116.467285,-203.4683,35.967358,-39.374733,561.6554,855000
53
+ 66.68222,48.689423,0.8618977,2.0638297,66.68222,0.16559076,15.348536,3.7843833,-115.192116,-200.4728,9.027011,-9.840338,482.99847,860000
54
+ 174.76144,175.44623,0.9156026,3.477205,174.76144,0.16508558,9.351112,-5.5988984,-118.16953,-201.73517,34.035553,-38.656048,767.9825,865000
55
+ 63.467735,38.426514,0.76798284,1.6370564,63.467735,0.14187573,11.918647,1.5144751,-114.601295,-200.94809,35.83301,-39.680664,507.22577,870000
56
+ 284.4484,127.49327,0.885101,2.8271816,284.4484,0.16142745,10.902999,-4.0976644,-114.53332,-202.05414,73.8676,-98.94892,1041.4829,875000
57
+ 141.00276,54.18634,0.820929,1.9147552,141.00276,0.17173484,11.624194,-2.4935193,-116.96824,-202.66867,37.200706,-36.220406,694.43884,880000
58
+ 92.75488,58.041317,0.83708024,2.0786572,92.75488,0.12274319,8.187236,-2.2109857,-109.037575,-199.68143,18.314575,-18.216719,499.87036,885000
59
+ 115.22918,38.509007,0.80864227,1.8648466,115.22918,0.15855105,13.574714,-4.231057,-107.70778,-203.82166,41.324097,-48.76467,697.32214,890000
60
+ 265.05573,69.21505,0.8279326,2.1597712,265.05573,0.15720709,5.4897337,1.4719595,-109.89431,-200.55508,20.894363,-19.97661,622.89355,895000
61
+ 166.33757,170.01439,0.9331838,3.2310634,166.33757,0.1831056,9.544947,-4.72836,-112.59954,-197.87367,107.82995,-106.79586,1437.8136,900000
62
+ 126.573074,69.69075,0.7746323,1.9566298,126.573074,0.17245159,8.363074,-3.6770697,-114.56907,-197.50694,28.831131,-19.827318,565.7504,905000
63
+ 1280.8712,74.60937,0.9264285,2.3851745,1280.8712,0.14989658,10.843258,-10.177735,-111.87858,-201.73686,42.93881,-43.420914,1128.0752,910000
64
+ 62.542957,34.076195,0.79469055,1.6123196,62.542957,0.1940282,7.5075235,0.45209748,-111.62914,-192.04414,18.724487,-18.606592,447.19473,915000
65
+ 146.88736,67.42063,0.9241974,2.746955,146.88736,0.16450295,8.26858,-4.5153604,-112.13989,-199.9198,19.422316,-19.031672,534.25507,920000
66
+ 355.48178,41.502285,0.93326205,2.2749908,355.48178,0.1553685,10.377059,-6.840589,-112.314064,-202.40341,33.55652,-38.263256,695.0165,925000
67
+ 85.944786,57.16048,0.8441956,1.8133733,85.944786,0.16007003,13.826093,-1.7819649,-107.97915,-199.35509,15.694579,-15.3992,453.78253,930000
68
+ 216.51486,51.092186,0.87328947,2.0597308,216.51486,0.1641078,9.76714,-1.6427402,-107.532486,-200.56189,17.03799,-18.986279,614.08826,935000
69
+ 117.030914,58.393505,0.8291531,1.8996494,117.030914,0.20449492,13.284592,-3.1901727,-112.06089,-191.27219,17.99918,-20.01054,532.7954,940000
70
+ 297.34613,114.967964,1.0161694,2.915463,297.34613,0.16584441,16.819418,-1.2586844,-115.75478,-201.42812,32.33982,-33.728127,776.9388,945000
71
+ 129.27637,83.92449,0.80734557,2.0713916,129.27637,0.17430839,11.794312,-1.6997619,-105.1416,-203.32286,17.097288,-16.430264,536.853,950000
72
+ 69.11769,60.095345,0.8200682,2.0209315,69.11769,0.16763392,8.644808,-1.0685079,-112.03896,-199.64368,39.185688,-40.821087,580.83185,955000
73
+ 821.9196,52.82723,0.8376874,2.0522065,821.9196,0.15373653,8.5947695,-2.3623211,-106.79146,-197.07117,70.24335,-75.03521,1013.6673,960000
74
+ 202.7137,56.48558,0.8770984,2.0862458,202.7137,0.16340709,17.999537,-0.8744426,-110.71029,-204.48079,67.792404,-76.65341,747.3883,965000
75
+ 94.14429,52.37113,0.8782801,1.993793,94.14429,0.16736406,5.5091844,-1.6583217,-109.598564,-203.3768,14.122066,-13.850578,469.75266,970000
76
+ 154.9466,83.45781,0.8896866,2.2318673,154.9466,0.14044331,13.062606,0.97417766,-106.31301,-194.48235,84.79022,-74.67646,1180.2909,975000
77
+ 71.0815,24.588028,0.76788616,1.5342438,71.0815,0.15407658,6.1259003,1.5550385,-106.5093,-202.06496,12.102496,-10.367851,382.7012,980000
78
+ 164.92126,73.11133,0.8730957,2.1343384,164.92126,0.15865943,16.426413,-2.8187873,-107.89237,-200.62706,34.533833,-45.392677,682.5751,985000
79
+ 130.82394,74.16406,0.8916479,2.62436,130.82394,0.16075987,7.023771,4.0799756,-109.8811,-203.0204,24.615273,-24.303646,604.153,990000
80
+ 80.26304,64.75675,0.80413014,1.8435382,80.26304,0.17246653,12.8868685,0.30688313,-109.1404,-194.55438,19.525543,-15.607178,449.79388,995000
81
+ 123.401764,66.34313,0.81568813,1.885455,123.401764,0.13740584,9.396936,-1.2801621,-105.67364,-201.23892,15.659647,-15.973287,512.97766,1000000
82
+ 69.14002,26.22055,0.71178067,1.3023082,69.14002,0.15613303,9.344432,0.2596136,-106.42743,-202.83096,20.38771,-21.02886,505.3443,1005000
83
+ 91.97873,33.146122,0.7846219,1.5416555,91.97873,0.15625207,10.645762,-8.168058,-111.9563,-200.09962,22.622398,-20.38896,586.61804,1010000
84
+ 181.26971,173.29984,0.8503919,2.91175,181.26971,0.15434423,9.009997,-1.1300106,-105.63971,-195.59328,63.03491,-72.65394,1231.7085,1015000
85
+ 15300.095,96.43712,0.9846521,3.2236278,15300.095,0.16769443,12.890714,0.16133317,-107.28279,-196.81927,166.86398,-173.32443,2141.3328,1020000
86
+ 61.621574,40.748653,0.7695305,1.5941527,61.621574,0.1724328,7.943975,-0.8669249,-103.43816,-204.28217,14.790212,-14.001775,400.68524,1025000
87
+ 96.61952,40.595093,0.88738155,2.1880867,96.61952,0.13918656,5.94731,-1.562173,-103.82969,-193.37045,25.40706,-26.564425,581.48645,1030000
88
+ 352.0761,86.9424,0.8131036,1.9839637,352.0761,0.16944647,7.945401,-0.7606796,-107.70794,-203.92319,45.156063,-48.56829,696.2001,1035000
89
+ 104.24572,82.99218,0.8169589,1.9926178,104.24572,0.12588346,13.67954,0.025616318,-100.08654,-203.04732,17.61375,-19.124722,534.149,1040000
90
+ 96.631,56.5016,0.80682576,1.9428357,96.631,0.15573333,7.8939257,-4.551935,-109.68579,-199.13771,21.3883,-16.988707,520.76904,1045000
91
+ 61.765343,38.34787,0.81095153,1.8212272,61.765343,0.15991107,9.2953205,-4.0365095,-100.757286,-190.88661,18.667572,-24.599667,489.51608,1050000
92
+ 132.57271,46.263367,0.7939622,1.7203248,132.57271,0.1555515,5.8343515,-2.8343046,-105.04922,-198.34929,17.406176,-17.154215,497.0741,1055000
93
+ 111.18706,57.76947,0.7670149,1.8662574,111.18706,0.14340937,14.324576,-3.6935694,-103.45711,-190.11461,18.121563,-16.330654,503.72333,1060000
94
+ 152.0599,67.84329,0.864278,2.0463395,152.0599,0.1488274,12.442489,0.11306816,-102.563835,-194.33258,16.24041,-18.117676,535.98047,1065000
95
+ 77.008484,56.465633,0.71490324,1.7902718,77.008484,0.16292518,11.351893,-1.5257083,-101.4096,-197.98996,62.28985,-71.82328,1040.186,1070000
96
+ 1661.9811,44.92079,0.75329834,1.7453952,1661.9811,0.15642813,10.620486,0.23484376,-102.23683,-203.10156,35.96415,-40.727848,891.6581,1075000
97
+ 113.96086,42.16313,0.85966843,1.8897458,113.96086,0.17036521,7.991859,1.1724658,-101.96935,-191.13919,9.874797,-9.831017,395.47815,1080000
98
+ 169.31976,57.798428,0.85721177,1.8759164,169.31976,0.15252313,5.9271617,0.63266104,-103.00437,-199.11816,29.646618,-25.018135,514.8704,1085000
99
+ 99.649414,125.30438,0.84761786,2.698416,99.649414,0.13272819,5.187229,-1.4829121,-102.29288,-202.05945,30.709936,-28.06792,650.7717,1090000
100
+ 125.41076,75.08093,0.92823607,2.6344483,125.41076,0.1279184,6.3107924,0.34163475,-97.12932,-204.65622,33.973812,-31.995897,605.9402,1095000
101
+ 98.8253,98.859726,0.9146226,2.359048,98.8253,0.14653623,12.0077305,2.5657792,-97.70174,-203.70912,79.49923,-89.67711,782.53046,1100000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_1000000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98ebdd723de17fc59962329984280daad4fad4b6823bc50237e72f669cfbb9e5
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_1050000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07ca6a78c9aca4fd4d2a394d9c74dcfe9baf8cc4244ac5c294e19bc7523e58be
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_1100000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b6cb86f0cae444cd91c913872ba9b432db0302c56f5090395c92743ddc2adea
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f14aaf51d6552a7ffae9d3b9319fd6c6e3982f3f239365ee3c90362cd9ea8d7
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4545bb7752e22f1ad6dcf03123800e588062bdb80058c5677a19a72302a84f0
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26a484224ccd7b3672cea13fefb4f7a0751086a1529c821b8352f33e81da7049
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cca8e6951d12c4a14f8683a90073aad271b19d8af94ec375f463d59412d942f
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b5ff0357c8d23f8aea929a0139ecf605d2ad01f6d06739f264629221256b44a
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffce322d0539d1946e3c9dfa7e98b64e7bdaa923c573edf40a0cabf69d73d7c7
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/params_950000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:817bd6cb87c7fb75faae59d3f178df6c028be4f6f43a974e2b0b4dde62bb16e0
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_215352/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/ti4284jr