Tiredsheep commited on
Commit
a519009
·
verified ·
1 Parent(s): 2f44a56

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_150000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_200000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_250000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_300000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_350000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_400000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_450000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_500000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_550000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_600000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.03385103351037707,-0.010616247404904768,-0.03384401844749115,0.0031989451479318607,27.850763567383094,18.09799999999901,0.64,8991.52,-0.4,-500.64,359.96,1.1227212476730346,150000
3
+ 0.0,0.0,-0.019348406215918938,-0.00962307036397924,-0.0193532113442829,-0.009648295435645812,33.57245627171439,10.046999999999585,0.96,23773.26,-0.04,-277.62,198.94,0.6462104988098144,200000
4
+ 0.0,0.0,-0.000920401382665779,-0.004313898361735827,-0.0010067807858315859,-0.0028248553150622886,34.28144282930519,7.980999999999563,0.96,32806.2,-0.06,-225.78,157.62,0.5235851907730102,250000
5
+ 0.0,0.0,-0.009562072946173745,-0.004720033347244513,-0.00967361484180405,0.019710165072517338,35.06711177455224,7.377999999999584,1.0,40597.8,0.0,-208.9,145.56,0.48729743957519533,300000
6
+ 0.0,0.0,-0.016318924542043287,-0.004887201351372639,-0.016418156992558667,-0.001786110346209942,33.781529696808754,6.626999999999571,0.98,47624.04,-0.02,-182.24,130.54,0.43165849208831786,350000
7
+ 0.0,0.0,-0.014581414669869775,-0.005185560686161875,-0.014885829496432721,-0.003369998704214715,35.37773282416594,6.201999999999633,1.0,54295.12,0.0,-166.78,122.04,0.4118465709686279,400000
8
+ 0.0,0.0,-0.0287584283186193,0.006561642603341335,-0.02882080461053384,0.015665128396034535,35.27263949716333,5.599999999999676,1.0,60399.36,0.0,-150.8,110.0,0.38089192867279054,450000
9
+ 0.0,0.0,-0.00946136804744225,0.005616976124239648,-0.009169138438167383,-0.001079813445013522,35.12106424934494,5.05399999999967,1.0,65735.04,0.0,-135.88,99.08,0.3353633546829224,500000
10
+ 0.0,0.0,-0.02417046036036548,0.002871799379083545,-0.023849062058605323,0.0007284456823377965,35.5507515541935,4.921999999999703,1.0,70876.94,0.0,-133.38,96.44,0.33138572692871093,550000
11
+ 0.0,0.0,-0.01771153224969534,0.0156575334210416,-0.016952440355236787,0.009580046522440698,35.52035308817831,5.710999999999749,1.0,76043.34,0.0,-152.86,112.22,0.378305459022522,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.03385103351037707,-0.010616247404904768,-0.03384401844749115,0.0031989451479318607,27.850763567383094,18.09799999999901,0.64,8991.52,-0.4,-500.64,359.96,1.1227212476730346,150000
3
+ 0.0,0.0,-0.019348406215918938,-0.00962307036397924,-0.0193532113442829,-0.009648295435645812,33.57245627171439,10.046999999999585,0.96,23773.26,-0.04,-277.62,198.94,0.6462104988098144,200000
4
+ 0.0,0.0,-0.000920401382665779,-0.004313898361735827,-0.0010067807858315859,-0.0028248553150622886,34.28144282930519,7.980999999999563,0.96,32806.2,-0.06,-225.78,157.62,0.5235851907730102,250000
5
+ 0.0,0.0,-0.009562072946173745,-0.004720033347244513,-0.00967361484180405,0.019710165072517338,35.06711177455224,7.377999999999584,1.0,40597.8,0.0,-208.9,145.56,0.48729743957519533,300000
6
+ 0.0,0.0,-0.016318924542043287,-0.004887201351372639,-0.016418156992558667,-0.001786110346209942,33.781529696808754,6.626999999999571,0.98,47624.04,-0.02,-182.24,130.54,0.43165849208831786,350000
7
+ 0.0,0.0,-0.014581414669869775,-0.005185560686161875,-0.014885829496432721,-0.003369998704214715,35.37773282416594,6.201999999999633,1.0,54295.12,0.0,-166.78,122.04,0.4118465709686279,400000
8
+ 0.0,0.0,-0.0287584283186193,0.006561642603341335,-0.02882080461053384,0.015665128396034535,35.27263949716333,5.599999999999676,1.0,60399.36,0.0,-150.8,110.0,0.38089192867279054,450000
9
+ 0.0,0.0,-0.00946136804744225,0.005616976124239648,-0.009169138438167383,-0.001079813445013522,35.12106424934494,5.05399999999967,1.0,65735.04,0.0,-135.88,99.08,0.3353633546829224,500000
10
+ 0.0,0.0,-0.02417046036036548,0.002871799379083545,-0.023849062058605323,0.0007284456823377965,35.5507515541935,4.921999999999703,1.0,70876.94,0.0,-133.38,96.44,0.33138572692871093,550000
11
+ 0.0,0.0,-0.01771153224969534,0.0156575334210416,-0.016952440355236787,0.009580046522440698,35.52035308817831,5.710999999999749,1.0,76043.34,0.0,-152.86,112.22,0.378305459022522,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/adj_loss,actor/adj_max,actor/adj_mean,actor/adj_std,actor/fast_loss,actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 84.9986,38.490253,0.65134263,1.38216,84.9986,0.2231794,8.21242,-53.741108,-158.01625,-204.42906,8.688932,-10.577248,356.46786,105000
3
+ 71.80443,19.740747,0.6285404,1.2179642,71.80443,0.19830465,11.146601,-77.03343,-157.0688,-201.66331,8.620195,-11.487813,396.64877,110000
4
+ 1450.8083,34.65538,0.6678076,1.3058261,1450.8083,0.19830379,6.7819543,-53.91802,-156.67021,-202.15552,25.610573,-25.510687,781.62256,115000
5
+ 219.07047,33.349052,0.7260814,1.377426,219.07047,0.20159224,8.327773,-65.1689,-156.64775,-205.83165,14.998541,-16.313728,485.24066,120000
6
+ 548.9114,21.711025,0.7093183,1.4310056,548.9114,0.19329041,7.001138,-60.18718,-154.8955,-202.6037,34.598522,-31.269981,743.83875,125000
7
+ 72.10883,54.83886,0.72847897,1.931026,72.10883,0.19961098,6.3651943,-68.2359,-154.09921,-205.06859,9.269782,-13.57906,385.3069,130000
8
+ 73.44324,25.194992,0.6608466,1.2994014,73.44324,0.17738083,11.062413,-73.26482,-154.30846,-201.96234,15.307721,-16.57786,434.8391,135000
9
+ 60.037003,26.291428,0.6445731,1.2450026,60.037003,0.18798184,10.213315,-58.797443,-154.42174,-204.776,12.994168,-12.894409,353.39706,140000
10
+ 71.05096,40.616985,0.7128165,1.5807749,71.05096,0.17759523,7.5404215,-90.74909,-156.05646,-200.53044,13.097041,-10.418508,371.60846,145000
11
+ 85.57614,35.63509,0.6749023,1.2831047,85.57614,0.2063818,11.529177,-68.39919,-155.79845,-202.53891,14.331142,-13.58364,427.0389,150000
12
+ 221.71332,33.790993,0.7484053,1.4896675,221.71332,0.20386174,25.66815,-35.22244,-149.6881,-205.58583,10.775572,-11.463785,570.9187,155000
13
+ 156.7138,30.45201,0.68260586,1.2442116,156.7138,0.21948534,11.207429,-50.277164,-146.26947,-203.60765,21.483,-22.642382,529.82776,160000
14
+ 98.567184,48.958073,0.9392311,2.1652136,98.567184,0.17548627,20.886068,-25.841606,-144.13316,-205.48604,19.108625,-20.79315,485.79037,165000
15
+ 198.52177,29.562206,0.8487519,1.7444082,198.52177,0.1890708,11.542412,-31.525604,-135.69987,-205.11978,15.52565,-15.317123,531.3907,170000
16
+ 268.63324,44.609154,0.8242529,1.9295472,268.63324,0.19294724,11.505355,-7.931072,-141.07509,-204.74529,17.630358,-22.742083,586.13434,175000
17
+ 91.5396,39.034492,0.81521297,1.6495264,91.5396,0.17907217,6.6592607,-14.702395,-138.93867,-202.65674,15.816161,-14.579877,474.1693,180000
18
+ 72.3384,36.28542,0.71464807,1.2782298,72.3384,0.16901502,8.375873,-55.86979,-138.06282,-205.73732,9.86204,-9.664801,384.8045,185000
19
+ 92.78259,35.89763,0.87836874,1.980462,92.78259,0.19223672,14.584076,-16.653263,-138.53746,-206.24194,43.439144,-45.438644,621.8632,190000
20
+ 65.15044,34.23367,0.7728893,1.600216,65.15044,0.14981565,8.034434,-19.48286,-137.42471,-207.08798,9.405551,-9.493402,407.43945,195000
21
+ 194.90286,40.70943,0.75752765,1.5772402,194.90286,0.1743502,14.973487,-10.823095,-133.3817,-205.32596,50.77012,-49.777184,759.6549,200000
22
+ 127.71857,37.147015,0.824467,1.4425995,127.71857,0.19919568,11.704943,-33.824585,-136.99939,-203.89441,19.312954,-20.355133,566.60144,205000
23
+ 107.74555,34.62462,0.8341346,1.751991,107.74555,0.18402164,40.50252,-33.536797,-134.0385,-205.00055,11.743233,-10.553571,503.23215,210000
24
+ 152.84265,45.01117,0.7340411,1.3862822,152.84265,0.16535807,13.897203,0.6640814,-130.2428,-207.00949,35.26787,-28.308777,656.849,215000
25
+ 152.46095,82.406235,0.75744796,2.171418,152.46095,0.17566273,12.42583,-17.245298,-133.11992,-206.90717,11.671249,-12.283522,451.00583,220000
26
+ 522.701,28.850016,0.78091717,1.406027,522.701,0.21372673,15.542922,1.9261624,-135.07552,-200.05025,19.496601,-20.800238,586.3484,225000
27
+ 308.21774,51.76392,0.8510136,1.8743544,308.21774,0.17705989,13.71037,-8.4884205,-132.19273,-202.17552,51.084625,-54.515938,1025.366,230000
28
+ 805.5532,43.81808,0.7985733,1.7025145,805.5532,0.18057218,6.718457,1.3565173,-131.69077,-199.22342,77.340454,-46.60201,1088.6672,235000
29
+ 69.08243,31.789879,0.7148272,1.3504378,69.08243,0.21667987,12.104392,-3.8577733,-125.91089,-195.36058,10.35708,-10.353268,414.29288,240000
30
+ 106.39357,26.893793,0.8241099,1.4993757,106.39357,0.18119174,16.779936,-7.645455,-130.33867,-199.33064,11.435097,-13.942217,436.7211,245000
31
+ 76.1992,44.597893,0.7560875,1.5606606,76.1992,0.19960274,11.792714,-1.7389245,-130.81798,-204.91092,24.740555,-20.54556,468.87445,250000
32
+ 228.27785,148.20648,0.83528364,3.1322594,228.27785,0.17188673,10.855125,-1.5222214,-129.34703,-203.14763,52.7293,-52.787807,820.3153,255000
33
+ 133.68375,47.948673,0.7697123,1.7332665,133.68375,0.18813561,15.019637,-20.758224,-130.69571,-205.75293,10.723822,-11.807228,455.89185,260000
34
+ 63.422714,44.745003,0.82768965,1.6325815,63.422714,0.18332802,13.511748,1.2949204,-127.513115,-195.73401,12.703833,-12.47715,383.00537,265000
35
+ 103.28775,51.96643,0.87539977,1.8172731,103.28775,0.18794492,9.756273,-0.67552876,-124.72268,-201.47227,7.909751,-7.187502,391.13373,270000
36
+ 132.68022,43.93638,0.78716856,2.0164766,132.68022,0.21751435,9.879516,-31.524637,-130.07755,-206.44225,39.60531,-32.976486,685.974,275000
37
+ 83.9982,43.438244,0.8292384,1.8491647,83.9982,0.18626916,11.746462,1.4606591,-128.5084,-204.77426,14.171001,-16.072771,499.5422,280000
38
+ 87.61865,37.16065,0.71766186,1.3198029,87.61865,0.18317533,8.398822,-6.1316986,-122.21763,-193.4382,25.024677,-20.552155,500.6711,285000
39
+ 48.273506,52.904873,0.75464916,1.4859717,48.273506,0.16403145,7.5321784,-4.553059,-123.732254,-201.28328,8.859496,-8.635879,342.011,290000
40
+ 84.65943,40.67781,0.83642775,1.898746,84.65943,0.17639187,6.6089263,-8.609693,-127.05672,-200.36346,10.263585,-9.4640875,408.64874,295000
41
+ 113.328995,43.365753,0.8207455,1.9048511,113.328995,0.19876163,12.530192,-3.704317,-124.27002,-201.70216,37.51599,-32.694477,598.0128,300000
42
+ 78.46153,27.283104,0.7989409,1.4488378,78.46153,0.16089018,13.2798815,1.7791697,-124.68052,-201.17387,16.092913,-17.304956,462.81128,305000
43
+ 672.2737,41.60972,0.842259,1.6914173,672.2737,0.16638775,9.894249,-2.6931477,-124.86061,-195.05202,26.588545,-21.034996,735.77423,310000
44
+ 124.76822,41.06168,0.76338875,1.5441905,124.76822,0.17252925,11.578829,-4.654511,-127.97793,-205.70935,37.35299,-39.712715,653.97687,315000
45
+ 120.92458,31.133564,0.7759654,1.409005,120.92458,0.1568943,7.359407,-4.732303,-122.8489,-197.64975,11.604851,-12.918893,386.51392,320000
46
+ 77.47899,56.72152,0.81528544,1.9918426,77.47899,0.19119981,14.115352,-5.3410535,-119.94784,-201.57439,11.417133,-14.768316,445.69647,325000
47
+ 325.22958,70.97129,0.8076796,2.2718678,325.22958,0.19424349,7.434391,-5.8761735,-124.049614,-200.09326,20.565613,-20.159649,608.7074,330000
48
+ 104.481346,49.54311,0.84009093,2.1351945,104.481346,0.16939506,6.201992,-4.5997767,-121.46748,-204.28247,48.69379,-51.859028,664.61206,335000
49
+ 86.40007,37.892002,0.82187665,1.7849493,86.40007,0.1691418,11.344989,2.8591762,-123.9685,-206.24869,20.596172,-19.672804,555.71533,340000
50
+ 79.38672,36.792473,0.88142747,1.734323,79.38672,0.18577464,9.362975,-4.1407633,-122.42339,-202.4346,13.854903,-21.52782,439.23044,345000
51
+ 252.95921,37.313107,0.775518,1.6437738,252.95921,0.16821179,11.733416,-1.8437394,-110.326294,-205.11015,13.602529,-14.788429,440.7539,350000
52
+ 3651.2917,57.626434,0.81523144,2.1398342,3651.2917,0.16856289,9.161817,-2.966847,-122.5767,-202.7774,52.548138,-51.49904,1294.411,355000
53
+ 64.23634,33.17639,0.82690704,1.6498772,64.23634,0.19962955,10.72042,0.588774,-119.744286,-203.07811,13.45561,-13.724808,408.9029,360000
54
+ 71.080635,37.46924,0.8638291,1.8039786,71.080635,0.17148551,7.7987075,-4.056342,-121.677246,-202.5961,16.029196,-15.959038,430.79602,365000
55
+ 216.78818,48.531868,0.91077316,1.9897447,216.78818,0.18084814,15.056406,-5.1918354,-120.77445,-202.03221,13.243851,-14.269577,512.9997,370000
56
+ 92.73246,48.64613,0.83046955,1.7610444,92.73246,0.19168735,6.5771117,0.5093008,-116.410034,-203.00813,18.57888,-16.516748,474.93036,375000
57
+ 161.6145,55.921955,0.9540994,2.2136002,161.6145,0.18293454,6.5310388,-7.458355,-121.45044,-197.05507,35.183556,-30.310081,606.96936,380000
58
+ 136.03465,53.63168,0.88887185,2.012301,136.03465,0.1645481,9.159507,-4.6393023,-115.36672,-196.37299,32.374157,-28.227627,627.42084,385000
59
+ 90.72073,85.05633,0.89413875,2.3462472,90.72073,0.15680324,14.94815,-3.8244007,-112.83593,-199.95097,17.04215,-16.948996,493.63257,390000
60
+ 338.9651,53.77865,0.8633517,2.0960102,338.9651,0.16113189,7.9767923,0.6883432,-114.43147,-203.24858,16.499435,-15.538507,564.058,395000
61
+ 219.14107,90.067696,0.93138653,2.5374782,219.14107,0.13984978,10.330123,-0.48604184,-117.54424,-199.65112,15.947937,-15.535738,556.9319,400000
62
+ 72.10672,27.98709,0.73238933,1.3534682,72.10672,0.17138283,9.492484,-4.4979577,-117.616264,-201.17018,16.588198,-14.615789,452.2244,405000
63
+ 475.84723,48.37165,0.87457764,2.02035,475.84723,0.16075395,15.622342,-7.450268,-115.509605,-204.3447,16.458332,-18.307468,668.64404,410000
64
+ 132.93723,99.645905,0.94589347,2.901441,132.93723,0.18277797,9.461051,3.2320051,-115.874,-198.04318,65.74164,-62.692886,783.3456,415000
65
+ 114.17372,51.375523,0.7930702,1.8984705,114.17372,0.169837,13.00455,-3.9641886,-117.72256,-198.84982,18.49348,-17.959616,469.59387,420000
66
+ 238.99358,51.285633,0.9062994,2.0000052,238.99358,0.17658281,8.741752,-2.9115453,-116.78699,-203.97638,45.644432,-40.478672,812.58215,425000
67
+ 2506.9482,56.29423,0.99440753,2.4166048,2506.9482,0.18536519,7.799747,-0.16168718,-114.162796,-201.33519,50.681854,-54.724392,1132.9775,430000
68
+ 810.0545,50.058975,0.88397014,2.3720396,810.0545,0.16525365,12.986582,-4.866958,-114.58105,-196.6716,22.05334,-31.238918,725.22424,435000
69
+ 101.839554,36.750954,0.75649196,1.3419853,101.839554,0.19717325,12.252675,-0.81006825,-115.81699,-199.55286,14.499509,-16.674034,502.94543,440000
70
+ 97.599335,68.064384,0.86793035,1.8926169,97.599335,0.17137769,8.838882,-5.1897793,-120.458855,-200.23172,11.593443,-13.17149,423.07834,445000
71
+ 174.83582,51.287567,0.8762877,2.4377725,174.83582,0.15701263,8.575307,-6.5566244,-109.57361,-205.49174,22.260086,-22.746935,622.0069,450000
72
+ 2548.2532,33.961983,0.7440039,1.3785844,2548.2532,0.15169556,8.31474,-0.5715104,-113.56325,-201.10742,79.57989,-71.33638,1410.0388,455000
73
+ 91.70215,43.62592,0.800348,1.6937621,91.70215,0.18876983,8.243253,-4.868858,-111.6074,-201.17792,15.098608,-15.740318,458.14203,460000
74
+ 94.54309,28.654772,0.81867504,1.5935866,94.54309,0.16738439,8.944723,-3.8670204,-116.101135,-204.90266,19.452074,-14.687879,472.31833,465000
75
+ 395.2856,32.98037,0.8388029,1.688208,395.2856,0.1640034,14.212847,-3.6405795,-115.00442,-200.83392,14.303207,-13.332868,525.8547,470000
76
+ 83.78932,59.604153,0.9169752,2.3102028,83.78932,0.16834147,10.566783,0.76702535,-111.16856,-197.73349,37.083546,-42.06968,778.31116,475000
77
+ 162.92493,42.411205,0.76884276,1.6901368,162.92493,0.15925641,8.074055,0.9953007,-110.146416,-200.34506,14.037521,-19.302116,485.71106,480000
78
+ 103.860466,57.710693,0.8444749,1.9697499,103.860466,0.14222254,9.00529,0.6815147,-112.32104,-200.59338,32.936237,-30.860853,548.0703,485000
79
+ 94.07065,32.039505,0.8779022,1.693911,94.07065,0.16627432,11.504512,4.6098895,-113.758354,-199.32204,12.724657,-12.508746,439.66428,490000
80
+ 72.83943,38.168636,0.81087947,1.5516995,72.83943,0.16348962,9.277791,-3.27739,-112.52378,-190.81831,10.369949,-9.972333,398.6861,495000
81
+ 101.870804,34.23674,0.77842444,1.4383914,101.870804,0.14892262,7.321419,0.17214409,-106.67578,-199.1479,20.452936,-20.222765,467.23663,500000
82
+ 127.79046,99.50051,0.92487407,2.2952237,127.79046,0.17695993,15.635508,-0.7711282,-111.25478,-201.60017,15.805653,-13.867865,502.92523,505000
83
+ 109.09259,38.933296,0.8472357,1.7792853,109.09259,0.19294398,7.495514,-5.086394,-114.46069,-194.63588,11.830526,-14.859557,411.97272,510000
84
+ 202.58356,44.393642,0.8289693,2.0253313,202.58356,0.15584931,4.07896,-3.2346933,-108.31439,-190.99124,59.27357,-39.83462,653.86926,515000
85
+ 167.8015,68.147194,0.9603267,2.4210396,167.8015,0.1720478,13.428798,-1.7049742,-112.48351,-196.59813,48.293465,-47.080208,838.8777,520000
86
+ 123.579605,48.321133,0.88175994,2.0516856,123.579605,0.15430884,9.350075,-3.2023575,-107.999146,-201.57047,15.126288,-16.755049,438.998,525000
87
+ 196.70557,120.43546,0.85734177,2.3159778,196.70557,0.1810668,8.431354,-1.2252799,-108.81414,-199.11755,85.95344,-79.01262,1108.2952,530000
88
+ 77.75775,31.352087,0.73715514,1.4743444,77.75775,0.18277466,6.801811,-5.859634,-111.122,-197.25482,13.83059,-14.393426,413.513,535000
89
+ 292.4198,74.57016,0.87583935,2.2357063,292.4198,0.14935282,11.9120865,-4.2060637,-105.784,-200.47827,11.752449,-13.537443,540.3278,540000
90
+ 105.220184,49.1251,0.85643184,1.9133042,105.220184,0.17687315,6.732488,-1.0561564,-111.51544,-194.99706,13.317604,-14.593079,391.75742,545000
91
+ 431.6839,68.63869,0.8475386,2.0386324,431.6839,0.1420134,9.78439,1.4054762,-105.57383,-188.67372,15.02692,-14.345902,557.2569,550000
92
+ 1149.7229,30.199726,0.765263,1.4871308,1149.7229,0.17151617,10.315224,-3.935351,-109.864586,-198.82225,19.391724,-18.26979,752.9205,555000
93
+ 170.35075,77.99528,0.89683735,2.329923,170.35075,0.15721218,11.540813,0.983745,-105.00065,-184.55766,30.742935,-29.539663,542.2997,560000
94
+ 162.8379,131.30463,0.98578215,3.0197399,162.8379,0.17083316,19.248049,-2.2953825,-107.525246,-194.65265,36.784378,-32.050293,890.22125,565000
95
+ 51.544548,22.923882,0.7190681,1.2243936,51.544548,0.14861679,6.1750407,-1.7422162,-103.00594,-190.52397,12.024064,-12.397168,390.0031,570000
96
+ 93.27014,33.817444,0.8105764,1.5704151,93.27014,0.17951879,12.468375,-4.8765507,-105.14292,-203.656,14.194128,-14.339928,447.76508,575000
97
+ 163.91164,104.91942,0.8463881,2.1340363,163.91164,0.14521353,10.693664,1.2752868,-107.673706,-198.24275,10.648975,-10.769197,479.54364,580000
98
+ 104.36951,43.51225,0.9013191,2.050441,104.36951,0.16994676,9.086749,-2.0451095,-106.23256,-197.26317,14.491342,-10.148512,454.91376,585000
99
+ 55.59825,53.53889,0.77959555,1.5354826,55.59825,0.16713539,4.716781,-1.7410746,-107.36354,-198.04944,10.407258,-10.876343,366.6279,590000
100
+ 4002.9648,72.9704,0.9210225,2.4739516,4002.9648,0.12963635,9.205474,-1.3758767,-101.18406,-201.37773,89.45847,-96.14933,1732.6564,595000
101
+ 278.67145,49.53215,0.9139203,2.022677,278.67145,0.17482448,8.577777,2.495098,-99.37137,-202.62375,72.01041,-48.577602,674.02826,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/adj_loss,actor/adj_max,actor/adj_mean,actor/adj_std,actor/fast_loss,actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 84.9986,38.490253,0.65134263,1.38216,84.9986,0.2231794,8.21242,-53.741108,-158.01625,-204.42906,8.688932,-10.577248,356.46786,105000
3
+ 71.80443,19.740747,0.6285404,1.2179642,71.80443,0.19830465,11.146601,-77.03343,-157.0688,-201.66331,8.620195,-11.487813,396.64877,110000
4
+ 1450.8083,34.65538,0.6678076,1.3058261,1450.8083,0.19830379,6.7819543,-53.91802,-156.67021,-202.15552,25.610573,-25.510687,781.62256,115000
5
+ 219.07047,33.349052,0.7260814,1.377426,219.07047,0.20159224,8.327773,-65.1689,-156.64775,-205.83165,14.998541,-16.313728,485.24066,120000
6
+ 548.9114,21.711025,0.7093183,1.4310056,548.9114,0.19329041,7.001138,-60.18718,-154.8955,-202.6037,34.598522,-31.269981,743.83875,125000
7
+ 72.10883,54.83886,0.72847897,1.931026,72.10883,0.19961098,6.3651943,-68.2359,-154.09921,-205.06859,9.269782,-13.57906,385.3069,130000
8
+ 73.44324,25.194992,0.6608466,1.2994014,73.44324,0.17738083,11.062413,-73.26482,-154.30846,-201.96234,15.307721,-16.57786,434.8391,135000
9
+ 60.037003,26.291428,0.6445731,1.2450026,60.037003,0.18798184,10.213315,-58.797443,-154.42174,-204.776,12.994168,-12.894409,353.39706,140000
10
+ 71.05096,40.616985,0.7128165,1.5807749,71.05096,0.17759523,7.5404215,-90.74909,-156.05646,-200.53044,13.097041,-10.418508,371.60846,145000
11
+ 85.57614,35.63509,0.6749023,1.2831047,85.57614,0.2063818,11.529177,-68.39919,-155.79845,-202.53891,14.331142,-13.58364,427.0389,150000
12
+ 221.71332,33.790993,0.7484053,1.4896675,221.71332,0.20386174,25.66815,-35.22244,-149.6881,-205.58583,10.775572,-11.463785,570.9187,155000
13
+ 156.7138,30.45201,0.68260586,1.2442116,156.7138,0.21948534,11.207429,-50.277164,-146.26947,-203.60765,21.483,-22.642382,529.82776,160000
14
+ 98.567184,48.958073,0.9392311,2.1652136,98.567184,0.17548627,20.886068,-25.841606,-144.13316,-205.48604,19.108625,-20.79315,485.79037,165000
15
+ 198.52177,29.562206,0.8487519,1.7444082,198.52177,0.1890708,11.542412,-31.525604,-135.69987,-205.11978,15.52565,-15.317123,531.3907,170000
16
+ 268.63324,44.609154,0.8242529,1.9295472,268.63324,0.19294724,11.505355,-7.931072,-141.07509,-204.74529,17.630358,-22.742083,586.13434,175000
17
+ 91.5396,39.034492,0.81521297,1.6495264,91.5396,0.17907217,6.6592607,-14.702395,-138.93867,-202.65674,15.816161,-14.579877,474.1693,180000
18
+ 72.3384,36.28542,0.71464807,1.2782298,72.3384,0.16901502,8.375873,-55.86979,-138.06282,-205.73732,9.86204,-9.664801,384.8045,185000
19
+ 92.78259,35.89763,0.87836874,1.980462,92.78259,0.19223672,14.584076,-16.653263,-138.53746,-206.24194,43.439144,-45.438644,621.8632,190000
20
+ 65.15044,34.23367,0.7728893,1.600216,65.15044,0.14981565,8.034434,-19.48286,-137.42471,-207.08798,9.405551,-9.493402,407.43945,195000
21
+ 194.90286,40.70943,0.75752765,1.5772402,194.90286,0.1743502,14.973487,-10.823095,-133.3817,-205.32596,50.77012,-49.777184,759.6549,200000
22
+ 127.71857,37.147015,0.824467,1.4425995,127.71857,0.19919568,11.704943,-33.824585,-136.99939,-203.89441,19.312954,-20.355133,566.60144,205000
23
+ 107.74555,34.62462,0.8341346,1.751991,107.74555,0.18402164,40.50252,-33.536797,-134.0385,-205.00055,11.743233,-10.553571,503.23215,210000
24
+ 152.84265,45.01117,0.7340411,1.3862822,152.84265,0.16535807,13.897203,0.6640814,-130.2428,-207.00949,35.26787,-28.308777,656.849,215000
25
+ 152.46095,82.406235,0.75744796,2.171418,152.46095,0.17566273,12.42583,-17.245298,-133.11992,-206.90717,11.671249,-12.283522,451.00583,220000
26
+ 522.701,28.850016,0.78091717,1.406027,522.701,0.21372673,15.542922,1.9261624,-135.07552,-200.05025,19.496601,-20.800238,586.3484,225000
27
+ 308.21774,51.76392,0.8510136,1.8743544,308.21774,0.17705989,13.71037,-8.4884205,-132.19273,-202.17552,51.084625,-54.515938,1025.366,230000
28
+ 805.5532,43.81808,0.7985733,1.7025145,805.5532,0.18057218,6.718457,1.3565173,-131.69077,-199.22342,77.340454,-46.60201,1088.6672,235000
29
+ 69.08243,31.789879,0.7148272,1.3504378,69.08243,0.21667987,12.104392,-3.8577733,-125.91089,-195.36058,10.35708,-10.353268,414.29288,240000
30
+ 106.39357,26.893793,0.8241099,1.4993757,106.39357,0.18119174,16.779936,-7.645455,-130.33867,-199.33064,11.435097,-13.942217,436.7211,245000
31
+ 76.1992,44.597893,0.7560875,1.5606606,76.1992,0.19960274,11.792714,-1.7389245,-130.81798,-204.91092,24.740555,-20.54556,468.87445,250000
32
+ 228.27785,148.20648,0.83528364,3.1322594,228.27785,0.17188673,10.855125,-1.5222214,-129.34703,-203.14763,52.7293,-52.787807,820.3153,255000
33
+ 133.68375,47.948673,0.7697123,1.7332665,133.68375,0.18813561,15.019637,-20.758224,-130.69571,-205.75293,10.723822,-11.807228,455.89185,260000
34
+ 63.422714,44.745003,0.82768965,1.6325815,63.422714,0.18332802,13.511748,1.2949204,-127.513115,-195.73401,12.703833,-12.47715,383.00537,265000
35
+ 103.28775,51.96643,0.87539977,1.8172731,103.28775,0.18794492,9.756273,-0.67552876,-124.72268,-201.47227,7.909751,-7.187502,391.13373,270000
36
+ 132.68022,43.93638,0.78716856,2.0164766,132.68022,0.21751435,9.879516,-31.524637,-130.07755,-206.44225,39.60531,-32.976486,685.974,275000
37
+ 83.9982,43.438244,0.8292384,1.8491647,83.9982,0.18626916,11.746462,1.4606591,-128.5084,-204.77426,14.171001,-16.072771,499.5422,280000
38
+ 87.61865,37.16065,0.71766186,1.3198029,87.61865,0.18317533,8.398822,-6.1316986,-122.21763,-193.4382,25.024677,-20.552155,500.6711,285000
39
+ 48.273506,52.904873,0.75464916,1.4859717,48.273506,0.16403145,7.5321784,-4.553059,-123.732254,-201.28328,8.859496,-8.635879,342.011,290000
40
+ 84.65943,40.67781,0.83642775,1.898746,84.65943,0.17639187,6.6089263,-8.609693,-127.05672,-200.36346,10.263585,-9.4640875,408.64874,295000
41
+ 113.328995,43.365753,0.8207455,1.9048511,113.328995,0.19876163,12.530192,-3.704317,-124.27002,-201.70216,37.51599,-32.694477,598.0128,300000
42
+ 78.46153,27.283104,0.7989409,1.4488378,78.46153,0.16089018,13.2798815,1.7791697,-124.68052,-201.17387,16.092913,-17.304956,462.81128,305000
43
+ 672.2737,41.60972,0.842259,1.6914173,672.2737,0.16638775,9.894249,-2.6931477,-124.86061,-195.05202,26.588545,-21.034996,735.77423,310000
44
+ 124.76822,41.06168,0.76338875,1.5441905,124.76822,0.17252925,11.578829,-4.654511,-127.97793,-205.70935,37.35299,-39.712715,653.97687,315000
45
+ 120.92458,31.133564,0.7759654,1.409005,120.92458,0.1568943,7.359407,-4.732303,-122.8489,-197.64975,11.604851,-12.918893,386.51392,320000
46
+ 77.47899,56.72152,0.81528544,1.9918426,77.47899,0.19119981,14.115352,-5.3410535,-119.94784,-201.57439,11.417133,-14.768316,445.69647,325000
47
+ 325.22958,70.97129,0.8076796,2.2718678,325.22958,0.19424349,7.434391,-5.8761735,-124.049614,-200.09326,20.565613,-20.159649,608.7074,330000
48
+ 104.481346,49.54311,0.84009093,2.1351945,104.481346,0.16939506,6.201992,-4.5997767,-121.46748,-204.28247,48.69379,-51.859028,664.61206,335000
49
+ 86.40007,37.892002,0.82187665,1.7849493,86.40007,0.1691418,11.344989,2.8591762,-123.9685,-206.24869,20.596172,-19.672804,555.71533,340000
50
+ 79.38672,36.792473,0.88142747,1.734323,79.38672,0.18577464,9.362975,-4.1407633,-122.42339,-202.4346,13.854903,-21.52782,439.23044,345000
51
+ 252.95921,37.313107,0.775518,1.6437738,252.95921,0.16821179,11.733416,-1.8437394,-110.326294,-205.11015,13.602529,-14.788429,440.7539,350000
52
+ 3651.2917,57.626434,0.81523144,2.1398342,3651.2917,0.16856289,9.161817,-2.966847,-122.5767,-202.7774,52.548138,-51.49904,1294.411,355000
53
+ 64.23634,33.17639,0.82690704,1.6498772,64.23634,0.19962955,10.72042,0.588774,-119.744286,-203.07811,13.45561,-13.724808,408.9029,360000
54
+ 71.080635,37.46924,0.8638291,1.8039786,71.080635,0.17148551,7.7987075,-4.056342,-121.677246,-202.5961,16.029196,-15.959038,430.79602,365000
55
+ 216.78818,48.531868,0.91077316,1.9897447,216.78818,0.18084814,15.056406,-5.1918354,-120.77445,-202.03221,13.243851,-14.269577,512.9997,370000
56
+ 92.73246,48.64613,0.83046955,1.7610444,92.73246,0.19168735,6.5771117,0.5093008,-116.410034,-203.00813,18.57888,-16.516748,474.93036,375000
57
+ 161.6145,55.921955,0.9540994,2.2136002,161.6145,0.18293454,6.5310388,-7.458355,-121.45044,-197.05507,35.183556,-30.310081,606.96936,380000
58
+ 136.03465,53.63168,0.88887185,2.012301,136.03465,0.1645481,9.159507,-4.6393023,-115.36672,-196.37299,32.374157,-28.227627,627.42084,385000
59
+ 90.72073,85.05633,0.89413875,2.3462472,90.72073,0.15680324,14.94815,-3.8244007,-112.83593,-199.95097,17.04215,-16.948996,493.63257,390000
60
+ 338.9651,53.77865,0.8633517,2.0960102,338.9651,0.16113189,7.9767923,0.6883432,-114.43147,-203.24858,16.499435,-15.538507,564.058,395000
61
+ 219.14107,90.067696,0.93138653,2.5374782,219.14107,0.13984978,10.330123,-0.48604184,-117.54424,-199.65112,15.947937,-15.535738,556.9319,400000
62
+ 72.10672,27.98709,0.73238933,1.3534682,72.10672,0.17138283,9.492484,-4.4979577,-117.616264,-201.17018,16.588198,-14.615789,452.2244,405000
63
+ 475.84723,48.37165,0.87457764,2.02035,475.84723,0.16075395,15.622342,-7.450268,-115.509605,-204.3447,16.458332,-18.307468,668.64404,410000
64
+ 132.93723,99.645905,0.94589347,2.901441,132.93723,0.18277797,9.461051,3.2320051,-115.874,-198.04318,65.74164,-62.692886,783.3456,415000
65
+ 114.17372,51.375523,0.7930702,1.8984705,114.17372,0.169837,13.00455,-3.9641886,-117.72256,-198.84982,18.49348,-17.959616,469.59387,420000
66
+ 238.99358,51.285633,0.9062994,2.0000052,238.99358,0.17658281,8.741752,-2.9115453,-116.78699,-203.97638,45.644432,-40.478672,812.58215,425000
67
+ 2506.9482,56.29423,0.99440753,2.4166048,2506.9482,0.18536519,7.799747,-0.16168718,-114.162796,-201.33519,50.681854,-54.724392,1132.9775,430000
68
+ 810.0545,50.058975,0.88397014,2.3720396,810.0545,0.16525365,12.986582,-4.866958,-114.58105,-196.6716,22.05334,-31.238918,725.22424,435000
69
+ 101.839554,36.750954,0.75649196,1.3419853,101.839554,0.19717325,12.252675,-0.81006825,-115.81699,-199.55286,14.499509,-16.674034,502.94543,440000
70
+ 97.599335,68.064384,0.86793035,1.8926169,97.599335,0.17137769,8.838882,-5.1897793,-120.458855,-200.23172,11.593443,-13.17149,423.07834,445000
71
+ 174.83582,51.287567,0.8762877,2.4377725,174.83582,0.15701263,8.575307,-6.5566244,-109.57361,-205.49174,22.260086,-22.746935,622.0069,450000
72
+ 2548.2532,33.961983,0.7440039,1.3785844,2548.2532,0.15169556,8.31474,-0.5715104,-113.56325,-201.10742,79.57989,-71.33638,1410.0388,455000
73
+ 91.70215,43.62592,0.800348,1.6937621,91.70215,0.18876983,8.243253,-4.868858,-111.6074,-201.17792,15.098608,-15.740318,458.14203,460000
74
+ 94.54309,28.654772,0.81867504,1.5935866,94.54309,0.16738439,8.944723,-3.8670204,-116.101135,-204.90266,19.452074,-14.687879,472.31833,465000
75
+ 395.2856,32.98037,0.8388029,1.688208,395.2856,0.1640034,14.212847,-3.6405795,-115.00442,-200.83392,14.303207,-13.332868,525.8547,470000
76
+ 83.78932,59.604153,0.9169752,2.3102028,83.78932,0.16834147,10.566783,0.76702535,-111.16856,-197.73349,37.083546,-42.06968,778.31116,475000
77
+ 162.92493,42.411205,0.76884276,1.6901368,162.92493,0.15925641,8.074055,0.9953007,-110.146416,-200.34506,14.037521,-19.302116,485.71106,480000
78
+ 103.860466,57.710693,0.8444749,1.9697499,103.860466,0.14222254,9.00529,0.6815147,-112.32104,-200.59338,32.936237,-30.860853,548.0703,485000
79
+ 94.07065,32.039505,0.8779022,1.693911,94.07065,0.16627432,11.504512,4.6098895,-113.758354,-199.32204,12.724657,-12.508746,439.66428,490000
80
+ 72.83943,38.168636,0.81087947,1.5516995,72.83943,0.16348962,9.277791,-3.27739,-112.52378,-190.81831,10.369949,-9.972333,398.6861,495000
81
+ 101.870804,34.23674,0.77842444,1.4383914,101.870804,0.14892262,7.321419,0.17214409,-106.67578,-199.1479,20.452936,-20.222765,467.23663,500000
82
+ 127.79046,99.50051,0.92487407,2.2952237,127.79046,0.17695993,15.635508,-0.7711282,-111.25478,-201.60017,15.805653,-13.867865,502.92523,505000
83
+ 109.09259,38.933296,0.8472357,1.7792853,109.09259,0.19294398,7.495514,-5.086394,-114.46069,-194.63588,11.830526,-14.859557,411.97272,510000
84
+ 202.58356,44.393642,0.8289693,2.0253313,202.58356,0.15584931,4.07896,-3.2346933,-108.31439,-190.99124,59.27357,-39.83462,653.86926,515000
85
+ 167.8015,68.147194,0.9603267,2.4210396,167.8015,0.1720478,13.428798,-1.7049742,-112.48351,-196.59813,48.293465,-47.080208,838.8777,520000
86
+ 123.579605,48.321133,0.88175994,2.0516856,123.579605,0.15430884,9.350075,-3.2023575,-107.999146,-201.57047,15.126288,-16.755049,438.998,525000
87
+ 196.70557,120.43546,0.85734177,2.3159778,196.70557,0.1810668,8.431354,-1.2252799,-108.81414,-199.11755,85.95344,-79.01262,1108.2952,530000
88
+ 77.75775,31.352087,0.73715514,1.4743444,77.75775,0.18277466,6.801811,-5.859634,-111.122,-197.25482,13.83059,-14.393426,413.513,535000
89
+ 292.4198,74.57016,0.87583935,2.2357063,292.4198,0.14935282,11.9120865,-4.2060637,-105.784,-200.47827,11.752449,-13.537443,540.3278,540000
90
+ 105.220184,49.1251,0.85643184,1.9133042,105.220184,0.17687315,6.732488,-1.0561564,-111.51544,-194.99706,13.317604,-14.593079,391.75742,545000
91
+ 431.6839,68.63869,0.8475386,2.0386324,431.6839,0.1420134,9.78439,1.4054762,-105.57383,-188.67372,15.02692,-14.345902,557.2569,550000
92
+ 1149.7229,30.199726,0.765263,1.4871308,1149.7229,0.17151617,10.315224,-3.935351,-109.864586,-198.82225,19.391724,-18.26979,752.9205,555000
93
+ 170.35075,77.99528,0.89683735,2.329923,170.35075,0.15721218,11.540813,0.983745,-105.00065,-184.55766,30.742935,-29.539663,542.2997,560000
94
+ 162.8379,131.30463,0.98578215,3.0197399,162.8379,0.17083316,19.248049,-2.2953825,-107.525246,-194.65265,36.784378,-32.050293,890.22125,565000
95
+ 51.544548,22.923882,0.7190681,1.2243936,51.544548,0.14861679,6.1750407,-1.7422162,-103.00594,-190.52397,12.024064,-12.397168,390.0031,570000
96
+ 93.27014,33.817444,0.8105764,1.5704151,93.27014,0.17951879,12.468375,-4.8765507,-105.14292,-203.656,14.194128,-14.339928,447.76508,575000
97
+ 163.91164,104.91942,0.8463881,2.1340363,163.91164,0.14521353,10.693664,1.2752868,-107.673706,-198.24275,10.648975,-10.769197,479.54364,580000
98
+ 104.36951,43.51225,0.9013191,2.050441,104.36951,0.16994676,9.086749,-2.0451095,-106.23256,-197.26317,14.491342,-10.148512,454.91376,585000
99
+ 55.59825,53.53889,0.77959555,1.5354826,55.59825,0.16713539,4.716781,-1.7410746,-107.36354,-198.04944,10.407258,-10.876343,366.6279,590000
100
+ 4002.9648,72.9704,0.9210225,2.4739516,4002.9648,0.12963635,9.205474,-1.3758767,-101.18406,-201.37773,89.45847,-96.14933,1732.6564,595000
101
+ 278.67145,49.53215,0.9139203,2.022677,278.67145,0.17482448,8.577777,2.495098,-99.37137,-202.62375,72.01041,-48.577602,674.02826,600000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cac518d9a7aa762567ce73e83e0891f42a8168f18f16263ff433dd9f75e8d547
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f29cb146c5f84611035439a81ae2105816ef1cf4682568420c9cf1a536683f8e
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54ad1dc1fc88f1716bac51dfd7522b07f7b7431ecf02686c1966a407fcbf4fd1
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89034f32f310af293a30632453d50d55969a7605d6117741f2b471391cf313c1
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17db721c2835e99415aa5d43bdf951079eea70539cead49596e11907078a8656
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab611deb2ad40c64c19cfca07d6a71b1ed3507bf2727fc6994e730f52e9e1026
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa9dfd18ef4b0408733d08f0c88650b06be7e4423212b8929b0b0a9423e51cbc
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3584c013cfa6384b46aeaeeb307a1507bb1710a8b29ac8e6261f3b3857a29121
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8b8a437760d9e636e75653c4b3c5b5d40991dc960be8b1428428a0e6bacd787
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef7831843db7e3b5739fc270e87c7a11a20b244a10ac35e614614d4bd97d0199
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260318_121804/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/1odm5r9y