Tiredsheep commited on
Commit
af045b5
·
verified ·
1 Parent(s): 4e0b568

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_350000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_400000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_450000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_500000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_550000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_600000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_650000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_700000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_750000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_800000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.18023879206055538,-0.0015090259749501631,-0.1802771316583113,-0.0004450533770509198,27.623941996356216,50.10000000001527,0.0,25500.0,-1.02,-1013.6,1000.0,3.0428732299804686,350000
3
+ 0.0,0.0,-0.1764988287383111,-0.004752026065822408,-0.17678020312898618,-0.005053791620835983,29.47941383502958,50.10000000001527,0.0,77500.0,-1.02,-1019.64,1000.0,3.073791470527649,400000
4
+ 0.0,0.0,-0.1881473674782404,0.00029935094471769696,-0.1881279261179786,0.0001999090870128458,32.827550192509555,50.10000000001527,0.0,129500.0,-1.02,-1019.58,1000.0,3.0785155963897703,450000
5
+ 0.0,0.0,-0.1863560185578464,0.0009274905285603198,-0.18629731867647367,0.000856554790798375,34.21534544723085,48.230000000014655,0.04,180583.7,-0.98,-982.12,962.6,2.9646342468261717,500000
6
+ 0.0,0.0,-0.17846615061623086,-0.0021202988673427194,-0.17857304315375871,-0.001775641041719191,33.93582426949633,50.10000000001527,0.0,231630.0,-1.0,-1000.0,1000.0,3.075405898094177,550000
7
+ 0.0,0.0,-0.17256955624843898,-0.0015509329581578953,-0.1726852102208228,-0.0019737425483242733,32.873393013884225,50.10000000001527,0.0,283630.0,-1.0,-1000.0,1000.0,3.0667025947570803,600000
8
+ 0.0,0.0,-0.17269818598565545,0.00022526790990483415,-0.1726829985263323,0.000290520635124085,34.17882695808487,50.10000000001527,0.0,335630.0,-1.0,-1000.0,1000.0,3.0610155630111695,650000
9
+ 0.0,0.0,-0.18972412804697894,-0.00036082169914548857,-0.18974408099461781,-0.0003212047160283418,34.77472398078858,50.10000000001527,0.0,387630.0,-1.0,-1000.0,1000.0,3.0999815893173217,700000
10
+ 0.0,0.0,-0.17654538863547928,-0.0009057599582300324,-0.17657596467670522,-0.000667767765128538,33.39504806668945,48.22200000001465,0.04,439047.48,-0.96,-962.4,962.44,2.952495188713074,750000
11
+ 0.0,0.0,-0.15431464359759367,0.0008218001362183306,-0.15432091667350833,0.00034033101401089393,32.925095281633354,50.10000000001527,0.0,489752.0,-1.0,-1000.0,1000.0,3.0637408018112184,800000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.18023879206055538,-0.0015090259749501631,-0.1802771316583113,-0.0004450533770509198,27.623941996356216,50.10000000001527,0.0,25500.0,-1.02,-1013.6,1000.0,3.0428732299804686,350000
3
+ 0.0,0.0,-0.1764988287383111,-0.004752026065822408,-0.17678020312898618,-0.005053791620835983,29.47941383502958,50.10000000001527,0.0,77500.0,-1.02,-1019.64,1000.0,3.073791470527649,400000
4
+ 0.0,0.0,-0.1881473674782404,0.00029935094471769696,-0.1881279261179786,0.0001999090870128458,32.827550192509555,50.10000000001527,0.0,129500.0,-1.02,-1019.58,1000.0,3.0785155963897703,450000
5
+ 0.0,0.0,-0.1863560185578464,0.0009274905285603198,-0.18629731867647367,0.000856554790798375,34.21534544723085,48.230000000014655,0.04,180583.7,-0.98,-982.12,962.6,2.9646342468261717,500000
6
+ 0.0,0.0,-0.17846615061623086,-0.0021202988673427194,-0.17857304315375871,-0.001775641041719191,33.93582426949633,50.10000000001527,0.0,231630.0,-1.0,-1000.0,1000.0,3.075405898094177,550000
7
+ 0.0,0.0,-0.17256955624843898,-0.0015509329581578953,-0.1726852102208228,-0.0019737425483242733,32.873393013884225,50.10000000001527,0.0,283630.0,-1.0,-1000.0,1000.0,3.0667025947570803,600000
8
+ 0.0,0.0,-0.17269818598565545,0.00022526790990483415,-0.1726829985263323,0.000290520635124085,34.17882695808487,50.10000000001527,0.0,335630.0,-1.0,-1000.0,1000.0,3.0610155630111695,650000
9
+ 0.0,0.0,-0.18972412804697894,-0.00036082169914548857,-0.18974408099461781,-0.0003212047160283418,34.77472398078858,50.10000000001527,0.0,387630.0,-1.0,-1000.0,1000.0,3.0999815893173217,700000
10
+ 0.0,0.0,-0.17654538863547928,-0.0009057599582300324,-0.17657596467670522,-0.000667767765128538,33.39504806668945,48.22200000001465,0.04,439047.48,-0.96,-962.4,962.44,2.952495188713074,750000
11
+ 0.0,0.0,-0.15431464359759367,0.0008218001362183306,-0.15432091667350833,0.00034033101401089393,32.925095281633354,50.10000000001527,0.0,489752.0,-1.0,-1000.0,1000.0,3.0637408018112184,800000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
2
+ 0.6644302,287.8457,0.004301978,-0.0013610249,-12.816372,0.16198651,-287.7906,288.00632,8.001165,10.007518,-108.30868,-288.85437,-303.09412,18.008682,4.098134,-4.5296106,256.24353,305000
3
+ 0.669014,285.04434,0.0044764197,0.0008986983,-12.299237,0.19769819,-284.98932,285.24292,2.5018673,6.8204665,-158.03436,-285.81882,-302.53674,9.322334,0.5658894,-0.96999526,94.73556,310000
4
+ 0.6571826,281.06274,0.0042703114,0.0008337927,-12.304747,0.1729198,-281.0102,281.23648,4.428573,13.595145,-107.44074,-282.02234,-302.79538,18.023718,6.5452075,-6.394309,259.48553,315000
5
+ 0.6490956,287.14832,0.004355761,-0.00081868254,-12.687954,0.18398614,-287.09302,287.33148,2.8152614,6.1822915,-173.55641,-288.85425,-302.85696,8.997553,1.2361869,-1.0007355,124.54308,320000
6
+ 0.6456623,284.20053,0.0042796414,-0.01512543,-16.034275,0.21283051,-284.1319,284.39822,2.343795,5.308229,-106.823845,-285.45068,-302.7311,7.6520243,0.69752705,-0.5811456,88.27592,325000
7
+ 0.6692465,284.2591,0.004191262,0.008407374,-10.494071,0.20007658,-284.2151,284.46756,1.5856186,5.480632,2.2329502,-284.99323,-302.72598,7.0662503,2.464924,-2.4509728,93.22647,330000
8
+ 0.6680937,287.7744,0.004306559,0.0050009303,-11.338764,0.17685218,-287.72556,287.95627,1.6979821,7.003452,-103.10716,-288.69296,-302.6692,8.701434,0.6177458,-0.57384676,88.99411,335000
9
+ 0.6727923,283.28986,0.004692932,0.014388341,-9.43404,0.18402806,-283.24557,283.48825,2.012737,3.614269,-100.91894,-284.1826,-302.71667,5.627006,0.8767326,-1.0045528,80.76254,340000
10
+ 0.66874313,283.97925,0.0043335566,0.0040230346,-11.571655,0.18635349,-283.92908,284.16962,1.9605721,5.972544,-100.83468,-284.88223,-303.20203,7.9331164,1.7814046,-0.8960423,108.84259,345000
11
+ 0.662225,282.29016,0.004123468,0.0031395229,-11.738621,0.19507983,-282.24176,282.48837,1.3459777,4.350292,-100.40695,-283.35104,-302.7905,5.69627,0.67335373,-0.53554124,75.93465,350000
12
+ 0.65680236,282.80157,0.0044184527,0.00011928326,-12.473003,0.19026282,-282.74646,282.99197,2.0741482,7.7435327,-100.757645,-283.8674,-303.05832,9.81768,0.81936425,-1.6414585,96.99141,355000
13
+ 0.6625112,282.81732,0.004552278,0.003535646,-11.723324,0.21912019,-282.76395,283.03998,1.7698987,5.650407,-102.03703,-283.4048,-302.69366,7.4203053,1.0559391,-0.8942263,92.79312,360000
14
+ 0.66274655,283.7535,0.004277591,0.0041669407,-11.525867,0.18087336,-283.70422,283.93857,1.5166241,3.9052784,-100.69106,-284.83517,-303.09534,5.4219027,0.69302154,-0.6310374,72.50021,365000
15
+ 0.65287185,276.27982,0.004554521,0.0019007329,-12.082671,0.18424967,-276.2248,276.46594,1.6134278,4.6983204,-101.012054,-277.2858,-302.72998,6.311748,0.72091556,-0.47588557,76.53245,370000
16
+ 0.644207,275.3484,0.004359532,-0.015020308,-15.9453945,0.21017215,-275.27887,275.54355,2.5729294,6.452949,-37.602314,-277.15982,-302.77444,9.025879,1.3512064,-1.4069008,116.32476,375000
17
+ 0.6349845,276.985,0.0042854883,-0.01621786,-16.284367,0.18621714,-276.91522,277.155,2.679957,4.933501,-100.61954,-278.13116,-302.4467,7.6134577,1.0171608,-1.0772505,82.52959,380000
18
+ 0.6523465,279.07056,0.0043897163,-0.00943801,-14.650027,0.18695939,-279.00626,279.24808,2.1781363,6.59966,-67.12562,-279.9166,-302.6114,8.777796,1.0517906,-2.068527,123.032684,385000
19
+ 0.6476531,280.09946,0.0044805435,-0.0058048554,-13.795569,0.17369725,-280.03766,280.26736,2.1712122,5.6169953,-100.28506,-281.108,-302.5187,7.7882075,0.6982482,-0.9801612,91.471634,390000
20
+ 0.654013,279.575,0.0044190786,0.0040249852,-11.58918,0.18384722,-279.5238,279.76288,1.7756637,4.599647,-100.51435,-280.50818,-303.49994,6.375311,0.7141902,-0.7056673,74.72863,395000
21
+ 0.6381815,276.80457,0.0040838025,-0.014336305,-16.010529,0.16644864,-276.7392,276.95667,1.8178848,7.81055,-87.03934,-277.8911,-302.5544,9.628435,1.6649102,-1.998895,105.31186,400000
22
+ 0.6605147,280.26273,0.0042364174,0.0019830733,-12.0318985,0.20053121,-280.21176,280.46524,1.7050847,5.1348224,-100.46689,-281.1069,-302.83203,6.839907,0.65522087,-0.6160283,78.406555,405000
23
+ 0.64635277,279.9599,0.004161377,-0.011098709,-15.167076,0.19476625,-279.89676,280.14355,17.680342,6.6968055,-45.13941,-280.883,-302.6795,24.377148,1.8115996,-1.3298532,134.22011,410000
24
+ 0.6451673,276.6292,0.0040364903,-0.008576957,-14.624855,0.2063176,-276.57016,276.82697,1.5537825,13.052439,-100.550545,-277.77258,-302.7233,14.606221,4.8850656,-4.919883,174.38593,415000
25
+ 0.6494969,273.31052,0.0041016284,0.0005039767,-12.377128,0.1777437,-273.25977,273.48877,1.4975628,5.3284984,-100.35958,-274.17596,-302.47562,6.8260612,0.68214244,-0.6576895,75.86508,420000
26
+ 0.66763616,280.3579,0.0040141484,0.007210281,-10.703783,0.19056647,-280.31497,280.55566,1.2604564,4.6342573,-87.381096,-281.40952,-302.6503,5.894714,2.3723512,-0.5575035,86.777435,425000
27
+ 0.6605937,277.74777,0.0041731643,-0.0023355887,-13.059669,0.2047035,-277.69327,277.95013,3.4085443,5.5912046,-100.472404,-279.09445,-302.95157,8.999749,5.23813,-5.455099,175.68408,430000
28
+ 0.65392745,278.68732,0.0038837008,-0.00025921315,-12.566744,0.168918,-278.6385,278.856,2.2438924,5.9817033,-100.37773,-279.638,-302.6359,8.225595,2.160954,-0.8957074,93.15115,435000
29
+ 0.66499525,274.94727,0.0040012947,0.0018859672,-12.028661,0.20882758,-274.89914,275.158,1.5758051,5.0442686,-100.384575,-275.6686,-302.57257,6.620074,0.6256214,-0.42625925,67.98132,440000
30
+ 0.65481436,272.33228,0.003872646,0.0035685443,-11.578526,0.19697094,-272.28748,272.5328,3.5737865,6.2261424,-100.29901,-273.4665,-302.76025,9.799929,12.808319,-10.697351,276.96747,445000
31
+ 0.65546554,278.28687,0.004019086,-0.0007593394,-12.688933,0.16655791,-278.2359,278.45267,1.5980083,3.8631642,-100.41003,-278.92905,-302.43604,5.4611726,0.7026018,-0.4638818,61.097366,450000
32
+ 0.6530008,276.0895,0.004059205,-0.0008696637,-12.714245,0.17226967,-276.0379,276.26093,1.6492262,4.7996707,-100.23153,-276.6734,-302.263,6.448897,2.778954,-2.1379287,104.44095,455000
33
+ 0.6554821,270.7886,0.004188647,-0.0010720481,-12.755941,0.20318736,-270.7352,270.99072,1.4621271,4.5579104,-100.2724,-271.70786,-302.70422,6.0200377,0.69879264,-0.6608154,71.084145,460000
34
+ 0.6596234,272.28433,0.0042293207,0.00020159713,-12.452333,0.18037684,-272.2317,272.46494,1.481711,4.0395947,-100.382126,-273.58005,-302.6132,5.5213056,0.79350924,-0.6443036,77.29178,465000
35
+ 0.6597553,271.3466,0.003791467,0.0042950646,-11.367176,0.19965884,-271.30347,271.55054,6.704764,8.09662,-100.35994,-272.56296,-302.63586,14.801384,3.584199,-4.219602,160.16846,470000
36
+ 0.65404415,272.3339,0.003939522,-0.0019079355,-12.984306,0.19806805,-272.2827,272.53003,2.508462,4.109176,-100.28566,-273.24667,-302.7701,6.617638,0.6730824,-0.44346315,71.69325,475000
37
+ 0.6443356,272.5381,0.004073699,-0.009242656,-14.768861,0.19652185,-272.4779,272.72537,2.0353892,4.711815,-100.127144,-273.27554,-303.6413,6.747204,1.8147693,-2.4370422,99.715706,480000
38
+ 0.65857786,269.04218,0.0039341175,0.0023757946,-11.896105,0.16081099,-268.99536,269.20535,1.8709191,3.9811037,-100.32084,-269.6927,-302.7424,5.8520226,0.60452056,-0.4251092,64.4144,485000
39
+ 0.6573267,268.54608,0.0039117783,0.00030795048,-12.421276,0.1734781,-268.4975,268.71988,1.3003157,5.4634376,-100.13655,-269.3789,-302.34528,6.7637534,1.0261009,-0.73550916,69.89128,490000
40
+ 0.64508665,275.90652,0.0038667505,-0.002922797,-13.255879,0.18168011,-275.85526,276.08527,1.4121122,4.0830064,-100.23735,-276.85333,-302.30975,5.4951186,0.9995203,-0.7321601,73.63788,495000
41
+ 0.65551853,268.85327,0.004202587,-0.008610755,-14.548918,0.17566916,-268.7921,269.02032,3.322596,10.674686,-100.21806,-269.29572,-302.84332,13.997282,1.5054824,-1.5703661,131.9115,500000
42
+ 0.6427433,268.26453,0.0038748495,-0.010073147,-15.099623,0.19395903,-268.20602,268.44843,2.2759125,4.583321,-100.22445,-268.8059,-302.29855,6.859234,0.69423974,-0.88444555,93.4533,505000
43
+ 0.6571682,271.0443,0.0040199105,0.0070433007,-10.747896,0.21194865,-271.0011,271.2633,1.5017874,4.3578935,-99.52925,-271.89786,-302.4765,5.859681,0.7393448,-0.54491407,76.837074,510000
44
+ 0.6587528,267.78476,0.0039496333,0.004225918,-11.430048,0.16876166,-267.73962,267.95773,1.200001,2.9682362,-100.31598,-268.7687,-302.72293,4.168237,0.64519405,-0.82751095,61.47215,515000
45
+ 0.65593934,272.69125,0.0038750123,0.00035068076,-12.409502,0.18954614,-272.64316,272.88113,1.1828362,3.6375356,-100.33802,-273.47617,-302.5813,4.8203716,0.4260553,-0.4827187,67.59282,520000
46
+ 0.6568121,273.8451,0.0038406441,0.0018908884,-12.007664,0.17333534,-273.79895,274.02032,1.2490805,3.3988464,-100.20055,-274.90918,-302.368,4.647927,0.5365727,-0.40816203,59.02067,525000
47
+ 0.6500991,274.06863,0.0039715273,-0.008600781,-14.66561,0.1958934,-274.01038,274.25592,1.9873003,5.445539,-98.17235,-275.61444,-302.3528,7.4328394,3.7452836,-4.854759,143.24277,530000
48
+ 0.67411834,270.74377,0.0040188543,0.012923867,-9.284191,0.23322387,-270.70648,270.9899,1.3411597,5.6793184,-33.86404,-271.3967,-302.20087,7.0204782,0.84348214,-0.63969225,73.10893,535000
49
+ 0.65211546,273.46133,0.0040447,-0.004379292,-13.582724,0.16345622,-273.40643,273.6204,7.947208,17.57704,-100.43764,-274.84146,-302.58685,25.524248,6.8441515,-5.3247223,265.4073,540000
50
+ 0.6679531,264.74036,0.003797679,0.010362425,-9.771379,0.18761022,-264.70325,264.93835,1.2662568,5.8906693,-100.06622,-265.27158,-302.4461,7.156926,3.9169266,-4.6824527,139.70099,545000
51
+ 0.6800357,274.62732,0.003876801,0.010078472,-9.900312,0.15891287,-274.58893,274.7963,1.3751003,3.5062625,-100.19342,-275.72073,-302.6781,4.881363,0.71664006,-0.49707633,62.339462,550000
52
+ 0.66053504,268.6845,0.0038398895,0.0070922105,-10.653017,0.1911758,-268.64362,268.88275,1.4140915,3.830838,-97.96146,-269.43677,-302.55444,5.2449293,1.2219263,-0.9967634,68.86004,555000
53
+ 0.66772884,267.34796,0.00404272,0.008648295,-10.360773,0.18598686,-267.3061,267.54257,1.4683155,5.016164,-100.20284,-268.07144,-302.24536,6.4844794,2.213316,-1.7816901,101.025055,560000
54
+ 0.65750456,268.48126,0.0039412277,0.0060885507,-10.955164,0.18179497,-268.43808,268.66916,1.2141771,7.4797683,-100.18381,-269.7825,-302.57443,8.693945,2.9628515,-3.7657597,153.93706,565000
55
+ 0.6553488,272.4113,0.004336389,-0.0086391475,-14.492245,0.16905552,-272.34845,272.57172,1.591072,5.9920764,-38.81717,-273.2822,-302.1164,7.5831485,2.0837677,-1.8157223,89.32085,570000
56
+ 0.66209334,265.23227,0.003963708,0.005093901,-11.214865,0.20234497,-265.1878,265.4397,1.669854,6.014098,-42.50181,-266.38013,-302.71277,7.6839523,0.64316297,-0.58341014,76.3264,575000
57
+ 0.66747314,265.31818,0.0037663234,0.0017377925,-12.038597,0.17254105,-265.27286,265.49246,1.0499634,2.3537674,-100.1745,-266.13474,-302.2984,3.4037309,0.45182693,-0.33286244,44.759933,580000
58
+ 0.649006,270.77295,0.0035283635,-0.0034338837,-13.473223,0.16599843,-270.7254,270.9355,1.2050089,10.894768,-100.21717,-271.6336,-302.88657,12.099776,1.231109,-0.9039874,105.517,585000
59
+ 0.6528696,264.6501,0.0038359056,-0.004105354,-13.570244,0.16549526,-264.59802,264.81146,1.2072431,3.6726937,-100.35389,-265.76242,-302.2865,4.8799367,0.5456162,-0.3511809,57.99547,590000
60
+ 0.6617504,271.2904,0.0037523787,0.0026927923,-11.782377,0.18054736,-271.2462,271.47363,0.92026776,3.2275212,-100.365685,-272.2999,-302.5638,4.147789,0.66860366,-0.4718945,56.707996,595000
61
+ 0.659523,266.08838,0.0035880085,0.0045060376,-11.24414,0.18162605,-266.04803,266.27454,1.1805038,3.5469193,-100.23354,-266.89136,-302.09723,4.727423,0.51158184,-0.75029886,67.283554,600000
62
+ 0.6771019,265.48233,0.003541884,0.009156585,-9.91477,0.17284378,-265.4472,265.66434,1.1025395,5.048964,-100.29571,-266.24423,-302.31107,6.1515036,1.9376183,-1.858375,64.21513,605000
63
+ 0.64834964,263.59625,0.0036061932,-0.006125565,-14.198624,0.17041332,-263.54504,263.76053,1.1674837,3.0481842,-92.88444,-264.3798,-302.31848,4.2156677,0.41323245,-0.41355324,51.28817,610000
64
+ 0.66491616,259.6806,0.0038658269,0.0033103533,-11.643688,0.16935983,-259.6356,259.85327,2.1344888,4.4233394,-100.19764,-260.55853,-302.2452,6.557828,0.6677824,-0.76642835,71.79792,615000
65
+ 0.65818435,255.5948,0.003945643,0.011605198,-9.558731,0.15347782,-255.55707,255.75989,1.1583645,3.3778894,-100.22854,-256.32275,-302.00275,4.536254,0.40150627,-0.3952595,49.97339,620000
66
+ 0.6453615,267.089,0.0038598739,-0.004301594,-13.614439,0.1539142,-267.03644,267.2386,1.5865153,3.7322907,-100.22377,-268.267,-302.0116,5.318806,0.5008452,-0.50049746,59.186512,625000
67
+ 0.6614549,262.7303,0.0038760304,0.0016772699,-12.067271,0.14656617,-262.6835,262.87854,1.2616233,4.321479,-100.29239,-264.013,-302.2057,5.583102,1.7451209,-1.6191995,76.45695,630000
68
+ 0.6577365,260.09106,0.0038312715,-6.1529745e-06,-12.501606,0.15839955,-260.04318,260.24945,1.4178619,3.2587967,-100.235535,-260.98965,-302.4148,4.6766586,0.39655346,-0.5491807,53.628735,635000
69
+ 0.6700688,268.87476,0.003883549,0.00234819,-11.8953495,0.18461484,-268.82855,269.0617,1.1848578,3.9269264,-100.01316,-269.59918,-301.99252,5.111784,0.46776035,-0.67345107,69.65006,640000
70
+ 0.65309066,269.66605,0.003724765,-0.0017996007,-12.983145,0.15907419,-269.61768,269.82333,1.5884018,3.777932,-100.12485,-270.18335,-302.00684,5.366334,0.60908407,-1.0054773,75.394,645000
71
+ 0.6717532,261.4618,0.003846463,0.0025412366,-11.839332,0.20071773,-261.41626,261.66504,1.7431504,4.34383,-100.190674,-262.33652,-302.53864,6.0869803,2.78162,-3.225754,124.33297,650000
72
+ 0.6478329,264.19235,0.003449955,-0.007653522,-14.718441,0.20461264,-264.14154,264.3893,1.8761996,7.228372,-100.10977,-265.2072,-302.20554,9.104571,15.650413,-13.379855,215.76414,655000
73
+ 0.66276234,262.77087,0.0038403694,0.0010509067,-12.226353,0.19775373,-262.72394,262.96967,1.4154332,2.8792424,-100.12799,-263.7201,-302.15994,4.294676,0.5230831,-0.45698956,57.531548,660000
74
+ 0.673046,266.46994,0.0035680756,0.0061245416,-10.783517,0.18588938,-266.43146,266.66196,1.2429913,2.6485069,-100.24523,-267.0508,-301.90643,3.891498,0.4945835,-0.39271468,50.217983,665000
75
+ 0.6615302,256.74652,0.0037284896,0.004400824,-11.319676,0.16876785,-256.7043,256.91968,1.0291542,2.939411,-100.11955,-257.5023,-302.0246,3.968565,0.41417027,-0.3583135,55.739975,670000
76
+ 0.6532685,266.57483,0.0033182437,-0.004133286,-13.745625,0.18946446,-266.5292,266.76016,1.1749461,5.2627926,-100.218666,-267.42892,-302.9529,6.4377384,0.7964609,-0.8140777,69.743576,675000
77
+ 0.6565495,263.26398,0.0035770142,0.0032024698,-11.604709,0.1627447,-263.22244,263.42993,1.4942058,3.711966,-100.18405,-263.49005,-302.05035,5.206172,0.8732362,-0.87778324,76.87399,680000
78
+ 0.6600427,263.501,0.0036110338,-0.0024038996,-13.1657095,0.16628553,-263.45346,263.6649,1.2756698,4.0623016,-50.259544,-264.46854,-301.8646,5.3379717,0.62308896,-0.61528486,65.7741,685000
79
+ 0.66865796,257.74567,0.003502779,0.0018667607,-11.967063,0.17443812,-257.70374,257.92197,1.6178454,3.7766304,-31.697088,-258.31744,-302.07504,5.394476,0.49879992,-0.67956144,69.986824,690000
80
+ 0.6696111,262.90567,0.003632642,0.006835728,-10.618249,0.21033913,-262.86713,263.12283,1.3923894,3.4323761,-100.237755,-263.46616,-302.2734,4.8247657,0.2850576,-0.45422623,51.704697,695000
81
+ 0.66222656,260.01004,0.0036959443,0.0037166663,-11.494393,0.20123854,-259.96756,260.215,1.2576951,12.44988,-99.85627,-260.95712,-302.15225,13.707575,3.019903,-3.0100858,127.7622,700000
82
+ 0.66531414,262.53827,0.0035852825,0.0025055222,-11.801165,0.20209739,-262.49597,262.74286,1.9200596,3.3711026,-100.15275,-263.05283,-301.94092,5.291162,1.8057503,-1.535044,84.04935,705000
83
+ 0.6584493,261.78687,0.0034739592,-0.0045052213,-13.796855,0.16334984,-261.73892,261.9457,1.2744713,28.870161,-100.22894,-263.23093,-302.1383,30.144632,20.974653,-20.883453,299.75348,710000
84
+ 0.66262233,254.60959,0.0034021582,0.004929235,-11.051145,0.16009328,-254.57199,254.77461,1.2509406,3.7539108,-100.121605,-255.17847,-302.4758,5.0048513,0.40442216,-0.7871465,67.241295,715000
85
+ 0.6517007,261.7128,0.0036070463,-0.0033503987,-13.428848,0.16414309,-261.66437,261.8736,1.9920692,4.3916855,-100.11076,-262.49207,-302.07498,6.3837547,0.8083738,-0.8489048,58.98429,720000
86
+ 0.6474212,263.58276,0.0033819464,-0.003164095,-13.435584,0.15454565,-263.53735,263.73413,1.2325003,3.0588224,-100.11535,-264.26364,-302.05518,4.2913227,0.29472327,-0.4612715,50.442387,725000
87
+ 0.6436142,260.04553,0.0033952964,-0.0065441867,-14.427427,0.19214118,-259.99652,260.23114,2.7593307,5.1528487,-99.57826,-261.02292,-302.1291,7.9121795,0.83469707,-0.33383918,71.27556,730000
88
+ 0.6746609,257.17844,0.0034371035,0.004006143,-11.334442,0.17089164,-257.13947,257.35333,4.069108,4.227159,-100.27334,-258.1258,-302.1013,8.296267,1.119619,-0.79359937,91.947624,735000
89
+ 0.6700413,256.0669,0.0035705795,0.0046678684,-11.192686,0.14165911,-256.02692,256.21323,1.4213337,3.4553406,-100.06731,-257.00772,-302.11258,4.876674,0.432797,-0.45332974,62.67444,740000
90
+ 0.68431264,251.86797,0.003563524,0.014129835,-8.53487,0.13558123,-251.83755,252.01767,1.5472517,2.9611473,-100.176186,-252.56754,-302.01523,4.508399,0.4273402,-0.37009326,59.63759,745000
91
+ 0.6655863,256.9035,0.0033707395,0.0018539942,-11.949974,0.15463006,-256.86322,257.06,1.075502,4.4876094,-100.16642,-257.95114,-302.00955,5.5631113,0.9555393,-0.6841232,77.739655,750000
92
+ 0.66330856,259.95612,0.0035073333,0.0029457759,-11.6601095,0.17538422,-259.91522,260.13446,1.2554436,2.6410832,-100.21567,-260.68698,-302.0484,3.8965268,0.35901296,-0.435489,45.461594,755000
93
+ 0.669992,250.04152,0.0032469798,0.010592469,-9.237747,0.19422531,-250.01152,250.24634,1.348582,2.748563,-100.136375,-250.78398,-302.17624,4.097145,0.77668947,-0.6943876,58.133446,760000
94
+ 0.6635854,254.49225,0.0032146266,0.0011428128,-12.144496,0.16553992,-254.4532,254.65894,1.1819588,4.9225807,-100.14366,-254.93916,-302.09302,6.1045394,0.47048792,-0.49590516,57.92588,765000
95
+ 0.65675557,258.2877,0.003353339,0.00054009625,-12.338938,0.17159548,-258.24634,258.45984,1.316704,2.4983788,-100.12609,-259.01498,-301.975,3.8150828,0.37134,-0.37199786,44.282623,770000
96
+ 0.66738516,253.31973,0.003659861,-0.0017879246,-12.988523,0.1612143,-253.27219,253.47916,1.4221287,3.2504203,-100.124,-254.3189,-302.31592,4.6725492,0.568604,-0.523463,50.58736,775000
97
+ 0.6629232,262.2678,0.003291636,-0.00048047182,-12.6459675,0.19522619,-262.2262,262.46252,1.0030549,5.3783045,-100.23964,-263.74985,-302.21945,6.381359,1.0184851,-0.95021826,95.31219,780000
98
+ 0.6459732,261.67358,0.0034862692,-0.0068414197,-14.46239,0.17689551,-261.62314,261.84366,1.4791747,4.019632,-100.181076,-262.70245,-301.9297,5.4988065,0.42879802,-0.34685728,60.657513,785000
99
+ 0.64579916,254.8952,0.0034330771,-0.007193463,-14.59534,0.16531593,-254.84511,255.05333,1.4095088,3.878299,-100.18207,-255.56998,-302.00046,5.287808,0.5303389,-0.3950243,59.403805,790000
100
+ 0.66523343,253.30927,0.0034016096,7.293872e-05,-12.478558,0.1557012,-253.26683,253.46504,1.1992292,3.4699268,-100.10741,-254.2585,-301.77847,4.669156,0.38036108,-0.41586685,53.08068,795000
101
+ 0.655725,261.06848,0.003257073,-0.005820258,-14.28696,0.16168444,-261.02197,261.22433,1.338032,5.0318007,-84.66507,-262.04492,-302.03687,6.369833,1.1686889,-0.7713798,71.26152,800000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
2
+ 0.6644302,287.8457,0.004301978,-0.0013610249,-12.816372,0.16198651,-287.7906,288.00632,8.001165,10.007518,-108.30868,-288.85437,-303.09412,18.008682,4.098134,-4.5296106,256.24353,305000
3
+ 0.669014,285.04434,0.0044764197,0.0008986983,-12.299237,0.19769819,-284.98932,285.24292,2.5018673,6.8204665,-158.03436,-285.81882,-302.53674,9.322334,0.5658894,-0.96999526,94.73556,310000
4
+ 0.6571826,281.06274,0.0042703114,0.0008337927,-12.304747,0.1729198,-281.0102,281.23648,4.428573,13.595145,-107.44074,-282.02234,-302.79538,18.023718,6.5452075,-6.394309,259.48553,315000
5
+ 0.6490956,287.14832,0.004355761,-0.00081868254,-12.687954,0.18398614,-287.09302,287.33148,2.8152614,6.1822915,-173.55641,-288.85425,-302.85696,8.997553,1.2361869,-1.0007355,124.54308,320000
6
+ 0.6456623,284.20053,0.0042796414,-0.01512543,-16.034275,0.21283051,-284.1319,284.39822,2.343795,5.308229,-106.823845,-285.45068,-302.7311,7.6520243,0.69752705,-0.5811456,88.27592,325000
7
+ 0.6692465,284.2591,0.004191262,0.008407374,-10.494071,0.20007658,-284.2151,284.46756,1.5856186,5.480632,2.2329502,-284.99323,-302.72598,7.0662503,2.464924,-2.4509728,93.22647,330000
8
+ 0.6680937,287.7744,0.004306559,0.0050009303,-11.338764,0.17685218,-287.72556,287.95627,1.6979821,7.003452,-103.10716,-288.69296,-302.6692,8.701434,0.6177458,-0.57384676,88.99411,335000
9
+ 0.6727923,283.28986,0.004692932,0.014388341,-9.43404,0.18402806,-283.24557,283.48825,2.012737,3.614269,-100.91894,-284.1826,-302.71667,5.627006,0.8767326,-1.0045528,80.76254,340000
10
+ 0.66874313,283.97925,0.0043335566,0.0040230346,-11.571655,0.18635349,-283.92908,284.16962,1.9605721,5.972544,-100.83468,-284.88223,-303.20203,7.9331164,1.7814046,-0.8960423,108.84259,345000
11
+ 0.662225,282.29016,0.004123468,0.0031395229,-11.738621,0.19507983,-282.24176,282.48837,1.3459777,4.350292,-100.40695,-283.35104,-302.7905,5.69627,0.67335373,-0.53554124,75.93465,350000
12
+ 0.65680236,282.80157,0.0044184527,0.00011928326,-12.473003,0.19026282,-282.74646,282.99197,2.0741482,7.7435327,-100.757645,-283.8674,-303.05832,9.81768,0.81936425,-1.6414585,96.99141,355000
13
+ 0.6625112,282.81732,0.004552278,0.003535646,-11.723324,0.21912019,-282.76395,283.03998,1.7698987,5.650407,-102.03703,-283.4048,-302.69366,7.4203053,1.0559391,-0.8942263,92.79312,360000
14
+ 0.66274655,283.7535,0.004277591,0.0041669407,-11.525867,0.18087336,-283.70422,283.93857,1.5166241,3.9052784,-100.69106,-284.83517,-303.09534,5.4219027,0.69302154,-0.6310374,72.50021,365000
15
+ 0.65287185,276.27982,0.004554521,0.0019007329,-12.082671,0.18424967,-276.2248,276.46594,1.6134278,4.6983204,-101.012054,-277.2858,-302.72998,6.311748,0.72091556,-0.47588557,76.53245,370000
16
+ 0.644207,275.3484,0.004359532,-0.015020308,-15.9453945,0.21017215,-275.27887,275.54355,2.5729294,6.452949,-37.602314,-277.15982,-302.77444,9.025879,1.3512064,-1.4069008,116.32476,375000
17
+ 0.6349845,276.985,0.0042854883,-0.01621786,-16.284367,0.18621714,-276.91522,277.155,2.679957,4.933501,-100.61954,-278.13116,-302.4467,7.6134577,1.0171608,-1.0772505,82.52959,380000
18
+ 0.6523465,279.07056,0.0043897163,-0.00943801,-14.650027,0.18695939,-279.00626,279.24808,2.1781363,6.59966,-67.12562,-279.9166,-302.6114,8.777796,1.0517906,-2.068527,123.032684,385000
19
+ 0.6476531,280.09946,0.0044805435,-0.0058048554,-13.795569,0.17369725,-280.03766,280.26736,2.1712122,5.6169953,-100.28506,-281.108,-302.5187,7.7882075,0.6982482,-0.9801612,91.471634,390000
20
+ 0.654013,279.575,0.0044190786,0.0040249852,-11.58918,0.18384722,-279.5238,279.76288,1.7756637,4.599647,-100.51435,-280.50818,-303.49994,6.375311,0.7141902,-0.7056673,74.72863,395000
21
+ 0.6381815,276.80457,0.0040838025,-0.014336305,-16.010529,0.16644864,-276.7392,276.95667,1.8178848,7.81055,-87.03934,-277.8911,-302.5544,9.628435,1.6649102,-1.998895,105.31186,400000
22
+ 0.6605147,280.26273,0.0042364174,0.0019830733,-12.0318985,0.20053121,-280.21176,280.46524,1.7050847,5.1348224,-100.46689,-281.1069,-302.83203,6.839907,0.65522087,-0.6160283,78.406555,405000
23
+ 0.64635277,279.9599,0.004161377,-0.011098709,-15.167076,0.19476625,-279.89676,280.14355,17.680342,6.6968055,-45.13941,-280.883,-302.6795,24.377148,1.8115996,-1.3298532,134.22011,410000
24
+ 0.6451673,276.6292,0.0040364903,-0.008576957,-14.624855,0.2063176,-276.57016,276.82697,1.5537825,13.052439,-100.550545,-277.77258,-302.7233,14.606221,4.8850656,-4.919883,174.38593,415000
25
+ 0.6494969,273.31052,0.0041016284,0.0005039767,-12.377128,0.1777437,-273.25977,273.48877,1.4975628,5.3284984,-100.35958,-274.17596,-302.47562,6.8260612,0.68214244,-0.6576895,75.86508,420000
26
+ 0.66763616,280.3579,0.0040141484,0.007210281,-10.703783,0.19056647,-280.31497,280.55566,1.2604564,4.6342573,-87.381096,-281.40952,-302.6503,5.894714,2.3723512,-0.5575035,86.777435,425000
27
+ 0.6605937,277.74777,0.0041731643,-0.0023355887,-13.059669,0.2047035,-277.69327,277.95013,3.4085443,5.5912046,-100.472404,-279.09445,-302.95157,8.999749,5.23813,-5.455099,175.68408,430000
28
+ 0.65392745,278.68732,0.0038837008,-0.00025921315,-12.566744,0.168918,-278.6385,278.856,2.2438924,5.9817033,-100.37773,-279.638,-302.6359,8.225595,2.160954,-0.8957074,93.15115,435000
29
+ 0.66499525,274.94727,0.0040012947,0.0018859672,-12.028661,0.20882758,-274.89914,275.158,1.5758051,5.0442686,-100.384575,-275.6686,-302.57257,6.620074,0.6256214,-0.42625925,67.98132,440000
30
+ 0.65481436,272.33228,0.003872646,0.0035685443,-11.578526,0.19697094,-272.28748,272.5328,3.5737865,6.2261424,-100.29901,-273.4665,-302.76025,9.799929,12.808319,-10.697351,276.96747,445000
31
+ 0.65546554,278.28687,0.004019086,-0.0007593394,-12.688933,0.16655791,-278.2359,278.45267,1.5980083,3.8631642,-100.41003,-278.92905,-302.43604,5.4611726,0.7026018,-0.4638818,61.097366,450000
32
+ 0.6530008,276.0895,0.004059205,-0.0008696637,-12.714245,0.17226967,-276.0379,276.26093,1.6492262,4.7996707,-100.23153,-276.6734,-302.263,6.448897,2.778954,-2.1379287,104.44095,455000
33
+ 0.6554821,270.7886,0.004188647,-0.0010720481,-12.755941,0.20318736,-270.7352,270.99072,1.4621271,4.5579104,-100.2724,-271.70786,-302.70422,6.0200377,0.69879264,-0.6608154,71.084145,460000
34
+ 0.6596234,272.28433,0.0042293207,0.00020159713,-12.452333,0.18037684,-272.2317,272.46494,1.481711,4.0395947,-100.382126,-273.58005,-302.6132,5.5213056,0.79350924,-0.6443036,77.29178,465000
35
+ 0.6597553,271.3466,0.003791467,0.0042950646,-11.367176,0.19965884,-271.30347,271.55054,6.704764,8.09662,-100.35994,-272.56296,-302.63586,14.801384,3.584199,-4.219602,160.16846,470000
36
+ 0.65404415,272.3339,0.003939522,-0.0019079355,-12.984306,0.19806805,-272.2827,272.53003,2.508462,4.109176,-100.28566,-273.24667,-302.7701,6.617638,0.6730824,-0.44346315,71.69325,475000
37
+ 0.6443356,272.5381,0.004073699,-0.009242656,-14.768861,0.19652185,-272.4779,272.72537,2.0353892,4.711815,-100.127144,-273.27554,-303.6413,6.747204,1.8147693,-2.4370422,99.715706,480000
38
+ 0.65857786,269.04218,0.0039341175,0.0023757946,-11.896105,0.16081099,-268.99536,269.20535,1.8709191,3.9811037,-100.32084,-269.6927,-302.7424,5.8520226,0.60452056,-0.4251092,64.4144,485000
39
+ 0.6573267,268.54608,0.0039117783,0.00030795048,-12.421276,0.1734781,-268.4975,268.71988,1.3003157,5.4634376,-100.13655,-269.3789,-302.34528,6.7637534,1.0261009,-0.73550916,69.89128,490000
40
+ 0.64508665,275.90652,0.0038667505,-0.002922797,-13.255879,0.18168011,-275.85526,276.08527,1.4121122,4.0830064,-100.23735,-276.85333,-302.30975,5.4951186,0.9995203,-0.7321601,73.63788,495000
41
+ 0.65551853,268.85327,0.004202587,-0.008610755,-14.548918,0.17566916,-268.7921,269.02032,3.322596,10.674686,-100.21806,-269.29572,-302.84332,13.997282,1.5054824,-1.5703661,131.9115,500000
42
+ 0.6427433,268.26453,0.0038748495,-0.010073147,-15.099623,0.19395903,-268.20602,268.44843,2.2759125,4.583321,-100.22445,-268.8059,-302.29855,6.859234,0.69423974,-0.88444555,93.4533,505000
43
+ 0.6571682,271.0443,0.0040199105,0.0070433007,-10.747896,0.21194865,-271.0011,271.2633,1.5017874,4.3578935,-99.52925,-271.89786,-302.4765,5.859681,0.7393448,-0.54491407,76.837074,510000
44
+ 0.6587528,267.78476,0.0039496333,0.004225918,-11.430048,0.16876166,-267.73962,267.95773,1.200001,2.9682362,-100.31598,-268.7687,-302.72293,4.168237,0.64519405,-0.82751095,61.47215,515000
45
+ 0.65593934,272.69125,0.0038750123,0.00035068076,-12.409502,0.18954614,-272.64316,272.88113,1.1828362,3.6375356,-100.33802,-273.47617,-302.5813,4.8203716,0.4260553,-0.4827187,67.59282,520000
46
+ 0.6568121,273.8451,0.0038406441,0.0018908884,-12.007664,0.17333534,-273.79895,274.02032,1.2490805,3.3988464,-100.20055,-274.90918,-302.368,4.647927,0.5365727,-0.40816203,59.02067,525000
47
+ 0.6500991,274.06863,0.0039715273,-0.008600781,-14.66561,0.1958934,-274.01038,274.25592,1.9873003,5.445539,-98.17235,-275.61444,-302.3528,7.4328394,3.7452836,-4.854759,143.24277,530000
48
+ 0.67411834,270.74377,0.0040188543,0.012923867,-9.284191,0.23322387,-270.70648,270.9899,1.3411597,5.6793184,-33.86404,-271.3967,-302.20087,7.0204782,0.84348214,-0.63969225,73.10893,535000
49
+ 0.65211546,273.46133,0.0040447,-0.004379292,-13.582724,0.16345622,-273.40643,273.6204,7.947208,17.57704,-100.43764,-274.84146,-302.58685,25.524248,6.8441515,-5.3247223,265.4073,540000
50
+ 0.6679531,264.74036,0.003797679,0.010362425,-9.771379,0.18761022,-264.70325,264.93835,1.2662568,5.8906693,-100.06622,-265.27158,-302.4461,7.156926,3.9169266,-4.6824527,139.70099,545000
51
+ 0.6800357,274.62732,0.003876801,0.010078472,-9.900312,0.15891287,-274.58893,274.7963,1.3751003,3.5062625,-100.19342,-275.72073,-302.6781,4.881363,0.71664006,-0.49707633,62.339462,550000
52
+ 0.66053504,268.6845,0.0038398895,0.0070922105,-10.653017,0.1911758,-268.64362,268.88275,1.4140915,3.830838,-97.96146,-269.43677,-302.55444,5.2449293,1.2219263,-0.9967634,68.86004,555000
53
+ 0.66772884,267.34796,0.00404272,0.008648295,-10.360773,0.18598686,-267.3061,267.54257,1.4683155,5.016164,-100.20284,-268.07144,-302.24536,6.4844794,2.213316,-1.7816901,101.025055,560000
54
+ 0.65750456,268.48126,0.0039412277,0.0060885507,-10.955164,0.18179497,-268.43808,268.66916,1.2141771,7.4797683,-100.18381,-269.7825,-302.57443,8.693945,2.9628515,-3.7657597,153.93706,565000
55
+ 0.6553488,272.4113,0.004336389,-0.0086391475,-14.492245,0.16905552,-272.34845,272.57172,1.591072,5.9920764,-38.81717,-273.2822,-302.1164,7.5831485,2.0837677,-1.8157223,89.32085,570000
56
+ 0.66209334,265.23227,0.003963708,0.005093901,-11.214865,0.20234497,-265.1878,265.4397,1.669854,6.014098,-42.50181,-266.38013,-302.71277,7.6839523,0.64316297,-0.58341014,76.3264,575000
57
+ 0.66747314,265.31818,0.0037663234,0.0017377925,-12.038597,0.17254105,-265.27286,265.49246,1.0499634,2.3537674,-100.1745,-266.13474,-302.2984,3.4037309,0.45182693,-0.33286244,44.759933,580000
58
+ 0.649006,270.77295,0.0035283635,-0.0034338837,-13.473223,0.16599843,-270.7254,270.9355,1.2050089,10.894768,-100.21717,-271.6336,-302.88657,12.099776,1.231109,-0.9039874,105.517,585000
59
+ 0.6528696,264.6501,0.0038359056,-0.004105354,-13.570244,0.16549526,-264.59802,264.81146,1.2072431,3.6726937,-100.35389,-265.76242,-302.2865,4.8799367,0.5456162,-0.3511809,57.99547,590000
60
+ 0.6617504,271.2904,0.0037523787,0.0026927923,-11.782377,0.18054736,-271.2462,271.47363,0.92026776,3.2275212,-100.365685,-272.2999,-302.5638,4.147789,0.66860366,-0.4718945,56.707996,595000
61
+ 0.659523,266.08838,0.0035880085,0.0045060376,-11.24414,0.18162605,-266.04803,266.27454,1.1805038,3.5469193,-100.23354,-266.89136,-302.09723,4.727423,0.51158184,-0.75029886,67.283554,600000
62
+ 0.6771019,265.48233,0.003541884,0.009156585,-9.91477,0.17284378,-265.4472,265.66434,1.1025395,5.048964,-100.29571,-266.24423,-302.31107,6.1515036,1.9376183,-1.858375,64.21513,605000
63
+ 0.64834964,263.59625,0.0036061932,-0.006125565,-14.198624,0.17041332,-263.54504,263.76053,1.1674837,3.0481842,-92.88444,-264.3798,-302.31848,4.2156677,0.41323245,-0.41355324,51.28817,610000
64
+ 0.66491616,259.6806,0.0038658269,0.0033103533,-11.643688,0.16935983,-259.6356,259.85327,2.1344888,4.4233394,-100.19764,-260.55853,-302.2452,6.557828,0.6677824,-0.76642835,71.79792,615000
65
+ 0.65818435,255.5948,0.003945643,0.011605198,-9.558731,0.15347782,-255.55707,255.75989,1.1583645,3.3778894,-100.22854,-256.32275,-302.00275,4.536254,0.40150627,-0.3952595,49.97339,620000
66
+ 0.6453615,267.089,0.0038598739,-0.004301594,-13.614439,0.1539142,-267.03644,267.2386,1.5865153,3.7322907,-100.22377,-268.267,-302.0116,5.318806,0.5008452,-0.50049746,59.186512,625000
67
+ 0.6614549,262.7303,0.0038760304,0.0016772699,-12.067271,0.14656617,-262.6835,262.87854,1.2616233,4.321479,-100.29239,-264.013,-302.2057,5.583102,1.7451209,-1.6191995,76.45695,630000
68
+ 0.6577365,260.09106,0.0038312715,-6.1529745e-06,-12.501606,0.15839955,-260.04318,260.24945,1.4178619,3.2587967,-100.235535,-260.98965,-302.4148,4.6766586,0.39655346,-0.5491807,53.628735,635000
69
+ 0.6700688,268.87476,0.003883549,0.00234819,-11.8953495,0.18461484,-268.82855,269.0617,1.1848578,3.9269264,-100.01316,-269.59918,-301.99252,5.111784,0.46776035,-0.67345107,69.65006,640000
70
+ 0.65309066,269.66605,0.003724765,-0.0017996007,-12.983145,0.15907419,-269.61768,269.82333,1.5884018,3.777932,-100.12485,-270.18335,-302.00684,5.366334,0.60908407,-1.0054773,75.394,645000
71
+ 0.6717532,261.4618,0.003846463,0.0025412366,-11.839332,0.20071773,-261.41626,261.66504,1.7431504,4.34383,-100.190674,-262.33652,-302.53864,6.0869803,2.78162,-3.225754,124.33297,650000
72
+ 0.6478329,264.19235,0.003449955,-0.007653522,-14.718441,0.20461264,-264.14154,264.3893,1.8761996,7.228372,-100.10977,-265.2072,-302.20554,9.104571,15.650413,-13.379855,215.76414,655000
73
+ 0.66276234,262.77087,0.0038403694,0.0010509067,-12.226353,0.19775373,-262.72394,262.96967,1.4154332,2.8792424,-100.12799,-263.7201,-302.15994,4.294676,0.5230831,-0.45698956,57.531548,660000
74
+ 0.673046,266.46994,0.0035680756,0.0061245416,-10.783517,0.18588938,-266.43146,266.66196,1.2429913,2.6485069,-100.24523,-267.0508,-301.90643,3.891498,0.4945835,-0.39271468,50.217983,665000
75
+ 0.6615302,256.74652,0.0037284896,0.004400824,-11.319676,0.16876785,-256.7043,256.91968,1.0291542,2.939411,-100.11955,-257.5023,-302.0246,3.968565,0.41417027,-0.3583135,55.739975,670000
76
+ 0.6532685,266.57483,0.0033182437,-0.004133286,-13.745625,0.18946446,-266.5292,266.76016,1.1749461,5.2627926,-100.218666,-267.42892,-302.9529,6.4377384,0.7964609,-0.8140777,69.743576,675000
77
+ 0.6565495,263.26398,0.0035770142,0.0032024698,-11.604709,0.1627447,-263.22244,263.42993,1.4942058,3.711966,-100.18405,-263.49005,-302.05035,5.206172,0.8732362,-0.87778324,76.87399,680000
78
+ 0.6600427,263.501,0.0036110338,-0.0024038996,-13.1657095,0.16628553,-263.45346,263.6649,1.2756698,4.0623016,-50.259544,-264.46854,-301.8646,5.3379717,0.62308896,-0.61528486,65.7741,685000
79
+ 0.66865796,257.74567,0.003502779,0.0018667607,-11.967063,0.17443812,-257.70374,257.92197,1.6178454,3.7766304,-31.697088,-258.31744,-302.07504,5.394476,0.49879992,-0.67956144,69.986824,690000
80
+ 0.6696111,262.90567,0.003632642,0.006835728,-10.618249,0.21033913,-262.86713,263.12283,1.3923894,3.4323761,-100.237755,-263.46616,-302.2734,4.8247657,0.2850576,-0.45422623,51.704697,695000
81
+ 0.66222656,260.01004,0.0036959443,0.0037166663,-11.494393,0.20123854,-259.96756,260.215,1.2576951,12.44988,-99.85627,-260.95712,-302.15225,13.707575,3.019903,-3.0100858,127.7622,700000
82
+ 0.66531414,262.53827,0.0035852825,0.0025055222,-11.801165,0.20209739,-262.49597,262.74286,1.9200596,3.3711026,-100.15275,-263.05283,-301.94092,5.291162,1.8057503,-1.535044,84.04935,705000
83
+ 0.6584493,261.78687,0.0034739592,-0.0045052213,-13.796855,0.16334984,-261.73892,261.9457,1.2744713,28.870161,-100.22894,-263.23093,-302.1383,30.144632,20.974653,-20.883453,299.75348,710000
84
+ 0.66262233,254.60959,0.0034021582,0.004929235,-11.051145,0.16009328,-254.57199,254.77461,1.2509406,3.7539108,-100.121605,-255.17847,-302.4758,5.0048513,0.40442216,-0.7871465,67.241295,715000
85
+ 0.6517007,261.7128,0.0036070463,-0.0033503987,-13.428848,0.16414309,-261.66437,261.8736,1.9920692,4.3916855,-100.11076,-262.49207,-302.07498,6.3837547,0.8083738,-0.8489048,58.98429,720000
86
+ 0.6474212,263.58276,0.0033819464,-0.003164095,-13.435584,0.15454565,-263.53735,263.73413,1.2325003,3.0588224,-100.11535,-264.26364,-302.05518,4.2913227,0.29472327,-0.4612715,50.442387,725000
87
+ 0.6436142,260.04553,0.0033952964,-0.0065441867,-14.427427,0.19214118,-259.99652,260.23114,2.7593307,5.1528487,-99.57826,-261.02292,-302.1291,7.9121795,0.83469707,-0.33383918,71.27556,730000
88
+ 0.6746609,257.17844,0.0034371035,0.004006143,-11.334442,0.17089164,-257.13947,257.35333,4.069108,4.227159,-100.27334,-258.1258,-302.1013,8.296267,1.119619,-0.79359937,91.947624,735000
89
+ 0.6700413,256.0669,0.0035705795,0.0046678684,-11.192686,0.14165911,-256.02692,256.21323,1.4213337,3.4553406,-100.06731,-257.00772,-302.11258,4.876674,0.432797,-0.45332974,62.67444,740000
90
+ 0.68431264,251.86797,0.003563524,0.014129835,-8.53487,0.13558123,-251.83755,252.01767,1.5472517,2.9611473,-100.176186,-252.56754,-302.01523,4.508399,0.4273402,-0.37009326,59.63759,745000
91
+ 0.6655863,256.9035,0.0033707395,0.0018539942,-11.949974,0.15463006,-256.86322,257.06,1.075502,4.4876094,-100.16642,-257.95114,-302.00955,5.5631113,0.9555393,-0.6841232,77.739655,750000
92
+ 0.66330856,259.95612,0.0035073333,0.0029457759,-11.6601095,0.17538422,-259.91522,260.13446,1.2554436,2.6410832,-100.21567,-260.68698,-302.0484,3.8965268,0.35901296,-0.435489,45.461594,755000
93
+ 0.669992,250.04152,0.0032469798,0.010592469,-9.237747,0.19422531,-250.01152,250.24634,1.348582,2.748563,-100.136375,-250.78398,-302.17624,4.097145,0.77668947,-0.6943876,58.133446,760000
94
+ 0.6635854,254.49225,0.0032146266,0.0011428128,-12.144496,0.16553992,-254.4532,254.65894,1.1819588,4.9225807,-100.14366,-254.93916,-302.09302,6.1045394,0.47048792,-0.49590516,57.92588,765000
95
+ 0.65675557,258.2877,0.003353339,0.00054009625,-12.338938,0.17159548,-258.24634,258.45984,1.316704,2.4983788,-100.12609,-259.01498,-301.975,3.8150828,0.37134,-0.37199786,44.282623,770000
96
+ 0.66738516,253.31973,0.003659861,-0.0017879246,-12.988523,0.1612143,-253.27219,253.47916,1.4221287,3.2504203,-100.124,-254.3189,-302.31592,4.6725492,0.568604,-0.523463,50.58736,775000
97
+ 0.6629232,262.2678,0.003291636,-0.00048047182,-12.6459675,0.19522619,-262.2262,262.46252,1.0030549,5.3783045,-100.23964,-263.74985,-302.21945,6.381359,1.0184851,-0.95021826,95.31219,780000
98
+ 0.6459732,261.67358,0.0034862692,-0.0068414197,-14.46239,0.17689551,-261.62314,261.84366,1.4791747,4.019632,-100.181076,-262.70245,-301.9297,5.4988065,0.42879802,-0.34685728,60.657513,785000
99
+ 0.64579916,254.8952,0.0034330771,-0.007193463,-14.59534,0.16531593,-254.84511,255.05333,1.4095088,3.878299,-100.18207,-255.56998,-302.00046,5.287808,0.5303389,-0.3950243,59.403805,790000
100
+ 0.66523343,253.30927,0.0034016096,7.293872e-05,-12.478558,0.1557012,-253.26683,253.46504,1.1992292,3.4699268,-100.10741,-254.2585,-301.77847,4.669156,0.38036108,-0.41586685,53.08068,795000
101
+ 0.655725,261.06848,0.003257073,-0.005820258,-14.28696,0.16168444,-261.02197,261.22433,1.338032,5.0318007,-84.66507,-262.04492,-302.03687,6.369833,1.1686889,-0.7713798,71.26152,800000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb31868aa1e031cf468ec24623836edd34ae4c32fd19b15b6547127da6e20c0b
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1186b7e1da56c70614ae5c0684ecc4a996fe126e4dcfe6bddbdba4bcbe6befb
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7afc0f79b6124208b1906bad51a8883944de566471351998fe4cad24b4597809
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1267031d0d70faefe292a33581e8523641470e1811a16538eb6b46447213d11
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73bca4bb74ba820af2b44c6904e62a975cbecb22a89fe3790f002694609a60cd
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2eec4db0f8cd53ce8a13c9bdd1b88e9c64db840a1048883994188e364610723
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b9ce878bf3621a028d0be9e5ebbd247b195f326d55c83dfc34891c5af48467c
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47eaa270e919fcf2d9d8394cad64ca4a86b725a9e93049c327a07e40577bdaf9
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c699e026ab05a78f2d53de2c4b90c5038d5e3fd245ea515938caf93c1503123
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02ee127678dbad8ddf4b433edcab9ddf81f38ab3de3faadc2752ff78faefd184
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260325_063539/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/iuu9h1bf