Tiredsheep commited on
Commit
b6b4e18
·
verified ·
1 Parent(s): 5ba144b

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_150000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_200000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_250000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_300000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_350000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_400000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_450000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_500000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_550000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_600000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.07773283159786294,0.0009216747102059366,-0.07752887891729623,0.0028048157640277694,3.255139646708428,50.10000000001527,0.0,25500.0,-1.0,-1000.0,1000.0,3.750422058105469,150000
3
+ 0.0,0.0,-0.22800557533898558,-7.04461748896905e-05,-0.22801241085406126,-1.2899934647831735e-05,0.5427820419982009,50.10000000001527,0.0,77500.0,-1.0,-1000.0,1000.0,3.9620846796035765,200000
4
+ 0.0,0.0,-0.20739193828404778,0.0010357626472615265,-0.20735590187589167,0.0007506099151562651,0.9544932304322317,50.10000000001527,0.0,129500.0,-1.0,-1000.0,1000.0,3.7882498788833616,250000
5
+ 0.0,0.0,-0.16478320196585783,-0.0034683228745744452,-0.16497681527284502,-0.0056486684239169275,0.9434895092212742,49.19300000001496,0.02,181427.44,-1.0,-989.98,981.86,3.797430491447449,300000
6
+ 0.0,0.0,-0.16835165200237087,-0.0002729646152745517,-0.16837773572784986,-0.00023432726487821552,-1.292564352682405,50.10000000001527,0.0,232593.0,-1.0,-1000.0,1000.0,4.127174863815307,350000
7
+ 0.0,0.0,-0.21965550814536547,-0.001743662189924377,-0.21976596411561644,-0.0016897428768377848,-1.5010870182669773,50.10000000001527,0.0,284593.0,-1.0,-1000.0,1000.0,4.079833035469055,400000
8
+ 0.0,0.0,-0.18506980925419017,-0.0007889984943714813,-0.1850936242764962,-0.0007640620728281242,-1.3722756638538094,50.10000000001527,0.0,336593.0,-1.0,-1000.0,1000.0,3.796735429763794,450000
9
+ 0.0,0.0,-0.20024215637693857,-0.0004497402422023376,-0.20027256781526867,-0.00041423022836397093,-0.7815875444667986,50.10000000001527,0.0,388593.0,-1.0,-1000.0,1000.0,4.118025612831116,500000
10
+ 0.0,0.0,-0.21145392911751026,-0.001428583079863914,-0.2115058566415812,-0.001456536016312525,-1.4286960023827497,50.10000000001527,0.0,440593.0,-1.0,-1000.0,1000.0,3.8438741064071653,550000
11
+ 0.0,0.0,-0.18585047638901322,-0.0015535621140722944,-0.1859107541823334,-0.0014644200594050346,-1.4187273590490423,50.10000000001527,0.0,492593.0,-1.0,-1000.0,1000.0,4.0853678369522095,600000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.07773283159786294,0.0009216747102059366,-0.07752887891729623,0.0028048157640277694,3.255139646708428,50.10000000001527,0.0,25500.0,-1.0,-1000.0,1000.0,3.750422058105469,150000
3
+ 0.0,0.0,-0.22800557533898558,-7.04461748896905e-05,-0.22801241085406126,-1.2899934647831735e-05,0.5427820419982009,50.10000000001527,0.0,77500.0,-1.0,-1000.0,1000.0,3.9620846796035765,200000
4
+ 0.0,0.0,-0.20739193828404778,0.0010357626472615265,-0.20735590187589167,0.0007506099151562651,0.9544932304322317,50.10000000001527,0.0,129500.0,-1.0,-1000.0,1000.0,3.7882498788833616,250000
5
+ 0.0,0.0,-0.16478320196585783,-0.0034683228745744452,-0.16497681527284502,-0.0056486684239169275,0.9434895092212742,49.19300000001496,0.02,181427.44,-1.0,-989.98,981.86,3.797430491447449,300000
6
+ 0.0,0.0,-0.16835165200237087,-0.0002729646152745517,-0.16837773572784986,-0.00023432726487821552,-1.292564352682405,50.10000000001527,0.0,232593.0,-1.0,-1000.0,1000.0,4.127174863815307,350000
7
+ 0.0,0.0,-0.21965550814536547,-0.001743662189924377,-0.21976596411561644,-0.0016897428768377848,-1.5010870182669773,50.10000000001527,0.0,284593.0,-1.0,-1000.0,1000.0,4.079833035469055,400000
8
+ 0.0,0.0,-0.18506980925419017,-0.0007889984943714813,-0.1850936242764962,-0.0007640620728281242,-1.3722756638538094,50.10000000001527,0.0,336593.0,-1.0,-1000.0,1000.0,3.796735429763794,450000
9
+ 0.0,0.0,-0.20024215637693857,-0.0004497402422023376,-0.20027256781526867,-0.00041423022836397093,-0.7815875444667986,50.10000000001527,0.0,388593.0,-1.0,-1000.0,1000.0,4.118025612831116,500000
10
+ 0.0,0.0,-0.21145392911751026,-0.001428583079863914,-0.2115058566415812,-0.001456536016312525,-1.4286960023827497,50.10000000001527,0.0,440593.0,-1.0,-1000.0,1000.0,3.8438741064071653,550000
11
+ 0.0,0.0,-0.18585047638901322,-0.0015535621140722944,-0.1859107541823334,-0.0014644200594050346,-1.4187273590490423,50.10000000001527,0.0,492593.0,-1.0,-1000.0,1000.0,4.0853678369522095,600000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
2
+ 0.68451923,293.98334,0.004215054,0.0046282164,-11.401979,0.20430833,-293.9353,294.1923,8.61393,25.79129,-120.61603,-294.26282,-307.31775,34.40522,5.2540226,-5.060202,393.57745,105000
3
+ 0.6664912,290.70602,0.0046371436,-0.008489391,-14.330737,0.197492,-290.63956,290.89502,5.013113,22.589014,-169.75346,-291.70996,-305.7043,27.602127,3.9411929,-5.9833426,326.2362,110000
4
+ 0.6737685,287.6887,0.0044078766,0.0020398856,-12.037218,0.20666528,-287.63562,287.8974,7.102314,25.196747,-113.6555,-287.85153,-306.3591,32.29906,6.815852,-6.1600866,407.57263,115000
5
+ 0.6718844,293.38538,0.004288726,0.0022887704,-11.966329,0.21459414,-293.33405,293.60226,4.4136996,11.819016,-181.89738,-294.0934,-304.90286,16.232716,3.626711,-3.0821896,286.95926,120000
6
+ 0.65428245,288.97845,0.004355067,-0.016249988,-16.231283,0.19001204,-288.90778,289.15222,5.14059,13.85441,-107.70928,-289.96884,-306.5796,18.995,3.698928,-3.1010113,224.71878,125000
7
+ 0.6907408,288.9909,0.0045750574,0.0123588145,-9.798654,0.20672882,-288.9461,289.21,3.6387048,14.658521,4.2862983,-289.10812,-305.74902,18.297226,4.1496353,-3.9220872,226.3634,130000
8
+ 0.6703889,292.08197,0.0046265484,-0.004213269,-13.410672,0.18716109,-292.01993,292.26492,3.3115585,7.1005297,-101.87245,-293.5209,-305.90848,10.412088,1.334328,-1.1911694,157.5768,135000
9
+ 0.66610444,287.25046,0.004556834,0.00470983,-11.466425,0.19062734,-287.19818,287.44577,3.6017377,6.1707683,-100.08451,-288.02393,-306.60336,9.772506,0.83226186,-0.8993608,113.91702,140000
10
+ 0.675869,288.59216,0.00464063,0.013250917,-9.644587,0.1905204,-288.54742,288.79593,5.51095,12.069573,-100.46694,-289.20197,-305.9452,17.580524,6.0347023,-6.004706,232.73694,145000
11
+ 0.6680993,286.18616,0.0042730775,-0.0008521981,-12.699434,0.20471343,-286.13184,286.39,2.78796,13.464238,-100.32881,-287.00558,-306.2396,16.252197,2.0013406,-2.17956,173.22699,150000
12
+ 0.6715216,286.87073,0.0047365464,-0.0058059935,-13.725786,0.19051635,-286.8057,287.05545,2.6988049,6.896187,-100.64366,-287.42056,-304.72647,9.594992,5.382665,-5.665446,179.83746,155000
13
+ 0.6671254,286.4673,0.004245301,0.0054082307,-11.226067,0.22228831,-286.41962,286.69498,3.5842488,6.6831675,-100.71774,-286.98907,-304.64276,10.267416,2.811478,-2.902136,158.75244,160000
14
+ 0.6781303,287.3279,0.0045389323,0.003620719,-11.702297,0.18457285,-287.27478,287.5161,2.0543249,7.3452773,-100.53266,-288.2166,-304.43292,9.399602,1.1019225,-2.0408275,117.167595,165000
15
+ 0.6573901,280.77863,0.0045718886,-0.002415692,-13.028379,0.2033413,-280.71906,280.97955,4.2643714,8.362673,-99.95689,-281.51517,-304.00513,12.627045,1.4380249,-1.6364849,144.34888,170000
16
+ 0.6497354,279.42328,0.0044190474,-0.013431877,-15.539541,0.21280237,-279.35464,279.62265,4.528965,9.813952,-42.049603,-280.848,-303.59167,14.342917,2.0279415,-2.1281364,193.70285,175000
17
+ 0.65134305,280.63416,0.0047699413,-0.007488661,-14.069969,0.1817931,-280.56705,280.80847,4.013481,9.317459,-100.84814,-281.5577,-303.74457,13.33094,4.431979,-4.6011686,223.049,180000
18
+ 0.6655947,283.35968,0.004696949,0.0022555098,-12.019793,0.17607799,-283.30322,283.53802,6.766423,16.835356,-72.148964,-283.8523,-303.50494,23.60178,3.632357,-6.7889514,318.7234,185000
19
+ 0.6349745,283.1961,0.004591602,-0.015801165,-15.9413185,0.19876814,-283.12292,283.37906,2.6018686,6.587053,-100.68098,-283.95624,-303.44083,9.188921,0.9927075,-1.0739177,112.39383,190000
20
+ 0.66981256,283.4567,0.004645815,-0.0022180397,-12.9774275,0.16931374,-283.39636,283.62378,4.4622335,9.366705,-100.50177,-284.42932,-306.06396,13.8289385,5.4966736,-2.433301,195.22653,195000
21
+ 0.6382584,280.38306,0.004144511,-0.010709961,-15.084131,0.18243904,-280.32056,280.55478,3.6834378,8.6417675,-100.41263,-281.379,-303.55994,12.325205,5.3457522,-5.8637404,170.8758,200000
22
+ 0.6657277,282.63913,0.0045498973,0.0028504592,-11.873511,0.20646295,-282.58508,282.84842,2.4107628,5.298977,-100.572426,-283.78427,-303.83258,7.7097397,0.95388204,-1.0594045,104.795715,205000
23
+ 0.6620062,283.28467,0.0045103584,-0.0053976453,-13.696722,0.20741685,-283.22287,283.4867,3.7311432,6.724145,-100.697426,-283.7058,-304.37314,10.455288,1.6010253,-0.8894999,132.09682,210000
24
+ 0.65642774,279.51703,0.004300823,-0.0055446285,-13.789202,0.18040115,-279.4577,279.69186,3.4798627,29.228643,-100.97223,-280.72983,-304.1224,32.708508,3.1732996,-3.195035,215.67845,215000
25
+ 0.65613544,275.7928,0.004515519,0.00045565324,-12.399092,0.1809637,-275.73682,275.9742,2.6306727,6.939186,-100.66823,-276.3704,-303.0552,9.569859,1.0368266,-0.8023071,106.97895,220000
26
+ 0.6728544,282.9552,0.0045306766,0.008741714,-10.57055,0.20210044,-282.90732,283.16602,2.231251,4.362925,-100.50309,-283.87277,-305.88812,6.5941763,0.7409519,-1.1349382,100.86598,225000
27
+ 0.6683748,280.78998,0.0045794556,-0.0033889709,-13.240038,0.19279812,-280.72937,280.9794,3.4110935,5.8313403,-100.64743,-281.72174,-303.58395,9.242434,2.8267136,-2.7897112,148.8169,230000
28
+ 0.6597693,281.06482,0.004272183,-0.0013453406,-12.814907,0.1842169,-281.01007,281.24768,3.6299736,13.969589,-100.8249,-281.4045,-303.58853,17.599564,1.0069147,-0.97952545,134.486,235000
29
+ 0.6695947,277.21915,0.0044925003,0.008298579,-10.652793,0.22515234,-277.17126,277.4526,4.136679,7.339206,-100.54731,-278.1678,-303.50122,11.475885,7.918346,-8.001877,208.47581,240000
30
+ 0.6538633,274.71268,0.004400906,-0.0038007684,-13.363633,0.19521847,-274.65387,274.90408,2.9407256,6.7453265,-100.455215,-275.6302,-303.27167,9.686052,1.7203066,-1.6504842,111.534325,245000
31
+ 0.6578575,280.63586,0.004306516,0.0027046083,-11.871973,0.20322004,-280.58472,280.8418,2.016702,5.3264565,-100.855125,-281.3919,-302.95084,7.3431587,4.2510114,-2.8743126,147.61621,250000
32
+ 0.6720497,277.4738,0.004528949,0.0028827512,-11.863483,0.17018196,-277.42004,277.64685,2.8924577,6.676891,-100.64984,-278.5212,-302.9243,9.569348,0.9179635,-0.97357893,103.63555,255000
33
+ 0.66854036,273.23895,0.004256538,0.0039268904,-11.577445,0.19259477,-273.18967,273.4355,2.6040218,9.133765,-100.49883,-274.07578,-303.4401,11.737787,0.9358999,-1.0847982,122.35719,260000
34
+ 0.6613903,274.36584,0.004028555,0.0039120675,-11.528915,0.19637986,-274.3194,274.56613,2.5180829,5.306285,-100.66111,-275.45166,-302.85785,7.8243675,1.1225915,-1.1349574,116.20146,265000
35
+ 0.66029286,273.8703,0.004433171,-0.0015998,-12.86087,0.20323831,-273.8133,274.07196,7.245473,10.597219,-100.36418,-274.73776,-303.07095,17.842693,5.6964917,-4.9104033,246.95653,270000
36
+ 0.6482542,274.31622,0.004108795,0.0010193775,-12.251904,0.20527336,-274.26587,274.5225,2.0742817,7.367837,-100.60472,-275.14087,-302.7074,9.442119,2.5282898,-2.7159488,127.72145,275000
37
+ 0.6597041,275.10065,0.0040816613,-0.000114293805,-12.528002,0.20006415,-275.04953,275.3006,2.068011,5.9473357,-100.37619,-276.2026,-304.5306,8.015347,5.112983,-6.832732,169.8475,280000
38
+ 0.6677756,271.6299,0.004193853,-0.00021519286,-12.5513115,0.19781375,-271.57727,271.8275,1.6568222,3.8411744,-100.51346,-272.08755,-302.8718,5.4979963,1.2215536,-1.3024983,89.15317,285000
39
+ 0.65976745,270.4936,0.004100183,-0.0011627644,-12.783588,0.18433033,-270.44116,270.67676,2.1886604,7.725998,-100.71729,-271.20178,-302.5945,9.914659,1.0844638,-1.2236246,105.463455,290000
40
+ 0.65960634,278.31415,0.0039842115,0.00069572934,-12.325378,0.18725109,-278.265,278.5021,1.8796847,4.661954,-100.57267,-278.8693,-302.68384,6.5416384,0.95619905,-0.8847669,85.41288,295000
41
+ 0.6599329,270.85397,0.004216248,-0.00109362,-12.759382,0.21784757,-270.80017,271.0707,3.1765423,11.988109,-100.4198,-271.38773,-304.3664,15.164651,5.3894196,-4.9390607,210.92844,300000
42
+ 0.64567715,269.56607,0.004222326,-0.0072350847,-14.213531,0.16086668,-269.50604,269.7197,1.8978827,4.760344,-100.51973,-270.08176,-303.1313,6.658227,1.4176608,-0.75859535,97.41152,305000
43
+ 0.6560849,273.22064,0.00393441,0.0003329429,-12.415377,0.18586269,-273.17178,273.40683,1.8375494,4.9716363,-100.08516,-274.1525,-303.42465,6.809186,0.6252449,-0.58951265,78.60679,310000
44
+ 0.6577029,269.73346,0.004189126,-8.976105e-05,-12.521427,0.16532847,-269.68103,269.89868,1.7167877,3.6434686,-100.46334,-270.6368,-303.2639,5.360256,0.46297807,-0.49564347,65.871346,315000
45
+ 0.6593379,273.85428,0.003908834,0.0021221435,-11.95709,0.18615955,-273.80753,274.04257,1.8063011,6.0722303,-100.40095,-274.6954,-303.16742,7.8785315,1.4955211,-1.5284106,93.95325,320000
46
+ 0.65785885,275.83673,0.0038910322,-0.00061753276,-12.658707,0.20111777,-275.78748,276.03723,1.672944,3.7476952,-100.45736,-276.59448,-302.97992,5.420639,0.47753397,-0.49360105,68.22826,325000
47
+ 0.6698183,276.1263,0.0039922427,-0.003559288,-13.391551,0.19342044,-276.07288,276.31616,2.3274605,5.4082446,-100.21273,-277.21484,-302.68057,7.7357054,0.9723817,-0.80500937,94.65053,330000
48
+ 0.66569716,272.54523,0.0040205005,0.005621855,-11.101703,0.19483946,-272.50058,272.74567,2.3991742,5.6730013,-36.752174,-273.46356,-302.66028,8.072176,0.5943003,-0.74300194,84.91491,335000
49
+ 0.6471759,275.0191,0.0040887557,-0.010069604,-14.962755,0.16455427,-274.95792,275.17358,10.494473,13.302347,-100.24765,-276.1551,-302.59515,23.796822,5.8674083,-4.6791883,170.15817,340000
50
+ 0.66667485,266.31665,0.0039652037,0.006164384,-10.94538,0.19398738,-266.27325,266.5168,1.2723359,5.591412,-100.295555,-266.78683,-302.73563,6.863748,1.3614144,-1.6400306,113.02138,345000
51
+ 0.67841774,276.90933,0.0039304798,0.008492002,-10.339449,0.19118927,-276.8687,277.109,1.8647327,4.250465,-100.40966,-277.59274,-304.21945,6.1151977,0.6850765,-0.72678417,81.964066,350000
52
+ 0.6497261,269.5616,0.003967053,-0.0048569855,-13.724331,0.1736053,-269.5072,269.73038,1.5876282,5.1157737,-100.502464,-270.44888,-302.73444,6.703402,1.0497494,-0.7462057,76.77505,355000
53
+ 0.66736066,268.97766,0.00395821,0.01413966,-8.927764,0.20399728,-268.94232,269.1958,4.561915,7.1822853,-100.46868,-269.78522,-303.59982,11.7442,0.8934831,-3.0045388,107.14699,360000
54
+ 0.65771663,269.98834,0.0039226175,-0.00090162415,-12.729853,0.16083995,-269.93842,270.14825,1.6294245,7.070563,-100.51358,-271.15344,-302.86667,8.699987,7.033176,-2.9473987,159.60751,365000
55
+ 0.6653325,274.75217,0.0041245143,-0.0032500783,-13.287991,0.18056744,-274.69736,274.9295,3.9107327,15.733594,-100.43659,-275.4692,-302.85837,19.644327,2.4299672,-2.79613,151.33267,370000
56
+ 0.6642539,266.6115,0.0040915236,-0.00019664424,-12.548061,0.18847454,-266.56015,266.7998,2.0304866,9.097063,-51.658092,-268.2601,-303.45563,11.12755,2.9823604,-3.4687304,167.4929,375000
57
+ 0.6748687,267.19022,0.0038476244,0.007849054,-10.460026,0.16590168,-267.14996,267.36395,1.1332228,3.366885,-100.55124,-268.11914,-302.71567,4.500108,0.4425672,-0.33690852,59.050903,380000
58
+ 0.65113336,271.90912,0.0039671496,-0.008543671,-14.6536045,0.17974496,-271.851,272.08032,1.7223713,4.4875803,-100.489,-272.8671,-302.89377,6.2099514,0.58376765,-0.57324445,75.50888,385000
59
+ 0.6560427,266.07416,0.0038806133,-0.0003673307,-12.594658,0.16777676,-266.02527,266.24158,1.8161602,5.1352806,-100.39454,-267.01874,-302.7291,6.951441,0.782713,-0.62384737,75.767746,390000
60
+ 0.6597192,272.55554,0.0039010996,0.0028020998,-11.781715,0.16661847,-272.50958,272.72498,1.3667477,3.5228863,-100.346085,-273.77838,-302.6089,4.889634,0.59984815,-0.550295,75.89462,395000
61
+ 0.6668584,267.29028,0.0036817214,0.005079087,-11.120459,0.15862839,-267.24933,267.45398,2.1448905,4.8165584,-100.17544,-267.87378,-302.60162,6.9614487,0.7769519,-1.0737119,94.71971,400000
62
+ 0.66693467,267.22937,0.0036424336,0.004723875,-11.203099,0.18740317,-267.18857,267.4215,1.2318159,3.8680942,-100.434265,-267.7701,-302.64264,5.0999103,0.6635179,-0.3770324,57.668232,405000
63
+ 0.66256905,265.29175,0.0035590257,0.0024014912,-11.825239,0.18866329,-265.24963,265.48282,1.9301949,4.0989823,-100.35318,-266.0905,-302.5925,6.029177,2.175365,-1.9823674,111.53575,410000
64
+ 0.66590106,260.9079,0.0038136372,0.00293987,-11.729116,0.18806663,-260.86316,261.0989,2.1116588,4.9312487,-100.30906,-261.70477,-303.49286,7.0429077,0.63569945,-0.5917638,74.79365,415000
65
+ 0.6547557,257.19592,0.0035813132,0.0034239176,-11.543949,0.15109244,-257.15454,257.35043,1.8327223,5.431681,-100.22818,-257.88254,-302.83374,7.2644033,4.2294197,-4.2095594,113.1483,420000
66
+ 0.6550953,269.07922,0.0038441767,-0.00039488217,-12.602722,0.18713096,-269.03076,269.26596,1.5472673,3.5903041,-100.41402,-270.26718,-302.55588,5.1375713,0.6697365,-0.65533626,70.6969,425000
67
+ 0.6617154,264.55463,0.0036031115,-0.0025399597,-13.204935,0.18797025,-264.50705,264.74005,1.5975531,5.0644383,-100.30801,-265.46118,-302.2158,6.6619916,1.0897309,-1.0215456,83.90999,430000
68
+ 0.67918974,261.80035,0.0037656464,0.012858917,-9.085203,0.17467204,-261.76617,261.98788,1.5609797,3.9593887,-100.42784,-262.74976,-302.55017,5.5203686,0.3749403,-0.43101916,67.10281,435000
69
+ 0.6610254,271.09827,0.0036392147,0.0053234883,-11.037188,0.20606509,-271.05807,271.30963,1.1009724,3.3793056,-100.42159,-271.95554,-302.79916,4.480278,0.40706867,-0.4043219,56.8023,440000
70
+ 0.64622223,270.71924,0.0035865668,-0.007326635,-14.542799,0.18937825,-270.66708,270.9013,1.583169,4.402729,-100.22965,-271.82144,-302.18585,5.985898,0.52071285,-0.3771574,68.14932,445000
71
+ 0.66553956,262.93646,0.0036322526,0.0030756039,-11.653252,0.15485878,-262.89417,263.0944,1.6846799,6.641065,-100.289314,-263.55573,-302.8689,8.325745,0.65142953,-0.6787297,81.82866,450000
72
+ 0.6544496,265.32275,0.003469738,-0.0004956882,-12.64286,0.17467663,-265.27887,265.49695,1.6914753,5.181705,-100.32149,-266.64224,-302.25452,6.8731804,0.5946399,-0.8987936,80.91699,455000
73
+ 0.661275,264.6247,0.0034403221,0.0034033624,-11.510743,0.199944,-264.58508,264.82806,2.6594207,5.0236216,-100.27758,-265.28134,-302.50952,7.6830425,1.3234826,-1.374464,98.816025,460000
74
+ 0.6691528,267.14932,0.0037049805,0.0031800526,-11.641682,0.1758295,-267.1062,267.32834,1.3890438,3.4824243,-100.34266,-268.08398,-302.36304,4.871468,0.53933835,-0.5151295,65.53829,465000
75
+ 0.6651159,257.7638,0.0037054275,0.006768373,-10.673389,0.17916575,-257.72424,257.94974,1.8000523,3.9009697,-100.333534,-258.51636,-302.29333,5.701022,0.45482826,-0.9027178,69.833244,470000
76
+ 0.6470896,267.89145,0.0037664545,-0.0040861797,-13.5848875,0.17886014,-267.84027,268.06622,1.2086172,3.6171665,-100.37444,-268.5765,-302.3025,4.8257837,0.44596443,-0.5893723,63.880737,475000
77
+ 0.66398215,264.41736,0.0036332346,0.0051661683,-11.07808,0.17725262,-264.3771,264.59976,1.313259,3.962143,-100.27923,-264.84796,-302.48904,5.275402,0.7113575,-0.7270033,72.45816,480000
78
+ 0.64862746,264.52533,0.0034179534,-0.006979307,-14.541955,0.16015942,-264.47565,264.6785,1.4047166,4.246804,-49.13206,-265.38412,-302.5549,5.6515207,0.39226666,-0.3512892,63.005272,485000
79
+ 0.67060804,258.71368,0.0037436234,0.008691588,-10.178295,0.17607416,-258.67557,258.89847,1.4046863,3.0822053,-100.35954,-259.63388,-302.05594,4.4868917,0.45084843,-0.47043863,62.72486,490000
80
+ 0.67268723,262.85504,0.0038914883,0.006823918,-10.74645,0.1733397,-262.81323,263.03522,2.0744379,6.509088,-100.31038,-263.66266,-302.66074,8.583526,4.872945,-3.3207226,145.63272,495000
81
+ 0.66265976,260.78113,0.0036554534,5.4045195e-05,-12.485215,0.15784723,-260.73547,260.93903,1.5869172,8.185119,-100.379074,-261.936,-302.51483,9.772036,1.5826226,-1.5574999,104.27873,500000
82
+ 0.6696322,263.16147,0.0037451177,0.0065610493,-10.748106,0.2037558,-263.12122,263.3718,2.3565044,3.804779,-100.31009,-263.91174,-302.35544,6.1612835,0.9989629,-0.78786004,89.67894,505000
83
+ 0.6598066,262.78113,0.0037632303,-0.0025056165,-13.165815,0.20673466,-262.73157,262.98535,1.5182848,5.4889116,-100.371086,-264.3733,-302.5626,7.0071964,0.79459846,-0.9425655,86.70977,510000
84
+ 0.6638613,255.15154,0.0034852421,0.0010051461,-12.211599,0.17222558,-255.10898,255.32477,1.3549465,3.783877,-100.31756,-256.06445,-302.64673,5.1388235,0.6954565,-0.40338624,64.308044,515000
85
+ 0.6645097,263.03864,0.003636254,-0.0010092136,-12.777542,0.17728382,-262.9922,263.2149,1.4959633,5.121807,-100.29835,-263.7994,-302.45508,6.61777,0.8594134,-0.5416299,67.083305,520000
86
+ 0.64552563,264.2447,0.0036034072,-0.009251364,-15.067393,0.16150019,-264.19037,264.39694,1.3065583,4.094031,-100.3187,-264.9648,-302.51474,5.400589,0.40394333,-0.36000612,59.201073,525000
87
+ 0.63946295,260.93713,0.0034755634,-0.008292902,-14.88606,0.18506974,-260.8854,261.1139,2.108486,5.8457904,-100.35292,-261.9248,-302.1821,7.954276,0.6245933,-0.8549057,86.610794,530000
88
+ 0.6666075,257.79724,0.0035996477,0.0030597087,-11.649998,0.19104975,-257.75528,257.99133,2.9473777,3.8159091,-100.279175,-258.4902,-302.08545,6.7632866,0.72072214,-0.8505405,84.17893,535000
89
+ 0.6662889,257.3421,0.0034619027,0.00038196036,-12.3896675,0.14244072,-257.29922,257.48492,1.6505024,3.4612808,-100.259056,-258.20966,-302.2991,5.111783,0.4436833,-0.66530514,67.85698,540000
90
+ 0.68550396,252.89435,0.0035221889,0.015234091,-8.174823,0.17175764,-252.86555,253.08133,1.6659569,3.6017644,-100.20689,-253.32396,-302.17047,5.267721,0.42580527,-0.568149,61.383785,545000
91
+ 0.6713665,257.42035,0.0038264317,0.008253699,-10.342978,0.1618889,-257.38077,257.59048,1.05686,5.7909865,-100.21844,-258.278,-302.24124,6.8478465,2.3671372,-0.8056934,71.247246,550000
92
+ 0.67156875,260.82404,0.0034859385,-0.00019464323,-12.555837,0.18921193,-260.78027,261.01306,1.4202822,3.1921444,-100.22907,-261.2267,-302.34344,4.6124268,0.4274565,-0.5339117,65.67468,555000
93
+ 0.6700907,250.4118,0.0035086782,0.0032158713,-11.583452,0.15827966,-250.37115,250.5733,2.086684,4.059724,-100.31648,-251.28703,-302.20697,6.146408,0.5088454,-0.6695686,71.05435,560000
94
+ 0.6573655,255.22278,0.003217155,-0.0011752979,-12.865322,0.16857062,-255.1814,255.39017,1.3405058,3.9540634,-100.34573,-255.93086,-302.42392,5.294569,0.35376257,-0.5055719,58.01864,565000
95
+ 0.65466523,258.8454,0.0036407355,-0.00561268,-14.041634,0.15855432,-258.79425,258.99835,1.4427881,3.6242638,-100.150154,-259.70126,-302.28806,5.067052,0.38692856,-0.41798764,54.29637,570000
96
+ 0.6625096,253.87921,0.0035959147,-0.0010707814,-12.797777,0.19699055,-253.8332,254.07513,1.8116016,4.229809,-100.28493,-254.89073,-302.35074,6.0414104,1.3772709,-1.0897532,76.565765,575000
97
+ 0.66512954,263.3871,0.003535649,-0.0013838576,-12.891401,0.165701,-263.34152,263.55142,1.6386791,4.217614,-100.273186,-264.43112,-302.66315,5.856293,1.0860491,-1.4778864,95.738556,580000
98
+ 0.6509602,262.9912,0.0033089768,-0.004857346,-13.96793,0.17098415,-262.94498,263.15735,1.3490771,4.2768984,-100.26749,-264.0121,-302.2061,5.6259756,0.9776824,-1.298924,70.03726,585000
99
+ 0.64459014,256.02484,0.0036025136,-0.009305472,-15.08305,0.17216453,-255.97052,256.18768,1.3192867,4.109779,-100.256256,-256.91724,-301.99246,5.4290657,0.37471634,-0.39286894,55.79483,590000
100
+ 0.66373885,253.92383,0.0035825344,-0.0029191866,-13.314838,0.15676078,-253.87613,254.07767,1.4664825,4.342646,-100.16853,-254.62108,-302.0377,5.8091288,0.51011455,-0.62640184,62.835793,595000
101
+ 0.6594551,261.6609,0.00341665,-0.004945126,-13.947361,0.16314459,-261.61325,261.8191,1.1677507,4.358751,-100.24205,-262.6666,-302.34567,5.5265017,0.44820026,-0.4858847,60.441536,600000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
2
+ 0.68451923,293.98334,0.004215054,0.0046282164,-11.401979,0.20430833,-293.9353,294.1923,8.61393,25.79129,-120.61603,-294.26282,-307.31775,34.40522,5.2540226,-5.060202,393.57745,105000
3
+ 0.6664912,290.70602,0.0046371436,-0.008489391,-14.330737,0.197492,-290.63956,290.89502,5.013113,22.589014,-169.75346,-291.70996,-305.7043,27.602127,3.9411929,-5.9833426,326.2362,110000
4
+ 0.6737685,287.6887,0.0044078766,0.0020398856,-12.037218,0.20666528,-287.63562,287.8974,7.102314,25.196747,-113.6555,-287.85153,-306.3591,32.29906,6.815852,-6.1600866,407.57263,115000
5
+ 0.6718844,293.38538,0.004288726,0.0022887704,-11.966329,0.21459414,-293.33405,293.60226,4.4136996,11.819016,-181.89738,-294.0934,-304.90286,16.232716,3.626711,-3.0821896,286.95926,120000
6
+ 0.65428245,288.97845,0.004355067,-0.016249988,-16.231283,0.19001204,-288.90778,289.15222,5.14059,13.85441,-107.70928,-289.96884,-306.5796,18.995,3.698928,-3.1010113,224.71878,125000
7
+ 0.6907408,288.9909,0.0045750574,0.0123588145,-9.798654,0.20672882,-288.9461,289.21,3.6387048,14.658521,4.2862983,-289.10812,-305.74902,18.297226,4.1496353,-3.9220872,226.3634,130000
8
+ 0.6703889,292.08197,0.0046265484,-0.004213269,-13.410672,0.18716109,-292.01993,292.26492,3.3115585,7.1005297,-101.87245,-293.5209,-305.90848,10.412088,1.334328,-1.1911694,157.5768,135000
9
+ 0.66610444,287.25046,0.004556834,0.00470983,-11.466425,0.19062734,-287.19818,287.44577,3.6017377,6.1707683,-100.08451,-288.02393,-306.60336,9.772506,0.83226186,-0.8993608,113.91702,140000
10
+ 0.675869,288.59216,0.00464063,0.013250917,-9.644587,0.1905204,-288.54742,288.79593,5.51095,12.069573,-100.46694,-289.20197,-305.9452,17.580524,6.0347023,-6.004706,232.73694,145000
11
+ 0.6680993,286.18616,0.0042730775,-0.0008521981,-12.699434,0.20471343,-286.13184,286.39,2.78796,13.464238,-100.32881,-287.00558,-306.2396,16.252197,2.0013406,-2.17956,173.22699,150000
12
+ 0.6715216,286.87073,0.0047365464,-0.0058059935,-13.725786,0.19051635,-286.8057,287.05545,2.6988049,6.896187,-100.64366,-287.42056,-304.72647,9.594992,5.382665,-5.665446,179.83746,155000
13
+ 0.6671254,286.4673,0.004245301,0.0054082307,-11.226067,0.22228831,-286.41962,286.69498,3.5842488,6.6831675,-100.71774,-286.98907,-304.64276,10.267416,2.811478,-2.902136,158.75244,160000
14
+ 0.6781303,287.3279,0.0045389323,0.003620719,-11.702297,0.18457285,-287.27478,287.5161,2.0543249,7.3452773,-100.53266,-288.2166,-304.43292,9.399602,1.1019225,-2.0408275,117.167595,165000
15
+ 0.6573901,280.77863,0.0045718886,-0.002415692,-13.028379,0.2033413,-280.71906,280.97955,4.2643714,8.362673,-99.95689,-281.51517,-304.00513,12.627045,1.4380249,-1.6364849,144.34888,170000
16
+ 0.6497354,279.42328,0.0044190474,-0.013431877,-15.539541,0.21280237,-279.35464,279.62265,4.528965,9.813952,-42.049603,-280.848,-303.59167,14.342917,2.0279415,-2.1281364,193.70285,175000
17
+ 0.65134305,280.63416,0.0047699413,-0.007488661,-14.069969,0.1817931,-280.56705,280.80847,4.013481,9.317459,-100.84814,-281.5577,-303.74457,13.33094,4.431979,-4.6011686,223.049,180000
18
+ 0.6655947,283.35968,0.004696949,0.0022555098,-12.019793,0.17607799,-283.30322,283.53802,6.766423,16.835356,-72.148964,-283.8523,-303.50494,23.60178,3.632357,-6.7889514,318.7234,185000
19
+ 0.6349745,283.1961,0.004591602,-0.015801165,-15.9413185,0.19876814,-283.12292,283.37906,2.6018686,6.587053,-100.68098,-283.95624,-303.44083,9.188921,0.9927075,-1.0739177,112.39383,190000
20
+ 0.66981256,283.4567,0.004645815,-0.0022180397,-12.9774275,0.16931374,-283.39636,283.62378,4.4622335,9.366705,-100.50177,-284.42932,-306.06396,13.8289385,5.4966736,-2.433301,195.22653,195000
21
+ 0.6382584,280.38306,0.004144511,-0.010709961,-15.084131,0.18243904,-280.32056,280.55478,3.6834378,8.6417675,-100.41263,-281.379,-303.55994,12.325205,5.3457522,-5.8637404,170.8758,200000
22
+ 0.6657277,282.63913,0.0045498973,0.0028504592,-11.873511,0.20646295,-282.58508,282.84842,2.4107628,5.298977,-100.572426,-283.78427,-303.83258,7.7097397,0.95388204,-1.0594045,104.795715,205000
23
+ 0.6620062,283.28467,0.0045103584,-0.0053976453,-13.696722,0.20741685,-283.22287,283.4867,3.7311432,6.724145,-100.697426,-283.7058,-304.37314,10.455288,1.6010253,-0.8894999,132.09682,210000
24
+ 0.65642774,279.51703,0.004300823,-0.0055446285,-13.789202,0.18040115,-279.4577,279.69186,3.4798627,29.228643,-100.97223,-280.72983,-304.1224,32.708508,3.1732996,-3.195035,215.67845,215000
25
+ 0.65613544,275.7928,0.004515519,0.00045565324,-12.399092,0.1809637,-275.73682,275.9742,2.6306727,6.939186,-100.66823,-276.3704,-303.0552,9.569859,1.0368266,-0.8023071,106.97895,220000
26
+ 0.6728544,282.9552,0.0045306766,0.008741714,-10.57055,0.20210044,-282.90732,283.16602,2.231251,4.362925,-100.50309,-283.87277,-305.88812,6.5941763,0.7409519,-1.1349382,100.86598,225000
27
+ 0.6683748,280.78998,0.0045794556,-0.0033889709,-13.240038,0.19279812,-280.72937,280.9794,3.4110935,5.8313403,-100.64743,-281.72174,-303.58395,9.242434,2.8267136,-2.7897112,148.8169,230000
28
+ 0.6597693,281.06482,0.004272183,-0.0013453406,-12.814907,0.1842169,-281.01007,281.24768,3.6299736,13.969589,-100.8249,-281.4045,-303.58853,17.599564,1.0069147,-0.97952545,134.486,235000
29
+ 0.6695947,277.21915,0.0044925003,0.008298579,-10.652793,0.22515234,-277.17126,277.4526,4.136679,7.339206,-100.54731,-278.1678,-303.50122,11.475885,7.918346,-8.001877,208.47581,240000
30
+ 0.6538633,274.71268,0.004400906,-0.0038007684,-13.363633,0.19521847,-274.65387,274.90408,2.9407256,6.7453265,-100.455215,-275.6302,-303.27167,9.686052,1.7203066,-1.6504842,111.534325,245000
31
+ 0.6578575,280.63586,0.004306516,0.0027046083,-11.871973,0.20322004,-280.58472,280.8418,2.016702,5.3264565,-100.855125,-281.3919,-302.95084,7.3431587,4.2510114,-2.8743126,147.61621,250000
32
+ 0.6720497,277.4738,0.004528949,0.0028827512,-11.863483,0.17018196,-277.42004,277.64685,2.8924577,6.676891,-100.64984,-278.5212,-302.9243,9.569348,0.9179635,-0.97357893,103.63555,255000
33
+ 0.66854036,273.23895,0.004256538,0.0039268904,-11.577445,0.19259477,-273.18967,273.4355,2.6040218,9.133765,-100.49883,-274.07578,-303.4401,11.737787,0.9358999,-1.0847982,122.35719,260000
34
+ 0.6613903,274.36584,0.004028555,0.0039120675,-11.528915,0.19637986,-274.3194,274.56613,2.5180829,5.306285,-100.66111,-275.45166,-302.85785,7.8243675,1.1225915,-1.1349574,116.20146,265000
35
+ 0.66029286,273.8703,0.004433171,-0.0015998,-12.86087,0.20323831,-273.8133,274.07196,7.245473,10.597219,-100.36418,-274.73776,-303.07095,17.842693,5.6964917,-4.9104033,246.95653,270000
36
+ 0.6482542,274.31622,0.004108795,0.0010193775,-12.251904,0.20527336,-274.26587,274.5225,2.0742817,7.367837,-100.60472,-275.14087,-302.7074,9.442119,2.5282898,-2.7159488,127.72145,275000
37
+ 0.6597041,275.10065,0.0040816613,-0.000114293805,-12.528002,0.20006415,-275.04953,275.3006,2.068011,5.9473357,-100.37619,-276.2026,-304.5306,8.015347,5.112983,-6.832732,169.8475,280000
38
+ 0.6677756,271.6299,0.004193853,-0.00021519286,-12.5513115,0.19781375,-271.57727,271.8275,1.6568222,3.8411744,-100.51346,-272.08755,-302.8718,5.4979963,1.2215536,-1.3024983,89.15317,285000
39
+ 0.65976745,270.4936,0.004100183,-0.0011627644,-12.783588,0.18433033,-270.44116,270.67676,2.1886604,7.725998,-100.71729,-271.20178,-302.5945,9.914659,1.0844638,-1.2236246,105.463455,290000
40
+ 0.65960634,278.31415,0.0039842115,0.00069572934,-12.325378,0.18725109,-278.265,278.5021,1.8796847,4.661954,-100.57267,-278.8693,-302.68384,6.5416384,0.95619905,-0.8847669,85.41288,295000
41
+ 0.6599329,270.85397,0.004216248,-0.00109362,-12.759382,0.21784757,-270.80017,271.0707,3.1765423,11.988109,-100.4198,-271.38773,-304.3664,15.164651,5.3894196,-4.9390607,210.92844,300000
42
+ 0.64567715,269.56607,0.004222326,-0.0072350847,-14.213531,0.16086668,-269.50604,269.7197,1.8978827,4.760344,-100.51973,-270.08176,-303.1313,6.658227,1.4176608,-0.75859535,97.41152,305000
43
+ 0.6560849,273.22064,0.00393441,0.0003329429,-12.415377,0.18586269,-273.17178,273.40683,1.8375494,4.9716363,-100.08516,-274.1525,-303.42465,6.809186,0.6252449,-0.58951265,78.60679,310000
44
+ 0.6577029,269.73346,0.004189126,-8.976105e-05,-12.521427,0.16532847,-269.68103,269.89868,1.7167877,3.6434686,-100.46334,-270.6368,-303.2639,5.360256,0.46297807,-0.49564347,65.871346,315000
45
+ 0.6593379,273.85428,0.003908834,0.0021221435,-11.95709,0.18615955,-273.80753,274.04257,1.8063011,6.0722303,-100.40095,-274.6954,-303.16742,7.8785315,1.4955211,-1.5284106,93.95325,320000
46
+ 0.65785885,275.83673,0.0038910322,-0.00061753276,-12.658707,0.20111777,-275.78748,276.03723,1.672944,3.7476952,-100.45736,-276.59448,-302.97992,5.420639,0.47753397,-0.49360105,68.22826,325000
47
+ 0.6698183,276.1263,0.0039922427,-0.003559288,-13.391551,0.19342044,-276.07288,276.31616,2.3274605,5.4082446,-100.21273,-277.21484,-302.68057,7.7357054,0.9723817,-0.80500937,94.65053,330000
48
+ 0.66569716,272.54523,0.0040205005,0.005621855,-11.101703,0.19483946,-272.50058,272.74567,2.3991742,5.6730013,-36.752174,-273.46356,-302.66028,8.072176,0.5943003,-0.74300194,84.91491,335000
49
+ 0.6471759,275.0191,0.0040887557,-0.010069604,-14.962755,0.16455427,-274.95792,275.17358,10.494473,13.302347,-100.24765,-276.1551,-302.59515,23.796822,5.8674083,-4.6791883,170.15817,340000
50
+ 0.66667485,266.31665,0.0039652037,0.006164384,-10.94538,0.19398738,-266.27325,266.5168,1.2723359,5.591412,-100.295555,-266.78683,-302.73563,6.863748,1.3614144,-1.6400306,113.02138,345000
51
+ 0.67841774,276.90933,0.0039304798,0.008492002,-10.339449,0.19118927,-276.8687,277.109,1.8647327,4.250465,-100.40966,-277.59274,-304.21945,6.1151977,0.6850765,-0.72678417,81.964066,350000
52
+ 0.6497261,269.5616,0.003967053,-0.0048569855,-13.724331,0.1736053,-269.5072,269.73038,1.5876282,5.1157737,-100.502464,-270.44888,-302.73444,6.703402,1.0497494,-0.7462057,76.77505,355000
53
+ 0.66736066,268.97766,0.00395821,0.01413966,-8.927764,0.20399728,-268.94232,269.1958,4.561915,7.1822853,-100.46868,-269.78522,-303.59982,11.7442,0.8934831,-3.0045388,107.14699,360000
54
+ 0.65771663,269.98834,0.0039226175,-0.00090162415,-12.729853,0.16083995,-269.93842,270.14825,1.6294245,7.070563,-100.51358,-271.15344,-302.86667,8.699987,7.033176,-2.9473987,159.60751,365000
55
+ 0.6653325,274.75217,0.0041245143,-0.0032500783,-13.287991,0.18056744,-274.69736,274.9295,3.9107327,15.733594,-100.43659,-275.4692,-302.85837,19.644327,2.4299672,-2.79613,151.33267,370000
56
+ 0.6642539,266.6115,0.0040915236,-0.00019664424,-12.548061,0.18847454,-266.56015,266.7998,2.0304866,9.097063,-51.658092,-268.2601,-303.45563,11.12755,2.9823604,-3.4687304,167.4929,375000
57
+ 0.6748687,267.19022,0.0038476244,0.007849054,-10.460026,0.16590168,-267.14996,267.36395,1.1332228,3.366885,-100.55124,-268.11914,-302.71567,4.500108,0.4425672,-0.33690852,59.050903,380000
58
+ 0.65113336,271.90912,0.0039671496,-0.008543671,-14.6536045,0.17974496,-271.851,272.08032,1.7223713,4.4875803,-100.489,-272.8671,-302.89377,6.2099514,0.58376765,-0.57324445,75.50888,385000
59
+ 0.6560427,266.07416,0.0038806133,-0.0003673307,-12.594658,0.16777676,-266.02527,266.24158,1.8161602,5.1352806,-100.39454,-267.01874,-302.7291,6.951441,0.782713,-0.62384737,75.767746,390000
60
+ 0.6597192,272.55554,0.0039010996,0.0028020998,-11.781715,0.16661847,-272.50958,272.72498,1.3667477,3.5228863,-100.346085,-273.77838,-302.6089,4.889634,0.59984815,-0.550295,75.89462,395000
61
+ 0.6668584,267.29028,0.0036817214,0.005079087,-11.120459,0.15862839,-267.24933,267.45398,2.1448905,4.8165584,-100.17544,-267.87378,-302.60162,6.9614487,0.7769519,-1.0737119,94.71971,400000
62
+ 0.66693467,267.22937,0.0036424336,0.004723875,-11.203099,0.18740317,-267.18857,267.4215,1.2318159,3.8680942,-100.434265,-267.7701,-302.64264,5.0999103,0.6635179,-0.3770324,57.668232,405000
63
+ 0.66256905,265.29175,0.0035590257,0.0024014912,-11.825239,0.18866329,-265.24963,265.48282,1.9301949,4.0989823,-100.35318,-266.0905,-302.5925,6.029177,2.175365,-1.9823674,111.53575,410000
64
+ 0.66590106,260.9079,0.0038136372,0.00293987,-11.729116,0.18806663,-260.86316,261.0989,2.1116588,4.9312487,-100.30906,-261.70477,-303.49286,7.0429077,0.63569945,-0.5917638,74.79365,415000
65
+ 0.6547557,257.19592,0.0035813132,0.0034239176,-11.543949,0.15109244,-257.15454,257.35043,1.8327223,5.431681,-100.22818,-257.88254,-302.83374,7.2644033,4.2294197,-4.2095594,113.1483,420000
66
+ 0.6550953,269.07922,0.0038441767,-0.00039488217,-12.602722,0.18713096,-269.03076,269.26596,1.5472673,3.5903041,-100.41402,-270.26718,-302.55588,5.1375713,0.6697365,-0.65533626,70.6969,425000
67
+ 0.6617154,264.55463,0.0036031115,-0.0025399597,-13.204935,0.18797025,-264.50705,264.74005,1.5975531,5.0644383,-100.30801,-265.46118,-302.2158,6.6619916,1.0897309,-1.0215456,83.90999,430000
68
+ 0.67918974,261.80035,0.0037656464,0.012858917,-9.085203,0.17467204,-261.76617,261.98788,1.5609797,3.9593887,-100.42784,-262.74976,-302.55017,5.5203686,0.3749403,-0.43101916,67.10281,435000
69
+ 0.6610254,271.09827,0.0036392147,0.0053234883,-11.037188,0.20606509,-271.05807,271.30963,1.1009724,3.3793056,-100.42159,-271.95554,-302.79916,4.480278,0.40706867,-0.4043219,56.8023,440000
70
+ 0.64622223,270.71924,0.0035865668,-0.007326635,-14.542799,0.18937825,-270.66708,270.9013,1.583169,4.402729,-100.22965,-271.82144,-302.18585,5.985898,0.52071285,-0.3771574,68.14932,445000
71
+ 0.66553956,262.93646,0.0036322526,0.0030756039,-11.653252,0.15485878,-262.89417,263.0944,1.6846799,6.641065,-100.289314,-263.55573,-302.8689,8.325745,0.65142953,-0.6787297,81.82866,450000
72
+ 0.6544496,265.32275,0.003469738,-0.0004956882,-12.64286,0.17467663,-265.27887,265.49695,1.6914753,5.181705,-100.32149,-266.64224,-302.25452,6.8731804,0.5946399,-0.8987936,80.91699,455000
73
+ 0.661275,264.6247,0.0034403221,0.0034033624,-11.510743,0.199944,-264.58508,264.82806,2.6594207,5.0236216,-100.27758,-265.28134,-302.50952,7.6830425,1.3234826,-1.374464,98.816025,460000
74
+ 0.6691528,267.14932,0.0037049805,0.0031800526,-11.641682,0.1758295,-267.1062,267.32834,1.3890438,3.4824243,-100.34266,-268.08398,-302.36304,4.871468,0.53933835,-0.5151295,65.53829,465000
75
+ 0.6651159,257.7638,0.0037054275,0.006768373,-10.673389,0.17916575,-257.72424,257.94974,1.8000523,3.9009697,-100.333534,-258.51636,-302.29333,5.701022,0.45482826,-0.9027178,69.833244,470000
76
+ 0.6470896,267.89145,0.0037664545,-0.0040861797,-13.5848875,0.17886014,-267.84027,268.06622,1.2086172,3.6171665,-100.37444,-268.5765,-302.3025,4.8257837,0.44596443,-0.5893723,63.880737,475000
77
+ 0.66398215,264.41736,0.0036332346,0.0051661683,-11.07808,0.17725262,-264.3771,264.59976,1.313259,3.962143,-100.27923,-264.84796,-302.48904,5.275402,0.7113575,-0.7270033,72.45816,480000
78
+ 0.64862746,264.52533,0.0034179534,-0.006979307,-14.541955,0.16015942,-264.47565,264.6785,1.4047166,4.246804,-49.13206,-265.38412,-302.5549,5.6515207,0.39226666,-0.3512892,63.005272,485000
79
+ 0.67060804,258.71368,0.0037436234,0.008691588,-10.178295,0.17607416,-258.67557,258.89847,1.4046863,3.0822053,-100.35954,-259.63388,-302.05594,4.4868917,0.45084843,-0.47043863,62.72486,490000
80
+ 0.67268723,262.85504,0.0038914883,0.006823918,-10.74645,0.1733397,-262.81323,263.03522,2.0744379,6.509088,-100.31038,-263.66266,-302.66074,8.583526,4.872945,-3.3207226,145.63272,495000
81
+ 0.66265976,260.78113,0.0036554534,5.4045195e-05,-12.485215,0.15784723,-260.73547,260.93903,1.5869172,8.185119,-100.379074,-261.936,-302.51483,9.772036,1.5826226,-1.5574999,104.27873,500000
82
+ 0.6696322,263.16147,0.0037451177,0.0065610493,-10.748106,0.2037558,-263.12122,263.3718,2.3565044,3.804779,-100.31009,-263.91174,-302.35544,6.1612835,0.9989629,-0.78786004,89.67894,505000
83
+ 0.6598066,262.78113,0.0037632303,-0.0025056165,-13.165815,0.20673466,-262.73157,262.98535,1.5182848,5.4889116,-100.371086,-264.3733,-302.5626,7.0071964,0.79459846,-0.9425655,86.70977,510000
84
+ 0.6638613,255.15154,0.0034852421,0.0010051461,-12.211599,0.17222558,-255.10898,255.32477,1.3549465,3.783877,-100.31756,-256.06445,-302.64673,5.1388235,0.6954565,-0.40338624,64.308044,515000
85
+ 0.6645097,263.03864,0.003636254,-0.0010092136,-12.777542,0.17728382,-262.9922,263.2149,1.4959633,5.121807,-100.29835,-263.7994,-302.45508,6.61777,0.8594134,-0.5416299,67.083305,520000
86
+ 0.64552563,264.2447,0.0036034072,-0.009251364,-15.067393,0.16150019,-264.19037,264.39694,1.3065583,4.094031,-100.3187,-264.9648,-302.51474,5.400589,0.40394333,-0.36000612,59.201073,525000
87
+ 0.63946295,260.93713,0.0034755634,-0.008292902,-14.88606,0.18506974,-260.8854,261.1139,2.108486,5.8457904,-100.35292,-261.9248,-302.1821,7.954276,0.6245933,-0.8549057,86.610794,530000
88
+ 0.6666075,257.79724,0.0035996477,0.0030597087,-11.649998,0.19104975,-257.75528,257.99133,2.9473777,3.8159091,-100.279175,-258.4902,-302.08545,6.7632866,0.72072214,-0.8505405,84.17893,535000
89
+ 0.6662889,257.3421,0.0034619027,0.00038196036,-12.3896675,0.14244072,-257.29922,257.48492,1.6505024,3.4612808,-100.259056,-258.20966,-302.2991,5.111783,0.4436833,-0.66530514,67.85698,540000
90
+ 0.68550396,252.89435,0.0035221889,0.015234091,-8.174823,0.17175764,-252.86555,253.08133,1.6659569,3.6017644,-100.20689,-253.32396,-302.17047,5.267721,0.42580527,-0.568149,61.383785,545000
91
+ 0.6713665,257.42035,0.0038264317,0.008253699,-10.342978,0.1618889,-257.38077,257.59048,1.05686,5.7909865,-100.21844,-258.278,-302.24124,6.8478465,2.3671372,-0.8056934,71.247246,550000
92
+ 0.67156875,260.82404,0.0034859385,-0.00019464323,-12.555837,0.18921193,-260.78027,261.01306,1.4202822,3.1921444,-100.22907,-261.2267,-302.34344,4.6124268,0.4274565,-0.5339117,65.67468,555000
93
+ 0.6700907,250.4118,0.0035086782,0.0032158713,-11.583452,0.15827966,-250.37115,250.5733,2.086684,4.059724,-100.31648,-251.28703,-302.20697,6.146408,0.5088454,-0.6695686,71.05435,560000
94
+ 0.6573655,255.22278,0.003217155,-0.0011752979,-12.865322,0.16857062,-255.1814,255.39017,1.3405058,3.9540634,-100.34573,-255.93086,-302.42392,5.294569,0.35376257,-0.5055719,58.01864,565000
95
+ 0.65466523,258.8454,0.0036407355,-0.00561268,-14.041634,0.15855432,-258.79425,258.99835,1.4427881,3.6242638,-100.150154,-259.70126,-302.28806,5.067052,0.38692856,-0.41798764,54.29637,570000
96
+ 0.6625096,253.87921,0.0035959147,-0.0010707814,-12.797777,0.19699055,-253.8332,254.07513,1.8116016,4.229809,-100.28493,-254.89073,-302.35074,6.0414104,1.3772709,-1.0897532,76.565765,575000
97
+ 0.66512954,263.3871,0.003535649,-0.0013838576,-12.891401,0.165701,-263.34152,263.55142,1.6386791,4.217614,-100.273186,-264.43112,-302.66315,5.856293,1.0860491,-1.4778864,95.738556,580000
98
+ 0.6509602,262.9912,0.0033089768,-0.004857346,-13.96793,0.17098415,-262.94498,263.15735,1.3490771,4.2768984,-100.26749,-264.0121,-302.2061,5.6259756,0.9776824,-1.298924,70.03726,585000
99
+ 0.64459014,256.02484,0.0036025136,-0.009305472,-15.08305,0.17216453,-255.97052,256.18768,1.3192867,4.109779,-100.256256,-256.91724,-301.99246,5.4290657,0.37471634,-0.39286894,55.79483,590000
100
+ 0.66373885,253.92383,0.0035825344,-0.0029191866,-13.314838,0.15676078,-253.87613,254.07767,1.4664825,4.342646,-100.16853,-254.62108,-302.0377,5.8091288,0.51011455,-0.62640184,62.835793,595000
101
+ 0.6594551,261.6609,0.00341665,-0.004945126,-13.947361,0.16314459,-261.61325,261.8191,1.1677507,4.358751,-100.24205,-262.6666,-302.34567,5.5265017,0.44820026,-0.4858847,60.441536,600000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1041200210bc22fcdd89204e66af12fb34291cd3c174ba5b8725a347e3b3e3a2
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dffa13edd098e82b91cdab6706edd865e9c4ef9d94c6bdc254aad5f54ac77ad9
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c1c348211461d8f912d01534ba248774bd783cc343b3156fe83e059dc0c7d1d
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50710caa15ec2b7204184161c15c5974436226119e4a33d8d3bd99f7ff4b4d06
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7562a02f962d8448a574f694b12150fc8dc3d82ce1ebef74b5368f040c1a3c2
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7a412e8310b5d4dae72952c5d86deb5eb977664d7a9f3f6ab36cd9f0e898692
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02140c1daa88151fc4bc5dd36ab1a4c4b169eb58c8c4ec992a71f29d9880882b
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:305ae8a0ebcc9666ea73350389eac4aff9ededce4dfe62dde8a66829603547cf
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:735e24cbced0693f3eb870fa7b7a5670923647edc6740a331a5bf61a2128e5ff
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:deb87e90dbe24b3687cd5dc7ea34aafb44b3430ee839e52ea36f4cfa457d9b41
3
+ size 328782656
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/dsrl/20260324_011140/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/lyfdyucy