Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1150000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1200000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1250000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1300000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1350000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1400000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1450000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1500000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.043504832867536494,-0.005857940252080525,-0.042526916194125866,-0.005472976873102807,34.29653433387341,8.293999999999464,0.9,4422.92,-0.1,-222.84,163.88,0.5449089241027832,1050000
|
| 3 |
+
0.0,0.0,-0.024217975661516098,-0.013471516297320834,-0.022701753329069,-0.005184098166303314,33.5201768147862,7.370999999999393,0.9,11845.36,-0.18,-230.2,145.42,0.46598066329956056,1100000
|
| 4 |
+
0.0,0.0,-0.02731690622803005,0.0008942340399534852,-0.025470366277342598,0.0005565664810217357,32.86921409026775,6.198999999999741,0.98,18909.72,-0.02,-183.74,121.98,0.4080416011810303,1150000
|
| 5 |
+
0.0,0.0,-0.049340528748432956,0.007231048632606063,-0.04730501505531233,0.0037027342005502674,33.253277713236756,6.156999999999756,0.96,25345.68,-0.06,-194.98,121.14,0.39780613899230954,1200000
|
| 6 |
+
0.0,0.0,-0.033251766852659716,0.034421625469131786,-0.030627951892593035,0.030355560414232954,33.82301485823177,7.02299999999979,0.96,32215.46,-0.06,-200.22,138.46,0.43850412368774416,1250000
|
| 7 |
+
0.0,0.0,-0.04468238749750187,0.028344665090518143,-0.04120743843171445,0.027072688171037466,33.596430086850745,4.178999999999788,1.0,37835.34,0.0,-119.44,81.58,0.2731659460067749,1300000
|
| 8 |
+
0.0,0.0,-0.05363877900677943,0.04492814309669321,-0.05027015249575274,0.04204988290134937,33.15737252952398,5.4909999999996755,0.96,42654.66,-0.06,-175.36,107.82,0.34607816219329834,1350000
|
| 9 |
+
0.0,0.0,-0.04074778086443957,0.02444063169423961,-0.037142457771699916,0.02670842262814929,32.432648056613886,4.282999999999793,1.0,47649.96,0.0,-122.8,83.66,0.27738633155822756,1400000
|
| 10 |
+
0.0,0.0,-0.043882307314871014,0.033365694204548546,-0.040009724925212924,0.03556571754457891,32.30897173335463,4.885999999999705,0.98,52434.1,-0.02,-142.18,95.72,0.3111926317214966,1450000
|
| 11 |
+
0.0,0.0,-0.055692062610132965,0.03659639054991016,-0.051874747707163736,0.034186092211345595,33.994866796202054,4.276999999999862,1.0,56968.48,0.0,-120.96,83.54,0.2757084321975708,1500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.043504832867536494,-0.005857940252080525,-0.042526916194125866,-0.005472976873102807,34.29653433387341,8.293999999999464,0.9,4422.92,-0.1,-222.84,163.88,0.5449089241027832,1050000
|
| 3 |
+
0.0,0.0,-0.024217975661516098,-0.013471516297320834,-0.022701753329069,-0.005184098166303314,33.5201768147862,7.370999999999393,0.9,11845.36,-0.18,-230.2,145.42,0.46598066329956056,1100000
|
| 4 |
+
0.0,0.0,-0.02731690622803005,0.0008942340399534852,-0.025470366277342598,0.0005565664810217357,32.86921409026775,6.198999999999741,0.98,18909.72,-0.02,-183.74,121.98,0.4080416011810303,1150000
|
| 5 |
+
0.0,0.0,-0.049340528748432956,0.007231048632606063,-0.04730501505531233,0.0037027342005502674,33.253277713236756,6.156999999999756,0.96,25345.68,-0.06,-194.98,121.14,0.39780613899230954,1200000
|
| 6 |
+
0.0,0.0,-0.033251766852659716,0.034421625469131786,-0.030627951892593035,0.030355560414232954,33.82301485823177,7.02299999999979,0.96,32215.46,-0.06,-200.22,138.46,0.43850412368774416,1250000
|
| 7 |
+
0.0,0.0,-0.04468238749750187,0.028344665090518143,-0.04120743843171445,0.027072688171037466,33.596430086850745,4.178999999999788,1.0,37835.34,0.0,-119.44,81.58,0.2731659460067749,1300000
|
| 8 |
+
0.0,0.0,-0.05363877900677943,0.04492814309669321,-0.05027015249575274,0.04204988290134937,33.15737252952398,5.4909999999996755,0.96,42654.66,-0.06,-175.36,107.82,0.34607816219329834,1350000
|
| 9 |
+
0.0,0.0,-0.04074778086443957,0.02444063169423961,-0.037142457771699916,0.02670842262814929,32.432648056613886,4.282999999999793,1.0,47649.96,0.0,-122.8,83.66,0.27738633155822756,1400000
|
| 10 |
+
0.0,0.0,-0.043882307314871014,0.033365694204548546,-0.040009724925212924,0.03556571754457891,32.30897173335463,4.885999999999705,0.98,52434.1,-0.02,-142.18,95.72,0.3111926317214966,1450000
|
| 11 |
+
0.0,0.0,-0.055692062610132965,0.03659639054991016,-0.051874747707163736,0.034186092211345595,33.994866796202054,4.276999999999862,1.0,56968.48,0.0,-120.96,83.54,0.2757084321975708,1500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.6464956,151.57722,0.007163675,0.0030462234,-12.074768,0.17292589,-151.49072,151.7532,1.3128544,3.7949963,-70.795906,-154.47537,-193.89467,5.1078506,3.1127567,-2.949452,76.30099,1005000
|
| 3 |
+
0.6485105,146.79274,0.0076541477,-0.0065934774,-13.361425,0.16756466,-146.69046,146.95372,1.5746807,5.1706023,-41.557182,-149.52043,-191.74504,6.745283,3.3696132,-4.8575883,88.63003,1010000
|
| 4 |
+
0.64525586,147.00572,0.007770758,-0.0091342665,-13.675467,0.17948562,-146.89944,147.17607,2.4174645,5.5621743,-41.01098,-149.57582,-193.16957,7.979639,1.3709776,-1.5047313,71.079346,1015000
|
| 5 |
+
0.63883394,144.54778,0.008655294,-0.009785089,-13.630532,0.18681526,-144.42981,144.72481,2.3234909,6.1018195,-44.51125,-148.00513,-200.11287,8.42531,3.4827356,-2.6060915,73.25749,1020000
|
| 6 |
+
0.6435777,139.33673,0.008913718,-0.0021352523,-12.739547,0.20421615,-139.22318,139.53882,1.8558857,7.855736,-22.038013,-142.44089,-199.51778,9.711621,3.1024864,-3.0871446,89.08097,1025000
|
| 7 |
+
0.64866555,135.86174,0.009273562,0.007008288,-11.744272,0.16436714,-135.75282,136.03311,3.3357475,6.2067666,-20.808237,-138.5915,-197.19006,9.542514,1.0498705,-1.0992802,83.02554,1030000
|
| 8 |
+
0.649019,136.32335,0.009138469,0.0039164717,-12.07143,0.18875074,-136.21303,136.51602,3.4171937,10.153538,-23.086048,-139.17169,-195.6537,13.570731,5.2551436,-4.7140436,144.98236,1035000
|
| 9 |
+
0.6393231,134.4324,0.009306475,-0.022307223,-14.896957,0.13545766,-134.29376,134.54555,4.080291,9.577062,-19.443583,-138.30533,-201.1646,13.657352,2.852514,-2.9530969,112.93753,1040000
|
| 10 |
+
0.64937866,135.09111,0.009450281,0.0049868454,-11.972307,0.1760129,-134.97797,135.27211,1.999966,5.074394,-13.707406,-137.73552,-196.076,7.0743604,4.4575896,-4.349462,88.345764,1045000
|
| 11 |
+
0.64400387,135.94951,0.009125749,0.00019272776,-12.478881,0.18479623,-135.83563,136.1345,3.0653298,7.7147174,-9.577094,-138.78268,-197.03235,10.780047,0.88452595,-0.87104815,106.573944,1050000
|
| 12 |
+
0.64533204,134.44623,0.009007195,-0.005250217,-13.082891,0.18030345,-134.32838,134.62128,4.1405897,7.588472,-7.7217517,-138.22826,-198.6875,11.729061,2.0673459,-2.0582304,83.56644,1055000
|
| 13 |
+
0.636829,133.14493,0.008968328,-0.015689613,-14.249447,0.17570888,-133.01714,133.30495,2.7620275,9.705306,-29.735945,-137.09244,-202.00311,12.467334,7.023451,-6.65542,144.72197,1060000
|
| 14 |
+
0.6424235,132.41772,0.0093809115,-0.023239965,-14.977367,0.17354581,-132.27724,132.56802,2.012982,9.585312,-17.369453,-135.43277,-201.27684,11.598293,4.071946,-4.0390773,119.737495,1065000
|
| 15 |
+
0.64226645,128.78539,0.009493685,-0.0052063907,-13.048406,0.19711253,-128.66151,128.9773,2.4989467,8.273597,-21.812529,-131.59843,-199.42223,10.772543,2.291885,-2.786441,100.447395,1070000
|
| 16 |
+
0.6494754,132.58534,0.009366402,-0.003478368,-12.8713665,0.19981475,-132.46478,132.78168,2.4093106,10.638217,-7.313128,-135.82703,-202.58841,13.047527,8.683023,-8.241741,156.12833,1075000
|
| 17 |
+
0.6391464,132.66927,0.009232,-0.0072721234,-13.287708,0.17731173,-132.5466,132.8393,3.7323816,10.33302,-9.757318,-136.00179,-201.96973,14.065402,8.590516,-5.1886845,150.99756,1080000
|
| 18 |
+
0.64403164,131.04622,0.009804857,-0.00083475973,-12.585137,0.18893978,-130.92282,131.23431,5.302259,7.8610206,-4.65475,-133.72044,-200.44604,13.16328,2.188338,-2.0905042,124.93063,1085000
|
| 19 |
+
0.6405302,130.4898,0.009314617,-0.013506362,-13.950018,0.1624625,-130.35986,130.63876,5.47509,8.86723,-4.94899,-133.30392,-197.39832,14.34232,2.5606823,-3.241087,127.28847,1090000
|
| 20 |
+
0.642231,128.53061,0.0091807125,0.00983672,-11.428545,0.15545717,-128.42569,128.6959,4.0513597,7.3872504,-7.3206973,-131.25467,-196.49045,11.43861,4.312066,-4.5787525,112.990036,1095000
|
| 21 |
+
0.63821286,125.3012,0.009375393,-0.0011153272,-12.618963,0.17982708,-125.1829,125.47991,3.3594525,16.832909,-10.902427,-128.49922,-201.95685,20.192362,12.081791,-11.287716,222.06155,1100000
|
| 22 |
+
0.6391037,129.383,0.009236451,-0.01274685,-13.880059,0.1843239,-129.2548,129.55458,3.482558,11.127075,-17.885136,-133.7312,-196.6523,14.609633,2.169407,-1.9778278,134.06787,1105000
|
| 23 |
+
0.6378062,128.66994,0.009167755,-0.015629072,-14.204787,0.16459247,-128.53972,128.81891,2.488557,9.1795,-7.582003,-131.70236,-199.71085,11.6680565,5.7105875,-5.259641,104.23355,1110000
|
| 24 |
+
0.6373791,125.73598,0.009174248,-0.004175306,-12.9551115,0.13900429,-125.61713,125.87081,2.6657567,13.092148,0.45087546,-129.28801,-198.20631,15.757904,7.525411,-8.492876,163.36597,1115000
|
| 25 |
+
0.6406654,127.259224,0.00898818,0.008359645,-11.569929,0.1835387,-127.155235,127.451126,2.2040398,13.830764,-5.3187113,-130.4257,-200.84705,16.034803,5.974059,-5.3755093,124.958145,1120000
|
| 26 |
+
0.6325392,132.24692,0.00901013,-0.017898234,-14.486457,0.19923258,-132.11641,132.42825,5.006565,8.807695,-9.609513,-135.89394,-199.02777,13.8142605,2.5000587,-2.5419643,149.8818,1125000
|
| 27 |
+
0.64280957,129.91394,0.0093098255,-0.007008943,-13.252854,0.16812113,-129.79056,130.07506,3.2459145,9.242699,-11.305132,-133.42838,-198.78586,12.488613,2.7497218,-2.8461416,128.08379,1130000
|
| 28 |
+
0.6360216,126.08401,0.008981415,-0.014331877,-14.095726,0.1821321,-125.95741,126.2518,3.9134774,9.082964,1.7933187,-130.18504,-201.86671,12.996441,3.8123417,-3.6377184,136.441,1135000
|
| 29 |
+
0.636382,124.70767,0.008865839,-0.00035969785,-12.540571,0.18880431,-124.59649,124.89612,4.050621,8.832672,-6.534545,-128.21623,-196.91035,12.883293,2.8421605,-2.2754269,130.32579,1140000
|
| 30 |
+
0.6504776,128.10019,0.008851974,0.007689001,-11.63138,0.16067816,-127.99723,128.26855,3.6161458,10.093371,-2.3105562,-130.68279,-200.06606,13.7095175,6.768597,-5.4132333,165.2433,1145000
|
| 31 |
+
0.64407223,128.86893,0.009051435,0.0006959043,-12.423117,0.15228572,-128.75647,129.02191,2.9644039,8.396022,-2.6708305,-131.18652,-202.96336,11.360426,3.1548195,-2.3944194,109.14513,1150000
|
| 32 |
+
0.6422238,126.62654,0.009084243,0.0018990714,-12.290949,0.18313959,-126.51488,126.81158,3.7675316,13.460883,-5.232151,-129.2733,-201.30688,17.228415,4.1794944,-3.6322865,206.66385,1155000
|
| 33 |
+
0.6417494,128.65085,0.009113943,0.007644988,-11.661177,0.19036144,-128.54456,128.84886,6.00014,10.239601,-10.139838,-131.6443,-202.76094,16.239742,2.317663,-4.1540713,226.0728,1160000
|
| 34 |
+
0.63586605,129.32718,0.009144476,-0.015846755,-14.232932,0.199867,-129.19702,129.51118,3.888094,12.516783,-1.3985913,-132.35118,-202.68343,16.404877,6.3585105,-7.5735793,172.31331,1165000
|
| 35 |
+
0.65388334,127.05216,0.008854052,0.01958317,-10.288225,0.14390266,-126.96106,127.21565,2.662054,7.9065003,1.9545878,-129.38643,-204.8477,10.568554,4.9893517,-4.965696,111.33298,1170000
|
| 36 |
+
0.65561783,130.54114,0.008850987,0.0064637573,-11.769713,0.16935171,-130.43695,130.71696,2.807752,10.909976,1.8020799,-132.77983,-203.77383,13.717728,4.137025,-4.4331803,136.76862,1175000
|
| 37 |
+
0.6428333,126.00345,0.008959968,0.005531757,-11.882614,0.17874773,-125.89698,126.18773,2.882508,6.9471164,2.7062669,-128.91145,-201.24953,9.829624,0.91137815,-1.3622543,95.32741,1180000
|
| 38 |
+
0.6323903,123.80432,0.008797768,-0.021070607,-14.894995,0.17445897,-123.67328,123.95771,3.4094124,11.554057,-4.6875105,-127.09167,-204.56668,14.9634695,1.6218823,-1.7460337,122.47629,1185000
|
| 39 |
+
0.6390684,125.59163,0.008802808,-0.01169949,-13.829063,0.1422596,-125.469894,125.72219,6.0784597,13.713409,-11.053524,-128.1754,-202.93205,19.79187,4.6216,-5.3881717,209.31912,1190000
|
| 40 |
+
0.64209855,125.03865,0.008843326,-0.0031213118,-12.852957,0.17306283,-124.92498,125.208595,3.120889,12.012288,-1.3130747,-127.801735,-204.46663,15.133177,5.682155,-4.559839,153.46265,1195000
|
| 41 |
+
0.639845,125.57135,0.008710562,-0.0017355898,-12.699251,0.1507714,-125.460724,125.72039,3.2449036,11.044777,-2.1551902,-129.29973,-203.25385,14.2896805,3.5389664,-1.7415601,118.15797,1200000
|
| 42 |
+
0.6365927,123.513885,0.008850227,-0.013229156,-13.9947815,0.13717224,-123.390045,123.637825,5.272592,9.120862,1.5905051,-126.579735,-197.11165,14.393454,3.3959823,-3.4227388,160.44345,1205000
|
| 43 |
+
0.6377818,126.26075,0.008581363,-0.0038449492,-12.948058,0.16699764,-126.14963,126.423904,3.2589996,12.157851,-5.4255233,-128.64915,-200.31987,15.416851,2.7532537,-2.9979026,132.21031,1210000
|
| 44 |
+
0.64191145,125.2381,0.008487448,-0.0009835822,-12.615887,0.19271159,-125.13101,125.429825,2.847297,7.25464,-4.5831203,-127.806175,-202.49307,10.101937,1.7426533,-1.3942971,123.19255,1215000
|
| 45 |
+
0.6442653,122.16271,0.008483009,0.0032995099,-12.111045,0.19857192,-122.05997,122.36458,5.7100224,13.719977,-6.751171,-125.046326,-200.3074,19.43,6.008419,-5.6346292,247.12329,1220000
|
| 46 |
+
0.63809055,120.153564,0.008549256,0.008832987,-11.466812,0.17138883,-120.05553,120.333786,6.3368998,14.133936,-1.2633395,-123.53754,-203.11551,20.470837,1.7265916,-1.5316513,160.27095,1225000
|
| 47 |
+
0.64832115,123.75131,0.00851894,0.0072635575,-11.647364,0.19047374,-123.652084,123.94905,4.8593974,9.749782,-8.255757,-126.80877,-202.2139,14.609179,1.4506383,-1.3270575,126.69564,1230000
|
| 48 |
+
0.64333874,123.90573,0.00867035,0.0037379852,-12.068877,0.19873086,-123.80109,124.1082,8.692974,10.450952,-6.800746,-126.41674,-201.64906,19.143925,3.6231515,-6.001799,257.29578,1235000
|
| 49 |
+
0.64641243,120.812515,0.008614642,0.0106301,-11.266043,0.1674346,-120.71547,120.99058,3.0775013,10.436999,2.9849367,-123.97329,-204.82623,13.514501,4.078586,-2.9906776,135.68394,1240000
|
| 50 |
+
0.63434446,123.53998,0.008458104,-0.011317373,-13.838051,0.17098293,-123.422935,123.699646,4.8024125,10.068221,-5.464667,-126.662865,-202.21553,14.870634,5.533489,-5.5058017,170.53964,1245000
|
| 51 |
+
0.64390785,112.63048,0.0084747905,0.017908752,-10.386821,0.15335074,-112.54245,112.801735,4.2674394,10.7258,-1.962584,-116.05459,-202.04427,14.993238,2.3802266,-2.3485296,158.86298,1250000
|
| 52 |
+
0.64503086,125.545006,0.00843565,-0.0024837225,-12.794432,0.18797176,-125.43708,125.73049,9.915013,12.713843,-5.4828587,-128.79488,-201.61841,22.628857,5.254665,-6.7980423,231.11667,1255000
|
| 53 |
+
0.6377623,121.95765,0.008362758,-0.00981207,-13.6733055,0.16554749,-121.84331,122.11339,7.838669,15.225031,0.82913685,-125.13714,-197.80081,23.0637,10.601127,-9.955818,316.13382,1260000
|
| 54 |
+
0.6364712,121.50835,0.008628652,0.0036475118,-12.077279,0.14906493,-121.404144,121.66106,3.6728635,8.627863,-2.7202306,-124.20597,-203.62886,12.300726,2.995927,-2.7178357,140.22125,1265000
|
| 55 |
+
0.6384205,122.24304,0.008649204,0.001405103,-12.337545,0.15509467,-122.13632,122.39954,4.996223,12.109792,-2.7970958,-124.68972,-202.11456,17.106014,2.5861683,-2.3071039,187.39102,1270000
|
| 56 |
+
0.6389597,118.99133,0.008594107,0.005971525,-11.8051605,0.20636079,-118.88987,119.20367,3.1167715,11.405807,-5.5785055,-121.33942,-203.35966,14.522578,2.3739934,-1.6800555,130.84299,1275000
|
| 57 |
+
0.6359179,123.08945,0.008521955,-0.009002596,-13.5564,0.19083732,-122.97392,123.27128,4.358337,18.70556,3.1824603,-127.05816,-200.75018,23.063898,14.361351,-15.372471,229.92308,1280000
|
| 58 |
+
0.6419461,118.11688,0.008566657,0.009389806,-11.403913,0.16377495,-118.019196,118.29005,3.9648106,9.125285,0.15734282,-120.35874,-202.1696,13.0900955,1.6499809,-2.2292151,138.6709,1285000
|
| 59 |
+
0.63882256,112.715324,0.008548469,-0.0071785226,-13.339744,0.16356003,-112.60129,112.871704,4.638349,12.575909,3.5655165,-115.871376,-200.3826,17.214258,3.0247793,-2.6979148,161.75012,1290000
|
| 60 |
+
0.6424936,117.54994,0.008566485,0.010061585,-11.325471,0.18161687,-117.45293,117.74162,3.9961832,13.665807,3.401253,-120.256996,-201.92415,17.66199,5.090977,-5.0399137,173.90207,1295000
|
| 61 |
+
0.64270675,119.7292,0.008463951,-0.0022989605,-12.771618,0.1723569,-119.6211,119.89926,3.6395497,15.300061,4.845348,-122.97654,-196.39244,18.939611,4.640162,-4.2943377,210.31013,1300000
|
| 62 |
+
0.645325,121.60801,0.0083509665,0.0101601,-11.283362,0.15814507,-121.51379,121.77631,3.8809152,8.985576,4.098552,-124.499565,-200.29033,12.866491,1.5339854,-0.9207981,110.86883,1305000
|
| 63 |
+
0.6478857,120.922134,0.008460251,0.0055018063,-11.849688,0.16526932,-120.821884,121.0929,11.982508,14.533193,0.9592593,-124.13686,-200.07486,26.515701,7.859707,-8.004476,382.2781,1310000
|
| 64 |
+
0.6379398,118.120224,0.008483009,0.019180866,-10.238908,0.15787676,-118.03337,118.29728,4.564119,9.470704,-5.4410324,-120.669876,-198.38023,14.034822,1.2594509,-1.7199771,151.67752,1315000
|
| 65 |
+
0.63231796,118.41519,0.008654213,-0.013166638,-14.021414,0.14538072,-118.29385,118.5474,5.9773026,14.172032,-7.497801,-121.41494,-193.85854,20.149334,5.8131456,-3.9362595,208.99655,1320000
|
| 66 |
+
0.6375815,118.18234,0.008469368,-0.0036455786,-12.930443,0.15901148,-118.07283,118.33771,3.804334,13.431457,-2.1490757,-120.77998,-203.72165,17.23579,8.685775,-9.09581,179.94495,1325000
|
| 67 |
+
0.6379457,117.34464,0.008688634,0.0032942658,-12.120853,0.165101,-117.23933,117.51304,4.3795476,15.701273,-2.8713224,-119.50265,-203.27878,20.08082,1.4432031,-2.6795182,180.13635,1330000
|
| 68 |
+
0.63924766,120.284996,0.008468456,-0.001299097,-12.653404,0.19148558,-120.17784,120.47518,5.8742166,12.139681,-1.4999378,-122.95701,-201.67087,18.013897,2.3578143,-2.1283352,184.82932,1335000
|
| 69 |
+
0.64267373,121.050995,0.008231669,0.0088841645,-11.420733,0.16929322,-120.956985,121.22917,4.8664274,10.29299,-1.9322164,-124.02047,-196.72676,15.159417,5.69005,-6.505579,197.15292,1340000
|
| 70 |
+
0.63940036,124.813934,0.008588777,-0.011172677,-13.800846,0.17148969,-124.695404,124.97425,6.6876817,11.79515,-5.056322,-127.91778,-199.87653,18.482832,3.2305074,-3.2951133,154.86705,1345000
|
| 71 |
+
0.64167345,112.08322,0.008302412,0.010813034,-11.197603,0.16848129,-111.99026,112.26251,3.9780164,10.461127,4.622429,-113.81133,-201.26454,14.439144,3.3838787,-3.665567,149.76682,1350000
|
| 72 |
+
0.65090865,115.87819,0.0084658675,0.010205697,-11.294489,0.19894356,-115.78258,116.08734,7.0498843,10.017176,-2.9643302,-118.21453,-199.08992,17.06706,1.3811994,-2.5185146,140.4136,1355000
|
| 73 |
+
0.64304596,112.37104,0.008471375,0.00957541,-11.369675,0.1457988,-112.274734,112.52641,5.3214355,12.3923435,0.44466034,-115.12563,-200.91249,17.71378,4.2721434,-5.222407,198.55353,1360000
|
| 74 |
+
0.6387522,118.62284,0.008457975,-0.019442802,-14.798754,0.16256729,-118.49767,118.76597,3.9437203,14.712496,-1.6654229,-121.63851,-206.41031,18.656216,4.09527,-4.5309825,175.78758,1365000
|
| 75 |
+
0.6456484,114.77827,0.008308527,0.003009323,-12.137803,0.18477058,-114.677414,114.96604,5.7419357,11.320409,6.6998367,-117.58404,-201.4152,17.062344,5.748235,-5.339521,265.34454,1370000
|
| 76 |
+
0.6378013,114.16199,0.00816541,-0.0070461407,-13.362926,0.14416456,-114.05287,114.2991,3.6956613,22.404892,0.10665945,-117.61509,-205.22922,26.100554,6.600313,-6.155339,191.74365,1375000
|
| 77 |
+
0.6459477,114.38164,0.008185536,0.010746435,-11.187143,0.124752715,-114.29007,114.51714,4.681916,13.739982,-5.445271,-116.909355,-201.98363,18.421898,1.9464821,-2.240349,160.58154,1380000
|
| 78 |
+
0.6445333,115.26684,0.008436281,-0.006832273,-13.309868,0.14616936,-115.15456,115.40617,3.4809537,9.775042,-2.5053573,-118.42301,-201.33513,13.255995,0.8097689,-0.7310865,109.825516,1385000
|
| 79 |
+
0.6320904,118.525,0.008313869,-0.015282939,-14.338246,0.13292366,-118.405785,118.64265,5.633813,14.853152,-3.7496064,-121.652016,-201.20619,20.486965,3.667048,-3.7088795,240.86015,1390000
|
| 80 |
+
0.6341433,115.41601,0.00833085,-0.008510223,-13.521531,0.15638202,-115.30336,115.56388,4.4898973,12.76034,-2.5649076,-118.18115,-197.46117,17.250237,4.356512,-4.2793927,182.92776,1395000
|
| 81 |
+
0.6449634,113.39052,0.008163576,0.0053331186,-11.846718,0.13563514,-113.29381,113.53149,4.549793,11.668037,-2.943189,-116.63705,-197.69258,16.21783,4.900224,-5.04923,176.61917,1400000
|
| 82 |
+
0.6458037,115.16055,0.008291592,0.009968033,-11.297814,0.13465148,-115.06688,115.305176,5.5485835,9.695594,-0.563121,-117.71999,-200.9672,15.244177,1.1296862,-1.6612698,130.34991,1405000
|
| 83 |
+
0.63218415,116.27744,0.008283597,-0.010190069,-13.73015,0.1707437,-116.16371,116.437996,4.516593,11.390043,3.7037055,-119.488525,-194.13121,15.906636,1.4770594,-1.4525577,158.77158,1410000
|
| 84 |
+
0.64072126,113.15425,0.008438083,-0.006715664,-13.295876,0.16714543,-113.04205,113.31468,12.210792,15.632541,-0.8360191,-115.784744,-195.87413,27.843332,3.5338476,-5.9131756,342.94904,1415000
|
| 85 |
+
0.6386226,115.450775,0.0083728805,-0.007773111,-13.428368,0.15366492,-115.33835,115.596664,3.2448585,11.966582,-2.115785,-118.21908,-200.26035,15.211441,2.4489152,-3.8340757,130.34662,1420000
|
| 86 |
+
0.64757687,112.40498,0.0082875835,0.0019464728,-12.265134,0.1555057,-112.30334,112.56243,5.1392417,11.615745,7.797314,-115.95095,-201.6697,16.754986,4.964534,-4.6030493,179.96808,1425000
|
| 87 |
+
0.6520716,114.23018,0.008327574,0.0149779515,-10.701403,0.13902606,-114.14107,114.38418,4.8725886,13.973075,5.479182,-117.206055,-204.58499,18.845663,5.7739096,-3.6685035,250.10512,1430000
|
| 88 |
+
0.6499517,114.815445,0.008397266,0.024186827,-9.6196785,0.1572241,-114.734665,114.99686,6.1431,10.785691,9.1892805,-116.882256,-200.15195,16.928791,2.3317187,-3.5325522,192.5989,1435000
|
| 89 |
+
0.6375859,107.76594,0.008115615,-0.0032826655,-12.904488,0.14776699,-107.66121,107.91042,5.9325495,15.1486845,-2.0654595,-111.16676,-203.6631,21.081234,4.4551206,-3.905351,246.47073,1440000
|
| 90 |
+
0.63675565,117.264755,0.008218004,-0.009037974,-13.599777,0.15862146,-117.15299,117.41434,4.999454,13.559099,2.59945,-120.30129,-201.97122,18.558554,3.370185,-3.5824456,207.18903,1445000
|
| 91 |
+
0.6420816,109.15242,0.008316058,0.0060964855,-11.766902,0.1491107,-109.054565,109.307625,5.317029,15.136037,2.8440726,-112.24021,-201.54616,20.453066,4.0835447,-4.414639,255.98898,1450000
|
| 92 |
+
0.63789666,115.18889,0.008059769,-0.0048187086,-13.097872,0.15004465,-115.08333,115.334114,9.9313965,12.84404,0.93658507,-118.77798,-199.78664,22.775436,3.2961953,-3.0255702,203.02255,1455000
|
| 93 |
+
0.65320647,113.06468,0.008223642,0.003284144,-12.100646,0.14753109,-112.965164,113.21549,7.130184,11.4464445,-1.8999853,-115.73754,-197.84517,18.57663,3.4193685,-5.001981,234.15259,1460000
|
| 94 |
+
0.63703895,114.537476,0.008075006,-0.008281838,-13.525614,0.13240968,-114.42825,114.6616,3.9057863,14.351865,-2.7221718,-117.0071,-199.36969,18.25765,3.6481392,-3.2062519,162.30798,1465000
|
| 95 |
+
0.6479511,110.243645,0.008303327,0.0015585921,-12.312293,0.13051736,-110.14142,110.37572,5.964334,11.3368845,2.9748137,-113.16431,-200.42761,17.301218,2.6076434,-2.8435645,155.75356,1470000
|
| 96 |
+
0.64085615,114.12944,0.008219062,0.009555784,-11.337363,0.13872507,-114.036255,114.27772,4.510007,16.413332,4.231467,-116.95464,-201.2083,20.92334,5.6581864,-4.115401,220.28476,1475000
|
| 97 |
+
0.63489974,115.0514,0.008079085,-0.015721159,-14.445909,0.1431398,-114.93469,115.17882,4.748133,15.099256,3.3816657,-118.35817,-200.3992,19.84739,1.9742584,-1.7815018,176.95139,1480000
|
| 98 |
+
0.6381157,112.236015,0.00825708,-0.00018435145,-12.522326,0.12792695,-112.132614,112.36376,5.443579,14.448076,-0.11809485,-114.08894,-199.83012,19.891655,3.4171395,-3.9279017,232.76663,1485000
|
| 99 |
+
0.63452584,109.78712,0.00816363,0.011003947,-11.152077,0.15117763,-109.696075,109.949295,3.9466782,11.68613,2.2374516,-111.75942,-199.57167,15.632808,10.596968,-10.831001,174.63707,1490000
|
| 100 |
+
0.6380096,105.72828,0.008215869,-0.0026068625,-12.817296,0.11779083,-105.62297,105.84346,8.83377,16.716166,-1.4239688,-108.58125,-202.38547,25.549934,4.6741896,-4.989168,218.33177,1495000
|
| 101 |
+
0.6370428,105.64186,0.008218272,-0.006745454,-13.320787,0.16893467,-105.532394,105.804054,6.3070335,16.137564,5.2815933,-108.39858,-204.39442,22.444597,4.4047685,-4.551241,314.36758,1500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/alpha,actor/alpha_loss,actor/entropy,actor/flow_loss,actor/q,actor/total_loss,critic/critic_loss,critic/distill_loss,critic/q_max,critic/q_mean,critic/q_min,critic/total_loss,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.6464956,151.57722,0.007163675,0.0030462234,-12.074768,0.17292589,-151.49072,151.7532,1.3128544,3.7949963,-70.795906,-154.47537,-193.89467,5.1078506,3.1127567,-2.949452,76.30099,1005000
|
| 3 |
+
0.6485105,146.79274,0.0076541477,-0.0065934774,-13.361425,0.16756466,-146.69046,146.95372,1.5746807,5.1706023,-41.557182,-149.52043,-191.74504,6.745283,3.3696132,-4.8575883,88.63003,1010000
|
| 4 |
+
0.64525586,147.00572,0.007770758,-0.0091342665,-13.675467,0.17948562,-146.89944,147.17607,2.4174645,5.5621743,-41.01098,-149.57582,-193.16957,7.979639,1.3709776,-1.5047313,71.079346,1015000
|
| 5 |
+
0.63883394,144.54778,0.008655294,-0.009785089,-13.630532,0.18681526,-144.42981,144.72481,2.3234909,6.1018195,-44.51125,-148.00513,-200.11287,8.42531,3.4827356,-2.6060915,73.25749,1020000
|
| 6 |
+
0.6435777,139.33673,0.008913718,-0.0021352523,-12.739547,0.20421615,-139.22318,139.53882,1.8558857,7.855736,-22.038013,-142.44089,-199.51778,9.711621,3.1024864,-3.0871446,89.08097,1025000
|
| 7 |
+
0.64866555,135.86174,0.009273562,0.007008288,-11.744272,0.16436714,-135.75282,136.03311,3.3357475,6.2067666,-20.808237,-138.5915,-197.19006,9.542514,1.0498705,-1.0992802,83.02554,1030000
|
| 8 |
+
0.649019,136.32335,0.009138469,0.0039164717,-12.07143,0.18875074,-136.21303,136.51602,3.4171937,10.153538,-23.086048,-139.17169,-195.6537,13.570731,5.2551436,-4.7140436,144.98236,1035000
|
| 9 |
+
0.6393231,134.4324,0.009306475,-0.022307223,-14.896957,0.13545766,-134.29376,134.54555,4.080291,9.577062,-19.443583,-138.30533,-201.1646,13.657352,2.852514,-2.9530969,112.93753,1040000
|
| 10 |
+
0.64937866,135.09111,0.009450281,0.0049868454,-11.972307,0.1760129,-134.97797,135.27211,1.999966,5.074394,-13.707406,-137.73552,-196.076,7.0743604,4.4575896,-4.349462,88.345764,1045000
|
| 11 |
+
0.64400387,135.94951,0.009125749,0.00019272776,-12.478881,0.18479623,-135.83563,136.1345,3.0653298,7.7147174,-9.577094,-138.78268,-197.03235,10.780047,0.88452595,-0.87104815,106.573944,1050000
|
| 12 |
+
0.64533204,134.44623,0.009007195,-0.005250217,-13.082891,0.18030345,-134.32838,134.62128,4.1405897,7.588472,-7.7217517,-138.22826,-198.6875,11.729061,2.0673459,-2.0582304,83.56644,1055000
|
| 13 |
+
0.636829,133.14493,0.008968328,-0.015689613,-14.249447,0.17570888,-133.01714,133.30495,2.7620275,9.705306,-29.735945,-137.09244,-202.00311,12.467334,7.023451,-6.65542,144.72197,1060000
|
| 14 |
+
0.6424235,132.41772,0.0093809115,-0.023239965,-14.977367,0.17354581,-132.27724,132.56802,2.012982,9.585312,-17.369453,-135.43277,-201.27684,11.598293,4.071946,-4.0390773,119.737495,1065000
|
| 15 |
+
0.64226645,128.78539,0.009493685,-0.0052063907,-13.048406,0.19711253,-128.66151,128.9773,2.4989467,8.273597,-21.812529,-131.59843,-199.42223,10.772543,2.291885,-2.786441,100.447395,1070000
|
| 16 |
+
0.6494754,132.58534,0.009366402,-0.003478368,-12.8713665,0.19981475,-132.46478,132.78168,2.4093106,10.638217,-7.313128,-135.82703,-202.58841,13.047527,8.683023,-8.241741,156.12833,1075000
|
| 17 |
+
0.6391464,132.66927,0.009232,-0.0072721234,-13.287708,0.17731173,-132.5466,132.8393,3.7323816,10.33302,-9.757318,-136.00179,-201.96973,14.065402,8.590516,-5.1886845,150.99756,1080000
|
| 18 |
+
0.64403164,131.04622,0.009804857,-0.00083475973,-12.585137,0.18893978,-130.92282,131.23431,5.302259,7.8610206,-4.65475,-133.72044,-200.44604,13.16328,2.188338,-2.0905042,124.93063,1085000
|
| 19 |
+
0.6405302,130.4898,0.009314617,-0.013506362,-13.950018,0.1624625,-130.35986,130.63876,5.47509,8.86723,-4.94899,-133.30392,-197.39832,14.34232,2.5606823,-3.241087,127.28847,1090000
|
| 20 |
+
0.642231,128.53061,0.0091807125,0.00983672,-11.428545,0.15545717,-128.42569,128.6959,4.0513597,7.3872504,-7.3206973,-131.25467,-196.49045,11.43861,4.312066,-4.5787525,112.990036,1095000
|
| 21 |
+
0.63821286,125.3012,0.009375393,-0.0011153272,-12.618963,0.17982708,-125.1829,125.47991,3.3594525,16.832909,-10.902427,-128.49922,-201.95685,20.192362,12.081791,-11.287716,222.06155,1100000
|
| 22 |
+
0.6391037,129.383,0.009236451,-0.01274685,-13.880059,0.1843239,-129.2548,129.55458,3.482558,11.127075,-17.885136,-133.7312,-196.6523,14.609633,2.169407,-1.9778278,134.06787,1105000
|
| 23 |
+
0.6378062,128.66994,0.009167755,-0.015629072,-14.204787,0.16459247,-128.53972,128.81891,2.488557,9.1795,-7.582003,-131.70236,-199.71085,11.6680565,5.7105875,-5.259641,104.23355,1110000
|
| 24 |
+
0.6373791,125.73598,0.009174248,-0.004175306,-12.9551115,0.13900429,-125.61713,125.87081,2.6657567,13.092148,0.45087546,-129.28801,-198.20631,15.757904,7.525411,-8.492876,163.36597,1115000
|
| 25 |
+
0.6406654,127.259224,0.00898818,0.008359645,-11.569929,0.1835387,-127.155235,127.451126,2.2040398,13.830764,-5.3187113,-130.4257,-200.84705,16.034803,5.974059,-5.3755093,124.958145,1120000
|
| 26 |
+
0.6325392,132.24692,0.00901013,-0.017898234,-14.486457,0.19923258,-132.11641,132.42825,5.006565,8.807695,-9.609513,-135.89394,-199.02777,13.8142605,2.5000587,-2.5419643,149.8818,1125000
|
| 27 |
+
0.64280957,129.91394,0.0093098255,-0.007008943,-13.252854,0.16812113,-129.79056,130.07506,3.2459145,9.242699,-11.305132,-133.42838,-198.78586,12.488613,2.7497218,-2.8461416,128.08379,1130000
|
| 28 |
+
0.6360216,126.08401,0.008981415,-0.014331877,-14.095726,0.1821321,-125.95741,126.2518,3.9134774,9.082964,1.7933187,-130.18504,-201.86671,12.996441,3.8123417,-3.6377184,136.441,1135000
|
| 29 |
+
0.636382,124.70767,0.008865839,-0.00035969785,-12.540571,0.18880431,-124.59649,124.89612,4.050621,8.832672,-6.534545,-128.21623,-196.91035,12.883293,2.8421605,-2.2754269,130.32579,1140000
|
| 30 |
+
0.6504776,128.10019,0.008851974,0.007689001,-11.63138,0.16067816,-127.99723,128.26855,3.6161458,10.093371,-2.3105562,-130.68279,-200.06606,13.7095175,6.768597,-5.4132333,165.2433,1145000
|
| 31 |
+
0.64407223,128.86893,0.009051435,0.0006959043,-12.423117,0.15228572,-128.75647,129.02191,2.9644039,8.396022,-2.6708305,-131.18652,-202.96336,11.360426,3.1548195,-2.3944194,109.14513,1150000
|
| 32 |
+
0.6422238,126.62654,0.009084243,0.0018990714,-12.290949,0.18313959,-126.51488,126.81158,3.7675316,13.460883,-5.232151,-129.2733,-201.30688,17.228415,4.1794944,-3.6322865,206.66385,1155000
|
| 33 |
+
0.6417494,128.65085,0.009113943,0.007644988,-11.661177,0.19036144,-128.54456,128.84886,6.00014,10.239601,-10.139838,-131.6443,-202.76094,16.239742,2.317663,-4.1540713,226.0728,1160000
|
| 34 |
+
0.63586605,129.32718,0.009144476,-0.015846755,-14.232932,0.199867,-129.19702,129.51118,3.888094,12.516783,-1.3985913,-132.35118,-202.68343,16.404877,6.3585105,-7.5735793,172.31331,1165000
|
| 35 |
+
0.65388334,127.05216,0.008854052,0.01958317,-10.288225,0.14390266,-126.96106,127.21565,2.662054,7.9065003,1.9545878,-129.38643,-204.8477,10.568554,4.9893517,-4.965696,111.33298,1170000
|
| 36 |
+
0.65561783,130.54114,0.008850987,0.0064637573,-11.769713,0.16935171,-130.43695,130.71696,2.807752,10.909976,1.8020799,-132.77983,-203.77383,13.717728,4.137025,-4.4331803,136.76862,1175000
|
| 37 |
+
0.6428333,126.00345,0.008959968,0.005531757,-11.882614,0.17874773,-125.89698,126.18773,2.882508,6.9471164,2.7062669,-128.91145,-201.24953,9.829624,0.91137815,-1.3622543,95.32741,1180000
|
| 38 |
+
0.6323903,123.80432,0.008797768,-0.021070607,-14.894995,0.17445897,-123.67328,123.95771,3.4094124,11.554057,-4.6875105,-127.09167,-204.56668,14.9634695,1.6218823,-1.7460337,122.47629,1185000
|
| 39 |
+
0.6390684,125.59163,0.008802808,-0.01169949,-13.829063,0.1422596,-125.469894,125.72219,6.0784597,13.713409,-11.053524,-128.1754,-202.93205,19.79187,4.6216,-5.3881717,209.31912,1190000
|
| 40 |
+
0.64209855,125.03865,0.008843326,-0.0031213118,-12.852957,0.17306283,-124.92498,125.208595,3.120889,12.012288,-1.3130747,-127.801735,-204.46663,15.133177,5.682155,-4.559839,153.46265,1195000
|
| 41 |
+
0.639845,125.57135,0.008710562,-0.0017355898,-12.699251,0.1507714,-125.460724,125.72039,3.2449036,11.044777,-2.1551902,-129.29973,-203.25385,14.2896805,3.5389664,-1.7415601,118.15797,1200000
|
| 42 |
+
0.6365927,123.513885,0.008850227,-0.013229156,-13.9947815,0.13717224,-123.390045,123.637825,5.272592,9.120862,1.5905051,-126.579735,-197.11165,14.393454,3.3959823,-3.4227388,160.44345,1205000
|
| 43 |
+
0.6377818,126.26075,0.008581363,-0.0038449492,-12.948058,0.16699764,-126.14963,126.423904,3.2589996,12.157851,-5.4255233,-128.64915,-200.31987,15.416851,2.7532537,-2.9979026,132.21031,1210000
|
| 44 |
+
0.64191145,125.2381,0.008487448,-0.0009835822,-12.615887,0.19271159,-125.13101,125.429825,2.847297,7.25464,-4.5831203,-127.806175,-202.49307,10.101937,1.7426533,-1.3942971,123.19255,1215000
|
| 45 |
+
0.6442653,122.16271,0.008483009,0.0032995099,-12.111045,0.19857192,-122.05997,122.36458,5.7100224,13.719977,-6.751171,-125.046326,-200.3074,19.43,6.008419,-5.6346292,247.12329,1220000
|
| 46 |
+
0.63809055,120.153564,0.008549256,0.008832987,-11.466812,0.17138883,-120.05553,120.333786,6.3368998,14.133936,-1.2633395,-123.53754,-203.11551,20.470837,1.7265916,-1.5316513,160.27095,1225000
|
| 47 |
+
0.64832115,123.75131,0.00851894,0.0072635575,-11.647364,0.19047374,-123.652084,123.94905,4.8593974,9.749782,-8.255757,-126.80877,-202.2139,14.609179,1.4506383,-1.3270575,126.69564,1230000
|
| 48 |
+
0.64333874,123.90573,0.00867035,0.0037379852,-12.068877,0.19873086,-123.80109,124.1082,8.692974,10.450952,-6.800746,-126.41674,-201.64906,19.143925,3.6231515,-6.001799,257.29578,1235000
|
| 49 |
+
0.64641243,120.812515,0.008614642,0.0106301,-11.266043,0.1674346,-120.71547,120.99058,3.0775013,10.436999,2.9849367,-123.97329,-204.82623,13.514501,4.078586,-2.9906776,135.68394,1240000
|
| 50 |
+
0.63434446,123.53998,0.008458104,-0.011317373,-13.838051,0.17098293,-123.422935,123.699646,4.8024125,10.068221,-5.464667,-126.662865,-202.21553,14.870634,5.533489,-5.5058017,170.53964,1245000
|
| 51 |
+
0.64390785,112.63048,0.0084747905,0.017908752,-10.386821,0.15335074,-112.54245,112.801735,4.2674394,10.7258,-1.962584,-116.05459,-202.04427,14.993238,2.3802266,-2.3485296,158.86298,1250000
|
| 52 |
+
0.64503086,125.545006,0.00843565,-0.0024837225,-12.794432,0.18797176,-125.43708,125.73049,9.915013,12.713843,-5.4828587,-128.79488,-201.61841,22.628857,5.254665,-6.7980423,231.11667,1255000
|
| 53 |
+
0.6377623,121.95765,0.008362758,-0.00981207,-13.6733055,0.16554749,-121.84331,122.11339,7.838669,15.225031,0.82913685,-125.13714,-197.80081,23.0637,10.601127,-9.955818,316.13382,1260000
|
| 54 |
+
0.6364712,121.50835,0.008628652,0.0036475118,-12.077279,0.14906493,-121.404144,121.66106,3.6728635,8.627863,-2.7202306,-124.20597,-203.62886,12.300726,2.995927,-2.7178357,140.22125,1265000
|
| 55 |
+
0.6384205,122.24304,0.008649204,0.001405103,-12.337545,0.15509467,-122.13632,122.39954,4.996223,12.109792,-2.7970958,-124.68972,-202.11456,17.106014,2.5861683,-2.3071039,187.39102,1270000
|
| 56 |
+
0.6389597,118.99133,0.008594107,0.005971525,-11.8051605,0.20636079,-118.88987,119.20367,3.1167715,11.405807,-5.5785055,-121.33942,-203.35966,14.522578,2.3739934,-1.6800555,130.84299,1275000
|
| 57 |
+
0.6359179,123.08945,0.008521955,-0.009002596,-13.5564,0.19083732,-122.97392,123.27128,4.358337,18.70556,3.1824603,-127.05816,-200.75018,23.063898,14.361351,-15.372471,229.92308,1280000
|
| 58 |
+
0.6419461,118.11688,0.008566657,0.009389806,-11.403913,0.16377495,-118.019196,118.29005,3.9648106,9.125285,0.15734282,-120.35874,-202.1696,13.0900955,1.6499809,-2.2292151,138.6709,1285000
|
| 59 |
+
0.63882256,112.715324,0.008548469,-0.0071785226,-13.339744,0.16356003,-112.60129,112.871704,4.638349,12.575909,3.5655165,-115.871376,-200.3826,17.214258,3.0247793,-2.6979148,161.75012,1290000
|
| 60 |
+
0.6424936,117.54994,0.008566485,0.010061585,-11.325471,0.18161687,-117.45293,117.74162,3.9961832,13.665807,3.401253,-120.256996,-201.92415,17.66199,5.090977,-5.0399137,173.90207,1295000
|
| 61 |
+
0.64270675,119.7292,0.008463951,-0.0022989605,-12.771618,0.1723569,-119.6211,119.89926,3.6395497,15.300061,4.845348,-122.97654,-196.39244,18.939611,4.640162,-4.2943377,210.31013,1300000
|
| 62 |
+
0.645325,121.60801,0.0083509665,0.0101601,-11.283362,0.15814507,-121.51379,121.77631,3.8809152,8.985576,4.098552,-124.499565,-200.29033,12.866491,1.5339854,-0.9207981,110.86883,1305000
|
| 63 |
+
0.6478857,120.922134,0.008460251,0.0055018063,-11.849688,0.16526932,-120.821884,121.0929,11.982508,14.533193,0.9592593,-124.13686,-200.07486,26.515701,7.859707,-8.004476,382.2781,1310000
|
| 64 |
+
0.6379398,118.120224,0.008483009,0.019180866,-10.238908,0.15787676,-118.03337,118.29728,4.564119,9.470704,-5.4410324,-120.669876,-198.38023,14.034822,1.2594509,-1.7199771,151.67752,1315000
|
| 65 |
+
0.63231796,118.41519,0.008654213,-0.013166638,-14.021414,0.14538072,-118.29385,118.5474,5.9773026,14.172032,-7.497801,-121.41494,-193.85854,20.149334,5.8131456,-3.9362595,208.99655,1320000
|
| 66 |
+
0.6375815,118.18234,0.008469368,-0.0036455786,-12.930443,0.15901148,-118.07283,118.33771,3.804334,13.431457,-2.1490757,-120.77998,-203.72165,17.23579,8.685775,-9.09581,179.94495,1325000
|
| 67 |
+
0.6379457,117.34464,0.008688634,0.0032942658,-12.120853,0.165101,-117.23933,117.51304,4.3795476,15.701273,-2.8713224,-119.50265,-203.27878,20.08082,1.4432031,-2.6795182,180.13635,1330000
|
| 68 |
+
0.63924766,120.284996,0.008468456,-0.001299097,-12.653404,0.19148558,-120.17784,120.47518,5.8742166,12.139681,-1.4999378,-122.95701,-201.67087,18.013897,2.3578143,-2.1283352,184.82932,1335000
|
| 69 |
+
0.64267373,121.050995,0.008231669,0.0088841645,-11.420733,0.16929322,-120.956985,121.22917,4.8664274,10.29299,-1.9322164,-124.02047,-196.72676,15.159417,5.69005,-6.505579,197.15292,1340000
|
| 70 |
+
0.63940036,124.813934,0.008588777,-0.011172677,-13.800846,0.17148969,-124.695404,124.97425,6.6876817,11.79515,-5.056322,-127.91778,-199.87653,18.482832,3.2305074,-3.2951133,154.86705,1345000
|
| 71 |
+
0.64167345,112.08322,0.008302412,0.010813034,-11.197603,0.16848129,-111.99026,112.26251,3.9780164,10.461127,4.622429,-113.81133,-201.26454,14.439144,3.3838787,-3.665567,149.76682,1350000
|
| 72 |
+
0.65090865,115.87819,0.0084658675,0.010205697,-11.294489,0.19894356,-115.78258,116.08734,7.0498843,10.017176,-2.9643302,-118.21453,-199.08992,17.06706,1.3811994,-2.5185146,140.4136,1355000
|
| 73 |
+
0.64304596,112.37104,0.008471375,0.00957541,-11.369675,0.1457988,-112.274734,112.52641,5.3214355,12.3923435,0.44466034,-115.12563,-200.91249,17.71378,4.2721434,-5.222407,198.55353,1360000
|
| 74 |
+
0.6387522,118.62284,0.008457975,-0.019442802,-14.798754,0.16256729,-118.49767,118.76597,3.9437203,14.712496,-1.6654229,-121.63851,-206.41031,18.656216,4.09527,-4.5309825,175.78758,1365000
|
| 75 |
+
0.6456484,114.77827,0.008308527,0.003009323,-12.137803,0.18477058,-114.677414,114.96604,5.7419357,11.320409,6.6998367,-117.58404,-201.4152,17.062344,5.748235,-5.339521,265.34454,1370000
|
| 76 |
+
0.6378013,114.16199,0.00816541,-0.0070461407,-13.362926,0.14416456,-114.05287,114.2991,3.6956613,22.404892,0.10665945,-117.61509,-205.22922,26.100554,6.600313,-6.155339,191.74365,1375000
|
| 77 |
+
0.6459477,114.38164,0.008185536,0.010746435,-11.187143,0.124752715,-114.29007,114.51714,4.681916,13.739982,-5.445271,-116.909355,-201.98363,18.421898,1.9464821,-2.240349,160.58154,1380000
|
| 78 |
+
0.6445333,115.26684,0.008436281,-0.006832273,-13.309868,0.14616936,-115.15456,115.40617,3.4809537,9.775042,-2.5053573,-118.42301,-201.33513,13.255995,0.8097689,-0.7310865,109.825516,1385000
|
| 79 |
+
0.6320904,118.525,0.008313869,-0.015282939,-14.338246,0.13292366,-118.405785,118.64265,5.633813,14.853152,-3.7496064,-121.652016,-201.20619,20.486965,3.667048,-3.7088795,240.86015,1390000
|
| 80 |
+
0.6341433,115.41601,0.00833085,-0.008510223,-13.521531,0.15638202,-115.30336,115.56388,4.4898973,12.76034,-2.5649076,-118.18115,-197.46117,17.250237,4.356512,-4.2793927,182.92776,1395000
|
| 81 |
+
0.6449634,113.39052,0.008163576,0.0053331186,-11.846718,0.13563514,-113.29381,113.53149,4.549793,11.668037,-2.943189,-116.63705,-197.69258,16.21783,4.900224,-5.04923,176.61917,1400000
|
| 82 |
+
0.6458037,115.16055,0.008291592,0.009968033,-11.297814,0.13465148,-115.06688,115.305176,5.5485835,9.695594,-0.563121,-117.71999,-200.9672,15.244177,1.1296862,-1.6612698,130.34991,1405000
|
| 83 |
+
0.63218415,116.27744,0.008283597,-0.010190069,-13.73015,0.1707437,-116.16371,116.437996,4.516593,11.390043,3.7037055,-119.488525,-194.13121,15.906636,1.4770594,-1.4525577,158.77158,1410000
|
| 84 |
+
0.64072126,113.15425,0.008438083,-0.006715664,-13.295876,0.16714543,-113.04205,113.31468,12.210792,15.632541,-0.8360191,-115.784744,-195.87413,27.843332,3.5338476,-5.9131756,342.94904,1415000
|
| 85 |
+
0.6386226,115.450775,0.0083728805,-0.007773111,-13.428368,0.15366492,-115.33835,115.596664,3.2448585,11.966582,-2.115785,-118.21908,-200.26035,15.211441,2.4489152,-3.8340757,130.34662,1420000
|
| 86 |
+
0.64757687,112.40498,0.0082875835,0.0019464728,-12.265134,0.1555057,-112.30334,112.56243,5.1392417,11.615745,7.797314,-115.95095,-201.6697,16.754986,4.964534,-4.6030493,179.96808,1425000
|
| 87 |
+
0.6520716,114.23018,0.008327574,0.0149779515,-10.701403,0.13902606,-114.14107,114.38418,4.8725886,13.973075,5.479182,-117.206055,-204.58499,18.845663,5.7739096,-3.6685035,250.10512,1430000
|
| 88 |
+
0.6499517,114.815445,0.008397266,0.024186827,-9.6196785,0.1572241,-114.734665,114.99686,6.1431,10.785691,9.1892805,-116.882256,-200.15195,16.928791,2.3317187,-3.5325522,192.5989,1435000
|
| 89 |
+
0.6375859,107.76594,0.008115615,-0.0032826655,-12.904488,0.14776699,-107.66121,107.91042,5.9325495,15.1486845,-2.0654595,-111.16676,-203.6631,21.081234,4.4551206,-3.905351,246.47073,1440000
|
| 90 |
+
0.63675565,117.264755,0.008218004,-0.009037974,-13.599777,0.15862146,-117.15299,117.41434,4.999454,13.559099,2.59945,-120.30129,-201.97122,18.558554,3.370185,-3.5824456,207.18903,1445000
|
| 91 |
+
0.6420816,109.15242,0.008316058,0.0060964855,-11.766902,0.1491107,-109.054565,109.307625,5.317029,15.136037,2.8440726,-112.24021,-201.54616,20.453066,4.0835447,-4.414639,255.98898,1450000
|
| 92 |
+
0.63789666,115.18889,0.008059769,-0.0048187086,-13.097872,0.15004465,-115.08333,115.334114,9.9313965,12.84404,0.93658507,-118.77798,-199.78664,22.775436,3.2961953,-3.0255702,203.02255,1455000
|
| 93 |
+
0.65320647,113.06468,0.008223642,0.003284144,-12.100646,0.14753109,-112.965164,113.21549,7.130184,11.4464445,-1.8999853,-115.73754,-197.84517,18.57663,3.4193685,-5.001981,234.15259,1460000
|
| 94 |
+
0.63703895,114.537476,0.008075006,-0.008281838,-13.525614,0.13240968,-114.42825,114.6616,3.9057863,14.351865,-2.7221718,-117.0071,-199.36969,18.25765,3.6481392,-3.2062519,162.30798,1465000
|
| 95 |
+
0.6479511,110.243645,0.008303327,0.0015585921,-12.312293,0.13051736,-110.14142,110.37572,5.964334,11.3368845,2.9748137,-113.16431,-200.42761,17.301218,2.6076434,-2.8435645,155.75356,1470000
|
| 96 |
+
0.64085615,114.12944,0.008219062,0.009555784,-11.337363,0.13872507,-114.036255,114.27772,4.510007,16.413332,4.231467,-116.95464,-201.2083,20.92334,5.6581864,-4.115401,220.28476,1475000
|
| 97 |
+
0.63489974,115.0514,0.008079085,-0.015721159,-14.445909,0.1431398,-114.93469,115.17882,4.748133,15.099256,3.3816657,-118.35817,-200.3992,19.84739,1.9742584,-1.7815018,176.95139,1480000
|
| 98 |
+
0.6381157,112.236015,0.00825708,-0.00018435145,-12.522326,0.12792695,-112.132614,112.36376,5.443579,14.448076,-0.11809485,-114.08894,-199.83012,19.891655,3.4171395,-3.9279017,232.76663,1485000
|
| 99 |
+
0.63452584,109.78712,0.00816363,0.011003947,-11.152077,0.15117763,-109.696075,109.949295,3.9466782,11.68613,2.2374516,-111.75942,-199.57167,15.632808,10.596968,-10.831001,174.63707,1490000
|
| 100 |
+
0.6380096,105.72828,0.008215869,-0.0026068625,-12.817296,0.11779083,-105.62297,105.84346,8.83377,16.716166,-1.4239688,-108.58125,-202.38547,25.549934,4.6741896,-4.989168,218.33177,1495000
|
| 101 |
+
0.6370428,105.64186,0.008218272,-0.006745454,-13.320787,0.16893467,-105.532394,105.804054,6.3070335,16.137564,5.2815933,-108.39858,-204.39442,22.444597,4.4047685,-4.551241,314.36758,1500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27e8655bf53f3cf68845860e307068ddd2e9084832588261eadb2090bba0238d
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03942aa23eea35529e8b4422621b04666be2e192dd2546428456ce04d241086f
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d301de6eb6322fd84904d5757a6262a470e4e215e638652cf9d244fb131f43f
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:15332136044d9d4a9e3c3ecd64830913210f14097989ad2e5b6d28c2e7def400
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:937052ff0e4c7a49a0b3be089f7ea90f31b3782c322994c23bf248d240ac8019
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dce426dd982d419a41e51776843f5b65b852a086b61ae3a3cad0bd1052e10f27
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c618310f547b111590079f46c646eec2aa3a15ddcea75052ff2722942a1a2468
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:140a417a6e464d18712233880d67b2dec1923412e0f2d3857631f2e29ea60667
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d342a818f9400df3630f2a8214e397374d2ae50518e4499bb70a2b7b725341c
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/params_1500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db68e0bcd54cd7b79ca4036905e52107728f6341dd2eb839cd6efbd73cc94b4a
|
| 3 |
+
size 326957888
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/dsrl/20260319_233535/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/w9njshu8
|