Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1150000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1200000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1250000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1300000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1350000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1400000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.03944106585958781,0.010951551183863194,-0.03890626863625167,0.02193431620104874,24.228930673386245,17.47799999999885,0.64,8682.42,-0.48,-540.56,347.56,1.1677243280410767,950000
|
| 3 |
+
0.0,0.0,-0.016454078678092513,-0.011432444778034859,-0.016434835240382917,-0.005665241751223759,30.224188174537538,12.995999999999508,0.82,24243.0,-0.24,-389.84,257.92,0.8911804628372192,1000000
|
| 4 |
+
0.0,0.0,-0.000512296937340202,-0.02322448319926973,-0.001107614498103114,-0.021793916812578036,34.99726867807401,10.16399999999985,1.0,36197.0,0.0,-294.54,201.28,0.7151017570495606,1050000
|
| 5 |
+
0.0,0.0,0.03185028694847118,-0.03400549557750653,0.03085300659801127,-0.04623708726406382,34.812326373585165,8.316999999999759,1.0,45454.84,0.0,-240.12,164.34,0.5945564556121826,1100000
|
| 6 |
+
0.0,0.0,0.011784493442112423,-0.03286198175559225,0.011308978246590062,-0.009826260149764458,34.97126587325053,8.193999999999658,0.98,54381.84,-0.04,-236.96,161.88,0.5836142444610596,1150000
|
| 7 |
+
0.0,0.0,0.021102003340687413,-0.0365353369118965,0.019754362631279908,-0.04200714963880849,34.73818400982454,8.300999999999648,0.98,63047.5,-0.02,-245.22,164.02,0.5934643983840943,1200000
|
| 8 |
+
0.0,0.0,0.022559802338538618,-0.047957703139550376,0.020939598944322887,-0.05284023556984499,35.74020720560284,7.338999999999666,1.0,70943.68,0.0,-203.36,144.78,0.5244375085830688,1250000
|
| 9 |
+
0.0,0.0,0.019019124156426266,-0.046045888523418045,0.017180015136950503,-0.050411817207970035,35.80620382744072,7.556999999999575,0.98,78663.94,-0.02,-217.12,149.14,0.5328059005737305,1300000
|
| 10 |
+
0.0,0.0,0.027810149333562587,-0.0521947669352374,0.026262484322791973,-0.0629219281005782,35.48085617030734,7.516999999999711,1.0,86286.94,0.0,-219.76,148.34,0.5299419498443604,1350000
|
| 11 |
+
0.0,0.0,0.01164892688108399,-0.03591399275911569,0.010308361102338669,-0.039355796482038304,34.46641384189337,8.50399999999966,0.98,94499.32,-0.02,-250.92,168.08,0.6014986753463745,1400000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.03944106585958781,0.010951551183863194,-0.03890626863625167,0.02193431620104874,24.228930673386245,17.47799999999885,0.64,8682.42,-0.48,-540.56,347.56,1.1677243280410767,950000
|
| 3 |
+
0.0,0.0,-0.016454078678092513,-0.011432444778034859,-0.016434835240382917,-0.005665241751223759,30.224188174537538,12.995999999999508,0.82,24243.0,-0.24,-389.84,257.92,0.8911804628372192,1000000
|
| 4 |
+
0.0,0.0,-0.000512296937340202,-0.02322448319926973,-0.001107614498103114,-0.021793916812578036,34.99726867807401,10.16399999999985,1.0,36197.0,0.0,-294.54,201.28,0.7151017570495606,1050000
|
| 5 |
+
0.0,0.0,0.03185028694847118,-0.03400549557750653,0.03085300659801127,-0.04623708726406382,34.812326373585165,8.316999999999759,1.0,45454.84,0.0,-240.12,164.34,0.5945564556121826,1100000
|
| 6 |
+
0.0,0.0,0.011784493442112423,-0.03286198175559225,0.011308978246590062,-0.009826260149764458,34.97126587325053,8.193999999999658,0.98,54381.84,-0.04,-236.96,161.88,0.5836142444610596,1150000
|
| 7 |
+
0.0,0.0,0.021102003340687413,-0.0365353369118965,0.019754362631279908,-0.04200714963880849,34.73818400982454,8.300999999999648,0.98,63047.5,-0.02,-245.22,164.02,0.5934643983840943,1200000
|
| 8 |
+
0.0,0.0,0.022559802338538618,-0.047957703139550376,0.020939598944322887,-0.05284023556984499,35.74020720560284,7.338999999999666,1.0,70943.68,0.0,-203.36,144.78,0.5244375085830688,1250000
|
| 9 |
+
0.0,0.0,0.019019124156426266,-0.046045888523418045,0.017180015136950503,-0.050411817207970035,35.80620382744072,7.556999999999575,0.98,78663.94,-0.02,-217.12,149.14,0.5328059005737305,1300000
|
| 10 |
+
0.0,0.0,0.027810149333562587,-0.0521947669352374,0.026262484322791973,-0.0629219281005782,35.48085617030734,7.516999999999711,1.0,86286.94,0.0,-219.76,148.34,0.5299419498443604,1350000
|
| 11 |
+
0.0,0.0,0.01164892688108399,-0.03591399275911569,0.010308361102338669,-0.039355796482038304,34.46641384189337,8.50399999999966,0.98,94499.32,-0.02,-250.92,168.08,0.6014986753463745,1400000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.18966179,6.7653995,-20.126276,-178.11469,-202.92091,1.6431085,-1.8655854,38.24298,905000
|
| 3 |
+
0.18578145,7.477689,-83.22344,-177.72717,-203.3036,0.6432909,-0.6410496,29.622086,910000
|
| 4 |
+
0.19692901,8.698405,-72.10777,-177.07178,-203.2007,0.32873407,-0.30973366,20.996105,915000
|
| 5 |
+
0.17013285,9.054554,-63.831528,-175.56255,-203.86385,0.3087135,-0.31753153,23.431908,920000
|
| 6 |
+
0.172735,10.83856,-57.797153,-172.64624,-202.46979,0.3237254,-0.3125539,21.555908,925000
|
| 7 |
+
0.17407195,19.260248,-58.483948,-172.32869,-203.31917,1.5385495,-1.3258097,44.282845,930000
|
| 8 |
+
0.18090695,15.310005,-58.466343,-170.50322,-203.01674,0.43596098,-0.309015,34.584084,935000
|
| 9 |
+
0.20529777,14.332511,-50.035126,-169.82698,-202.82964,0.34842628,-0.5162208,30.430597,940000
|
| 10 |
+
0.18358293,9.023501,-90.49739,-169.37503,-203.70975,0.3964815,-0.28057137,29.511843,945000
|
| 11 |
+
0.20256825,17.129393,-45.745117,-166.42369,-203.44432,0.49787417,-0.25722575,35.127563,950000
|
| 12 |
+
0.18285123,20.25358,-44.591343,-166.12444,-203.65419,0.9704574,-1.0938437,41.08338,955000
|
| 13 |
+
0.18907589,12.6300955,-13.341955,-164.28622,-203.7614,0.4330974,-0.41664279,33.178093,960000
|
| 14 |
+
0.19324552,16.14883,-40.531803,-164.0002,-204.94356,0.8801897,-0.83253056,39.90714,965000
|
| 15 |
+
0.20542364,31.180775,-20.04135,-158.15463,-204.23723,0.5540628,-0.5698024,52.332436,970000
|
| 16 |
+
0.17378373,18.005442,-39.71998,-161.27725,-205.27576,0.5684463,-0.59509176,42.107414,975000
|
| 17 |
+
0.17719296,15.847678,-13.145182,-159.67484,-203.38889,1.0835689,-1.0736346,56.330574,980000
|
| 18 |
+
0.18116891,21.572588,-4.1624527,-157.81749,-203.88383,2.2403352,-2.2724118,91.12161,985000
|
| 19 |
+
0.18645494,21.449448,-41.354538,-156.87137,-204.82465,1.0677905,-1.0572845,73.8971,990000
|
| 20 |
+
0.18522213,17.534863,-21.013788,-157.51114,-204.18983,1.3709271,-1.4008812,46.576218,995000
|
| 21 |
+
0.15818149,16.850538,-16.20519,-151.85481,-203.41533,0.6744793,-0.6710634,48.384827,1000000
|
| 22 |
+
0.1664196,23.95124,-35.391724,-157.24402,-204.29277,0.5188542,-0.6363758,54.97317,1005000
|
| 23 |
+
0.17085174,14.143054,-14.06295,-152.82396,-205.26453,0.44848546,-0.39803973,38.7817,1010000
|
| 24 |
+
0.18375774,20.474298,0.8385193,-149.58452,-204.53085,0.9625078,-1.1721357,60.06286,1015000
|
| 25 |
+
0.19389208,21.592514,-26.178839,-152.47856,-204.23634,0.68536776,-0.9390727,55.82074,1020000
|
| 26 |
+
0.1933236,16.414211,-26.508972,-153.63513,-203.21771,0.9311064,-0.9138135,51.151657,1025000
|
| 27 |
+
0.17648816,21.114164,-4.5305305,-152.07927,-204.85468,0.69814235,-0.5650126,52.807392,1030000
|
| 28 |
+
0.17980632,16.455885,3.5878756,-151.3574,-203.81378,1.4236696,-1.3832209,76.51,1035000
|
| 29 |
+
0.13024934,17.775324,-29.370283,-146.78136,-200.96695,1.0427796,-0.68198556,50.231415,1040000
|
| 30 |
+
0.17145303,23.644445,-4.746052,-145.8927,-203.92325,2.265358,-2.218687,101.10012,1045000
|
| 31 |
+
0.17266712,17.97437,-20.396284,-146.44165,-203.08308,0.51400924,-0.6492056,50.64456,1050000
|
| 32 |
+
0.15826833,15.804746,-4.4666247,-143.82994,-204.09157,0.9739423,-0.9438526,47.295036,1055000
|
| 33 |
+
0.16841012,18.827106,-17.95805,-150.54207,-204.47247,0.84246397,-1.0346713,59.066486,1060000
|
| 34 |
+
0.1749284,24.119877,-1.4558277,-146.99217,-204.71558,1.341043,-0.7528471,78.73086,1065000
|
| 35 |
+
0.18438336,13.998569,-8.787376,-144.45569,-205.23105,0.6875024,-1.1476943,55.313416,1070000
|
| 36 |
+
0.19444224,23.82794,-6.4940205,-148.74841,-204.19522,0.7739351,-0.7213713,50.742718,1075000
|
| 37 |
+
0.18684912,16.485378,2.0644536,-146.81766,-205.65263,0.5038934,-0.5593821,49.305374,1080000
|
| 38 |
+
0.17982545,14.2273245,-8.900905,-146.42581,-201.78365,0.7622176,-0.73159957,43.7922,1085000
|
| 39 |
+
0.15173486,12.815518,-15.899203,-144.46924,-205.08629,1.2746345,-1.4480327,73.05667,1090000
|
| 40 |
+
0.16680588,15.618423,0.7458807,-144.47078,-201.79413,1.2066892,-1.4692711,60.0987,1095000
|
| 41 |
+
0.17755131,18.583633,-1.4944447,-141.31638,-205.3619,0.55768824,-0.5592019,43.728043,1100000
|
| 42 |
+
0.17811257,22.339937,-1.2031765,-146.54776,-204.84966,1.2947464,-1.4122505,82.0036,1105000
|
| 43 |
+
0.15213689,18.199278,-16.50453,-146.4121,-204.03188,1.8539157,-1.6663227,65.092476,1110000
|
| 44 |
+
0.15412563,19.714024,-7.5301266,-143.01262,-205.30873,0.69826525,-0.8444862,54.45173,1115000
|
| 45 |
+
0.17219512,21.880974,-12.639673,-143.2178,-203.98312,0.5349717,-0.5043898,43.429443,1120000
|
| 46 |
+
0.20286341,16.449188,-23.990665,-138.75322,-202.4721,1.2379079,-1.741777,61.44374,1125000
|
| 47 |
+
0.17903654,15.322121,-12.184996,-143.9921,-204.72963,1.345032,-1.4817891,49.277878,1130000
|
| 48 |
+
0.18399072,12.217189,-3.8892384,-139.36166,-203.93509,0.547896,-0.46872187,46.854034,1135000
|
| 49 |
+
0.19633368,16.166677,0.9685967,-143.4053,-204.7286,0.7526735,-0.7575725,51.185116,1140000
|
| 50 |
+
0.18780988,23.15817,-12.203989,-140.8118,-206.58495,1.839274,-1.7409148,81.2856,1145000
|
| 51 |
+
0.15954559,15.835648,-2.688039,-133.84047,-204.14964,0.8554473,-0.62537277,48.845703,1150000
|
| 52 |
+
0.18219803,20.200058,1.3323915,-144.22533,-203.5371,0.7348884,-0.725095,64.45744,1155000
|
| 53 |
+
0.1878626,14.351596,2.916746,-139.77762,-205.86278,0.4859673,-0.38466582,39.930923,1160000
|
| 54 |
+
0.21281782,20.278189,2.4459367,-142.29922,-205.52757,1.7444717,-1.9571614,49.065403,1165000
|
| 55 |
+
0.14940876,19.937586,0.8626706,-138.52249,-204.45801,1.2208756,-1.0030751,57.04455,1170000
|
| 56 |
+
0.1648784,22.212929,-6.913545,-135.53287,-205.23424,0.88384,-0.8625692,53.243107,1175000
|
| 57 |
+
0.19732986,20.277973,-12.239784,-142.58476,-205.2713,0.654126,-0.61679375,59.13831,1180000
|
| 58 |
+
0.16233256,15.968183,0.7977252,-136.48044,-204.69936,4.064038,-3.8394744,80.92444,1185000
|
| 59 |
+
0.16069782,17.24055,-1.3626871,-134.72119,-204.03738,1.1260667,-0.8595922,55.2034,1190000
|
| 60 |
+
0.15968344,15.573676,2.676263,-136.35213,-206.45816,0.818334,-0.7807407,46.09977,1195000
|
| 61 |
+
0.14733833,15.992648,-3.1255825,-140.31352,-204.60075,1.4619527,-1.1057086,56.196037,1200000
|
| 62 |
+
0.14880987,13.228736,-7.17874,-137.18614,-204.56825,0.32066235,-0.35599577,34.432983,1205000
|
| 63 |
+
0.16506287,15.302955,-8.603916,-138.52464,-204.49088,0.86375076,-0.6668957,49.33357,1210000
|
| 64 |
+
0.17788559,23.639303,-3.131779,-135.5211,-203.35966,1.6010504,-0.5405533,68.15269,1215000
|
| 65 |
+
0.21585451,22.857025,-9.024269,-138.98189,-201.75662,1.3717732,-1.4120892,80.24815,1220000
|
| 66 |
+
0.19225226,19.850237,-8.977592,-138.28755,-205.00415,0.71532434,-0.65977156,64.8663,1225000
|
| 67 |
+
0.19589671,19.645966,3.060331,-133.09085,-205.04033,3.2060766,-1.2423942,64.944984,1230000
|
| 68 |
+
0.19416869,10.189251,2.5420659,-134.89156,-203.2502,0.7562388,-0.6809339,50.482002,1235000
|
| 69 |
+
0.19001108,17.561146,0.35603136,-137.55907,-205.3603,0.8963432,-1.0822905,61.068153,1240000
|
| 70 |
+
0.1834346,11.757024,-6.904485,-143.71594,-205.51091,0.6865231,-0.72172046,46.74719,1245000
|
| 71 |
+
0.16829522,18.535257,4.1067424,-131.93912,-204.89311,2.5548768,-2.543158,64.574295,1250000
|
| 72 |
+
0.18723561,13.435847,-4.2907147,-135.8025,-204.21709,1.317136,-1.1674777,57.6724,1255000
|
| 73 |
+
0.16211487,20.214573,3.138769,-129.41,-203.81099,0.83016413,-0.76781344,51.175514,1260000
|
| 74 |
+
0.16172963,22.126616,-0.90905166,-135.79607,-203.99023,0.7816759,-1.3213891,62.78894,1265000
|
| 75 |
+
0.13934624,12.977097,0.91940486,-132.04906,-204.02516,0.5118471,-0.461077,44.71924,1270000
|
| 76 |
+
0.2067027,26.363714,1.2019508,-132.76053,-204.58078,1.106244,-1.0971463,61.727486,1275000
|
| 77 |
+
0.18460377,8.913628,4.0454288,-131.46582,-202.8688,0.7758538,-0.8656192,41.436512,1280000
|
| 78 |
+
0.18247177,20.222433,-4.7243075,-135.16281,-203.41708,3.0583358,-2.3157718,77.414764,1285000
|
| 79 |
+
0.16811168,12.401019,-6.0972104,-133.84792,-204.05522,0.3684411,-0.33519515,35.31093,1290000
|
| 80 |
+
0.18681282,9.4927635,-5.3117023,-134.2708,-203.41776,1.5815449,-1.5798165,50.58082,1295000
|
| 81 |
+
0.16620468,14.965568,1.3483164,-130.37813,-202.11714,0.6709148,-0.6501946,48.12304,1300000
|
| 82 |
+
0.15152058,11.453309,2.39286,-133.31055,-204.18697,0.4198118,-0.6729851,49.442036,1305000
|
| 83 |
+
0.18171036,16.006989,6.1019444,-136.26785,-201.89294,0.5424408,-0.63604397,48.07852,1310000
|
| 84 |
+
0.15714678,13.572802,-2.2762518,-129.96504,-201.22127,1.1674874,-1.0309496,45.43833,1315000
|
| 85 |
+
0.1499154,12.515073,-0.4853516,-134.20976,-203.82965,0.7396925,-0.43500248,43.653004,1320000
|
| 86 |
+
0.15493341,22.520658,0.3087534,-128.32408,-204.43846,0.9323146,-1.6264292,78.256935,1325000
|
| 87 |
+
0.18568563,12.363844,-3.6269197,-127.864944,-203.2563,0.78956217,-0.89266914,47.150944,1330000
|
| 88 |
+
0.19432136,15.336352,1.0837134,-133.16577,-204.63611,1.4471616,-1.2871381,63.81024,1335000
|
| 89 |
+
0.19228105,20.825586,-11.578099,-127.441795,-204.28377,1.0599501,-0.5443374,60.30703,1340000
|
| 90 |
+
0.1682543,12.055411,-2.0422754,-131.04121,-201.41977,0.8014154,-0.82155347,39.45122,1345000
|
| 91 |
+
0.17165527,21.178057,-12.502699,-128.03438,-205.04521,1.5227485,-1.468615,59.45584,1350000
|
| 92 |
+
0.2017889,11.888599,-6.472643,-131.6687,-204.67348,0.4643479,-0.60227305,37.13265,1355000
|
| 93 |
+
0.17701411,15.525665,-10.992606,-129.4215,-205.04813,1.4845752,-1.2089874,60.08654,1360000
|
| 94 |
+
0.15271631,13.743464,-3.907232,-129.80183,-205.63962,1.3363987,-1.7984676,54.81939,1365000
|
| 95 |
+
0.18705332,22.866938,0.31807157,-128.36053,-203.76588,0.6902745,-0.7187773,53.184647,1370000
|
| 96 |
+
0.1594123,10.016909,-2.2965689,-129.70638,-203.65987,0.51202416,-0.49064383,36.153915,1375000
|
| 97 |
+
0.12423457,16.014067,2.3878918,-128.20413,-205.83711,0.8357486,-1.0570552,48.89298,1380000
|
| 98 |
+
0.15630981,17.020266,-4.8874407,-128.17052,-204.78407,1.2363224,-1.3578056,70.834625,1385000
|
| 99 |
+
0.15202,12.676305,6.641866,-123.36086,-204.08578,2.2171984,-2.2176073,55.980934,1390000
|
| 100 |
+
0.15710202,20.907286,1.7254207,-124.530846,-204.04941,0.62736285,-0.69745183,49.990177,1395000
|
| 101 |
+
0.14785576,19.811743,1.6807994,-122.87799,-203.47556,2.5076933,-2.5137196,78.811165,1400000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.18966179,6.7653995,-20.126276,-178.11469,-202.92091,1.6431085,-1.8655854,38.24298,905000
|
| 3 |
+
0.18578145,7.477689,-83.22344,-177.72717,-203.3036,0.6432909,-0.6410496,29.622086,910000
|
| 4 |
+
0.19692901,8.698405,-72.10777,-177.07178,-203.2007,0.32873407,-0.30973366,20.996105,915000
|
| 5 |
+
0.17013285,9.054554,-63.831528,-175.56255,-203.86385,0.3087135,-0.31753153,23.431908,920000
|
| 6 |
+
0.172735,10.83856,-57.797153,-172.64624,-202.46979,0.3237254,-0.3125539,21.555908,925000
|
| 7 |
+
0.17407195,19.260248,-58.483948,-172.32869,-203.31917,1.5385495,-1.3258097,44.282845,930000
|
| 8 |
+
0.18090695,15.310005,-58.466343,-170.50322,-203.01674,0.43596098,-0.309015,34.584084,935000
|
| 9 |
+
0.20529777,14.332511,-50.035126,-169.82698,-202.82964,0.34842628,-0.5162208,30.430597,940000
|
| 10 |
+
0.18358293,9.023501,-90.49739,-169.37503,-203.70975,0.3964815,-0.28057137,29.511843,945000
|
| 11 |
+
0.20256825,17.129393,-45.745117,-166.42369,-203.44432,0.49787417,-0.25722575,35.127563,950000
|
| 12 |
+
0.18285123,20.25358,-44.591343,-166.12444,-203.65419,0.9704574,-1.0938437,41.08338,955000
|
| 13 |
+
0.18907589,12.6300955,-13.341955,-164.28622,-203.7614,0.4330974,-0.41664279,33.178093,960000
|
| 14 |
+
0.19324552,16.14883,-40.531803,-164.0002,-204.94356,0.8801897,-0.83253056,39.90714,965000
|
| 15 |
+
0.20542364,31.180775,-20.04135,-158.15463,-204.23723,0.5540628,-0.5698024,52.332436,970000
|
| 16 |
+
0.17378373,18.005442,-39.71998,-161.27725,-205.27576,0.5684463,-0.59509176,42.107414,975000
|
| 17 |
+
0.17719296,15.847678,-13.145182,-159.67484,-203.38889,1.0835689,-1.0736346,56.330574,980000
|
| 18 |
+
0.18116891,21.572588,-4.1624527,-157.81749,-203.88383,2.2403352,-2.2724118,91.12161,985000
|
| 19 |
+
0.18645494,21.449448,-41.354538,-156.87137,-204.82465,1.0677905,-1.0572845,73.8971,990000
|
| 20 |
+
0.18522213,17.534863,-21.013788,-157.51114,-204.18983,1.3709271,-1.4008812,46.576218,995000
|
| 21 |
+
0.15818149,16.850538,-16.20519,-151.85481,-203.41533,0.6744793,-0.6710634,48.384827,1000000
|
| 22 |
+
0.1664196,23.95124,-35.391724,-157.24402,-204.29277,0.5188542,-0.6363758,54.97317,1005000
|
| 23 |
+
0.17085174,14.143054,-14.06295,-152.82396,-205.26453,0.44848546,-0.39803973,38.7817,1010000
|
| 24 |
+
0.18375774,20.474298,0.8385193,-149.58452,-204.53085,0.9625078,-1.1721357,60.06286,1015000
|
| 25 |
+
0.19389208,21.592514,-26.178839,-152.47856,-204.23634,0.68536776,-0.9390727,55.82074,1020000
|
| 26 |
+
0.1933236,16.414211,-26.508972,-153.63513,-203.21771,0.9311064,-0.9138135,51.151657,1025000
|
| 27 |
+
0.17648816,21.114164,-4.5305305,-152.07927,-204.85468,0.69814235,-0.5650126,52.807392,1030000
|
| 28 |
+
0.17980632,16.455885,3.5878756,-151.3574,-203.81378,1.4236696,-1.3832209,76.51,1035000
|
| 29 |
+
0.13024934,17.775324,-29.370283,-146.78136,-200.96695,1.0427796,-0.68198556,50.231415,1040000
|
| 30 |
+
0.17145303,23.644445,-4.746052,-145.8927,-203.92325,2.265358,-2.218687,101.10012,1045000
|
| 31 |
+
0.17266712,17.97437,-20.396284,-146.44165,-203.08308,0.51400924,-0.6492056,50.64456,1050000
|
| 32 |
+
0.15826833,15.804746,-4.4666247,-143.82994,-204.09157,0.9739423,-0.9438526,47.295036,1055000
|
| 33 |
+
0.16841012,18.827106,-17.95805,-150.54207,-204.47247,0.84246397,-1.0346713,59.066486,1060000
|
| 34 |
+
0.1749284,24.119877,-1.4558277,-146.99217,-204.71558,1.341043,-0.7528471,78.73086,1065000
|
| 35 |
+
0.18438336,13.998569,-8.787376,-144.45569,-205.23105,0.6875024,-1.1476943,55.313416,1070000
|
| 36 |
+
0.19444224,23.82794,-6.4940205,-148.74841,-204.19522,0.7739351,-0.7213713,50.742718,1075000
|
| 37 |
+
0.18684912,16.485378,2.0644536,-146.81766,-205.65263,0.5038934,-0.5593821,49.305374,1080000
|
| 38 |
+
0.17982545,14.2273245,-8.900905,-146.42581,-201.78365,0.7622176,-0.73159957,43.7922,1085000
|
| 39 |
+
0.15173486,12.815518,-15.899203,-144.46924,-205.08629,1.2746345,-1.4480327,73.05667,1090000
|
| 40 |
+
0.16680588,15.618423,0.7458807,-144.47078,-201.79413,1.2066892,-1.4692711,60.0987,1095000
|
| 41 |
+
0.17755131,18.583633,-1.4944447,-141.31638,-205.3619,0.55768824,-0.5592019,43.728043,1100000
|
| 42 |
+
0.17811257,22.339937,-1.2031765,-146.54776,-204.84966,1.2947464,-1.4122505,82.0036,1105000
|
| 43 |
+
0.15213689,18.199278,-16.50453,-146.4121,-204.03188,1.8539157,-1.6663227,65.092476,1110000
|
| 44 |
+
0.15412563,19.714024,-7.5301266,-143.01262,-205.30873,0.69826525,-0.8444862,54.45173,1115000
|
| 45 |
+
0.17219512,21.880974,-12.639673,-143.2178,-203.98312,0.5349717,-0.5043898,43.429443,1120000
|
| 46 |
+
0.20286341,16.449188,-23.990665,-138.75322,-202.4721,1.2379079,-1.741777,61.44374,1125000
|
| 47 |
+
0.17903654,15.322121,-12.184996,-143.9921,-204.72963,1.345032,-1.4817891,49.277878,1130000
|
| 48 |
+
0.18399072,12.217189,-3.8892384,-139.36166,-203.93509,0.547896,-0.46872187,46.854034,1135000
|
| 49 |
+
0.19633368,16.166677,0.9685967,-143.4053,-204.7286,0.7526735,-0.7575725,51.185116,1140000
|
| 50 |
+
0.18780988,23.15817,-12.203989,-140.8118,-206.58495,1.839274,-1.7409148,81.2856,1145000
|
| 51 |
+
0.15954559,15.835648,-2.688039,-133.84047,-204.14964,0.8554473,-0.62537277,48.845703,1150000
|
| 52 |
+
0.18219803,20.200058,1.3323915,-144.22533,-203.5371,0.7348884,-0.725095,64.45744,1155000
|
| 53 |
+
0.1878626,14.351596,2.916746,-139.77762,-205.86278,0.4859673,-0.38466582,39.930923,1160000
|
| 54 |
+
0.21281782,20.278189,2.4459367,-142.29922,-205.52757,1.7444717,-1.9571614,49.065403,1165000
|
| 55 |
+
0.14940876,19.937586,0.8626706,-138.52249,-204.45801,1.2208756,-1.0030751,57.04455,1170000
|
| 56 |
+
0.1648784,22.212929,-6.913545,-135.53287,-205.23424,0.88384,-0.8625692,53.243107,1175000
|
| 57 |
+
0.19732986,20.277973,-12.239784,-142.58476,-205.2713,0.654126,-0.61679375,59.13831,1180000
|
| 58 |
+
0.16233256,15.968183,0.7977252,-136.48044,-204.69936,4.064038,-3.8394744,80.92444,1185000
|
| 59 |
+
0.16069782,17.24055,-1.3626871,-134.72119,-204.03738,1.1260667,-0.8595922,55.2034,1190000
|
| 60 |
+
0.15968344,15.573676,2.676263,-136.35213,-206.45816,0.818334,-0.7807407,46.09977,1195000
|
| 61 |
+
0.14733833,15.992648,-3.1255825,-140.31352,-204.60075,1.4619527,-1.1057086,56.196037,1200000
|
| 62 |
+
0.14880987,13.228736,-7.17874,-137.18614,-204.56825,0.32066235,-0.35599577,34.432983,1205000
|
| 63 |
+
0.16506287,15.302955,-8.603916,-138.52464,-204.49088,0.86375076,-0.6668957,49.33357,1210000
|
| 64 |
+
0.17788559,23.639303,-3.131779,-135.5211,-203.35966,1.6010504,-0.5405533,68.15269,1215000
|
| 65 |
+
0.21585451,22.857025,-9.024269,-138.98189,-201.75662,1.3717732,-1.4120892,80.24815,1220000
|
| 66 |
+
0.19225226,19.850237,-8.977592,-138.28755,-205.00415,0.71532434,-0.65977156,64.8663,1225000
|
| 67 |
+
0.19589671,19.645966,3.060331,-133.09085,-205.04033,3.2060766,-1.2423942,64.944984,1230000
|
| 68 |
+
0.19416869,10.189251,2.5420659,-134.89156,-203.2502,0.7562388,-0.6809339,50.482002,1235000
|
| 69 |
+
0.19001108,17.561146,0.35603136,-137.55907,-205.3603,0.8963432,-1.0822905,61.068153,1240000
|
| 70 |
+
0.1834346,11.757024,-6.904485,-143.71594,-205.51091,0.6865231,-0.72172046,46.74719,1245000
|
| 71 |
+
0.16829522,18.535257,4.1067424,-131.93912,-204.89311,2.5548768,-2.543158,64.574295,1250000
|
| 72 |
+
0.18723561,13.435847,-4.2907147,-135.8025,-204.21709,1.317136,-1.1674777,57.6724,1255000
|
| 73 |
+
0.16211487,20.214573,3.138769,-129.41,-203.81099,0.83016413,-0.76781344,51.175514,1260000
|
| 74 |
+
0.16172963,22.126616,-0.90905166,-135.79607,-203.99023,0.7816759,-1.3213891,62.78894,1265000
|
| 75 |
+
0.13934624,12.977097,0.91940486,-132.04906,-204.02516,0.5118471,-0.461077,44.71924,1270000
|
| 76 |
+
0.2067027,26.363714,1.2019508,-132.76053,-204.58078,1.106244,-1.0971463,61.727486,1275000
|
| 77 |
+
0.18460377,8.913628,4.0454288,-131.46582,-202.8688,0.7758538,-0.8656192,41.436512,1280000
|
| 78 |
+
0.18247177,20.222433,-4.7243075,-135.16281,-203.41708,3.0583358,-2.3157718,77.414764,1285000
|
| 79 |
+
0.16811168,12.401019,-6.0972104,-133.84792,-204.05522,0.3684411,-0.33519515,35.31093,1290000
|
| 80 |
+
0.18681282,9.4927635,-5.3117023,-134.2708,-203.41776,1.5815449,-1.5798165,50.58082,1295000
|
| 81 |
+
0.16620468,14.965568,1.3483164,-130.37813,-202.11714,0.6709148,-0.6501946,48.12304,1300000
|
| 82 |
+
0.15152058,11.453309,2.39286,-133.31055,-204.18697,0.4198118,-0.6729851,49.442036,1305000
|
| 83 |
+
0.18171036,16.006989,6.1019444,-136.26785,-201.89294,0.5424408,-0.63604397,48.07852,1310000
|
| 84 |
+
0.15714678,13.572802,-2.2762518,-129.96504,-201.22127,1.1674874,-1.0309496,45.43833,1315000
|
| 85 |
+
0.1499154,12.515073,-0.4853516,-134.20976,-203.82965,0.7396925,-0.43500248,43.653004,1320000
|
| 86 |
+
0.15493341,22.520658,0.3087534,-128.32408,-204.43846,0.9323146,-1.6264292,78.256935,1325000
|
| 87 |
+
0.18568563,12.363844,-3.6269197,-127.864944,-203.2563,0.78956217,-0.89266914,47.150944,1330000
|
| 88 |
+
0.19432136,15.336352,1.0837134,-133.16577,-204.63611,1.4471616,-1.2871381,63.81024,1335000
|
| 89 |
+
0.19228105,20.825586,-11.578099,-127.441795,-204.28377,1.0599501,-0.5443374,60.30703,1340000
|
| 90 |
+
0.1682543,12.055411,-2.0422754,-131.04121,-201.41977,0.8014154,-0.82155347,39.45122,1345000
|
| 91 |
+
0.17165527,21.178057,-12.502699,-128.03438,-205.04521,1.5227485,-1.468615,59.45584,1350000
|
| 92 |
+
0.2017889,11.888599,-6.472643,-131.6687,-204.67348,0.4643479,-0.60227305,37.13265,1355000
|
| 93 |
+
0.17701411,15.525665,-10.992606,-129.4215,-205.04813,1.4845752,-1.2089874,60.08654,1360000
|
| 94 |
+
0.15271631,13.743464,-3.907232,-129.80183,-205.63962,1.3363987,-1.7984676,54.81939,1365000
|
| 95 |
+
0.18705332,22.866938,0.31807157,-128.36053,-203.76588,0.6902745,-0.7187773,53.184647,1370000
|
| 96 |
+
0.1594123,10.016909,-2.2965689,-129.70638,-203.65987,0.51202416,-0.49064383,36.153915,1375000
|
| 97 |
+
0.12423457,16.014067,2.3878918,-128.20413,-205.83711,0.8357486,-1.0570552,48.89298,1380000
|
| 98 |
+
0.15630981,17.020266,-4.8874407,-128.17052,-204.78407,1.2363224,-1.3578056,70.834625,1385000
|
| 99 |
+
0.15202,12.676305,6.641866,-123.36086,-204.08578,2.2171984,-2.2176073,55.980934,1390000
|
| 100 |
+
0.15710202,20.907286,1.7254207,-124.530846,-204.04941,0.62736285,-0.69745183,49.990177,1395000
|
| 101 |
+
0.14785576,19.811743,1.6807994,-122.87799,-203.47556,2.5076933,-2.5137196,78.811165,1400000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e2a8d2582d2e4cbfb0d47f08ef407af694674699184d62a18865953b0ef03cde
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:611c11c4edd8d35b99a1bb6f32c915dbc539e31b3042b97a43e2dec241693413
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78c43d8704346cd8c1e9a72e47021bb780f84e3841b77bad399087fcdfdb1769
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fcb34972ab0a3f26ece0696838044fb4de902a691b737d72a05830d14b1c1637
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cac5500bc6f113266dc68ea8f79a43e7aaef4f3e02d8f4c110ecdd89f16159f1
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d27f53fec60537cde453d9a76e829afe8994a16d1d339226d99eaaadaa7acf9b
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de336776f9f5637546e051059bc6cab724af5ec5441edf4bcff016abff8a8912
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33c558898eb0fda130a754d8f5ca3ba94274fc0783479d42e2b63d0f1e17c531
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_1400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55beab2b76e5cd7bfce0583f2b06a40fd8393d6bc76876ffbeb969de6a7fbba1
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d28b0987a5458761bccd9319f11fa01a42e608d28739070e7e45975b75f7d420
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_154231/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/z7kwyg2h
|