Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1150000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1200000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1250000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1300000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.04834808773306796,0.0024242952288087757,-0.04877495695374537,-0.011087034739438392,27.740988757496712,15.299999999999237,0.72,6967.92,-0.38,-474.26,304.0,1.4444676160812377,850000
|
| 3 |
+
0.0,0.0,-0.017262025915525527,-0.006300677028598212,-0.017284734144297285,-0.006855641727052645,32.12171920363137,11.17699999999964,0.96,21757.58,-0.04,-306.4,221.54,1.0344842433929444,900000
|
| 4 |
+
0.0,0.0,-0.0159671456073352,-0.023675515139856516,-0.016356022576918094,-0.024405166777818493,33.0580056117063,9.542999999999743,0.96,32305.04,-0.06,-278.58,188.86,0.9580865240097046,950000
|
| 5 |
+
0.0,0.0,-0.012241503111951263,-0.028171760479748117,-0.013032450206747901,-0.03407390250650832,35.096849679471376,9.163999999999556,0.94,41848.76,-0.06,-270.84,181.28,0.8595411682128906,1000000
|
| 6 |
+
0.0,0.0,-0.015289849056180319,-0.04174269420130647,-0.017076711818576295,-0.04455605328312581,35.7423327201537,8.564999999999593,0.98,51415.98,-0.02,-237.88,169.3,0.8489974021911622,1050000
|
| 7 |
+
0.0,0.0,-0.026454022284669202,-0.02047045320208188,-0.02783721216161655,-0.05984535760214319,35.52410436480693,8.001999999999628,1.0,59638.12,0.0,-231.38,158.04,0.7408837509155274,1100000
|
| 8 |
+
0.0,0.0,-0.02755107453147506,-0.04945286489869499,-0.02928695104086867,-0.0523090483566154,35.502013140483584,7.641999999999681,1.0,67804.98,0.0,-220.5,150.84,0.7186903429031372,1150000
|
| 9 |
+
0.0,0.0,-0.014854582031732986,-0.048864258186160095,-0.0168468803212466,-0.05380164840271906,35.441806167147114,7.804999999999537,1.0,75692.7,0.0,-228.5,154.1,0.7721294927597045,1200000
|
| 10 |
+
0.0,0.0,-0.013983927917195348,-0.045660203374221914,-0.015971225177941608,-0.05250781570232599,35.493595971043845,6.887999999999597,1.0,83097.74,0.0,-195.44,135.76,0.7025510549545289,1250000
|
| 11 |
+
0.0,0.0,-0.023434763581043072,-0.0373385093505252,-0.025249917933365163,-0.05404927162845681,35.718600596164556,7.035999999999632,1.0,90195.58,0.0,-200.04,138.72,0.6563148593902588,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.04834808773306796,0.0024242952288087757,-0.04877495695374537,-0.011087034739438392,27.740988757496712,15.299999999999237,0.72,6967.92,-0.38,-474.26,304.0,1.4444676160812377,850000
|
| 3 |
+
0.0,0.0,-0.017262025915525527,-0.006300677028598212,-0.017284734144297285,-0.006855641727052645,32.12171920363137,11.17699999999964,0.96,21757.58,-0.04,-306.4,221.54,1.0344842433929444,900000
|
| 4 |
+
0.0,0.0,-0.0159671456073352,-0.023675515139856516,-0.016356022576918094,-0.024405166777818493,33.0580056117063,9.542999999999743,0.96,32305.04,-0.06,-278.58,188.86,0.9580865240097046,950000
|
| 5 |
+
0.0,0.0,-0.012241503111951263,-0.028171760479748117,-0.013032450206747901,-0.03407390250650832,35.096849679471376,9.163999999999556,0.94,41848.76,-0.06,-270.84,181.28,0.8595411682128906,1000000
|
| 6 |
+
0.0,0.0,-0.015289849056180319,-0.04174269420130647,-0.017076711818576295,-0.04455605328312581,35.7423327201537,8.564999999999593,0.98,51415.98,-0.02,-237.88,169.3,0.8489974021911622,1050000
|
| 7 |
+
0.0,0.0,-0.026454022284669202,-0.02047045320208188,-0.02783721216161655,-0.05984535760214319,35.52410436480693,8.001999999999628,1.0,59638.12,0.0,-231.38,158.04,0.7408837509155274,1100000
|
| 8 |
+
0.0,0.0,-0.02755107453147506,-0.04945286489869499,-0.02928695104086867,-0.0523090483566154,35.502013140483584,7.641999999999681,1.0,67804.98,0.0,-220.5,150.84,0.7186903429031372,1150000
|
| 9 |
+
0.0,0.0,-0.014854582031732986,-0.048864258186160095,-0.0168468803212466,-0.05380164840271906,35.441806167147114,7.804999999999537,1.0,75692.7,0.0,-228.5,154.1,0.7721294927597045,1200000
|
| 10 |
+
0.0,0.0,-0.013983927917195348,-0.045660203374221914,-0.015971225177941608,-0.05250781570232599,35.493595971043845,6.887999999999597,1.0,83097.74,0.0,-195.44,135.76,0.7025510549545289,1250000
|
| 11 |
+
0.0,0.0,-0.023434763581043072,-0.0373385093505252,-0.025249917933365163,-0.05404927162845681,35.718600596164556,7.035999999999632,1.0,90195.58,0.0,-200.04,138.72,0.6563148593902588,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.19163115,5.4860816,-65.41156,-179.21597,-203.38411,0.15292308,-0.3364205,23.40784,805000
|
| 3 |
+
0.1990489,12.147468,-65.06758,-175.69025,-202.83069,1.9529915,-2.1699572,48.966057,810000
|
| 4 |
+
0.19627969,10.275043,-58.25093,-173.09874,-202.89688,0.48070687,-0.28851038,27.959702,815000
|
| 5 |
+
0.16838402,12.674997,-43.609287,-170.68323,-203.2387,0.8095621,-0.6069069,45.464073,820000
|
| 6 |
+
0.1667155,13.549662,-68.03748,-171.61992,-203.5886,1.0048846,-1.1577011,40.322163,825000
|
| 7 |
+
0.17544317,15.803561,-48.5852,-169.73445,-203.21309,0.5677552,-0.5486258,32.97197,830000
|
| 8 |
+
0.17893624,12.616503,-74.173,-168.4823,-203.09692,0.35286537,-0.374383,29.365097,835000
|
| 9 |
+
0.18574941,13.056,-64.56665,-170.59074,-203.3541,0.3865687,-0.3973379,28.420738,840000
|
| 10 |
+
0.17160892,14.590924,-8.245461,-167.72124,-204.08583,0.6546803,-0.7213175,41.164112,845000
|
| 11 |
+
0.17477486,19.98483,-19.216795,-167.16924,-203.92732,1.1248447,-1.1558326,46.42296,850000
|
| 12 |
+
0.18163717,22.718012,-19.855923,-165.05783,-204.32697,1.4335797,-1.5846692,81.43682,855000
|
| 13 |
+
0.19211537,20.999817,-49.020336,-165.26794,-205.10857,0.47924903,-0.6523689,43.93007,860000
|
| 14 |
+
0.17977603,14.79975,-46.364594,-164.03606,-204.7577,1.1745778,-1.1244776,50.5031,865000
|
| 15 |
+
0.15849096,15.400049,-22.203169,-160.19623,-203.94156,0.3099309,-0.40358943,31.2959,870000
|
| 16 |
+
0.16000983,14.744242,-13.230563,-163.09073,-204.54314,0.6567961,-0.6723865,44.86216,875000
|
| 17 |
+
0.16651414,18.748552,-46.170868,-164.26736,-204.23035,0.76245713,-0.58303076,45.892456,880000
|
| 18 |
+
0.14049016,27.938185,-38.740578,-160.87144,-205.24687,0.6517787,-0.8649406,63.329933,885000
|
| 19 |
+
0.1786808,14.163048,-29.86051,-158.76868,-205.80464,0.4860505,-0.6653072,39.582092,890000
|
| 20 |
+
0.15179606,11.448034,-49.66014,-161.61758,-203.9703,0.5922028,-0.5196074,33.41645,895000
|
| 21 |
+
0.20717937,25.618326,-33.93301,-155.83012,-205.35954,0.6297391,-0.6817681,65.123405,900000
|
| 22 |
+
0.17922929,24.72885,-38.420723,-158.96153,-205.25406,0.78222215,-0.82017756,54.116066,905000
|
| 23 |
+
0.16577333,15.721422,-17.726217,-153.43037,-204.86523,0.50530374,-0.63591325,55.230797,910000
|
| 24 |
+
0.20382972,15.670525,2.2476401,-152.311,-203.48805,2.1319332,-1.8801454,78.28584,915000
|
| 25 |
+
0.17388734,13.362697,-35.713432,-153.17789,-204.0599,0.6603566,-0.65831465,45.959293,920000
|
| 26 |
+
0.18057923,17.327057,-8.712413,-154.1237,-204.23317,0.429153,-0.4965472,39.560997,925000
|
| 27 |
+
0.17297077,23.141449,-19.394371,-153.48352,-204.34747,0.85873044,-0.9374865,54.96856,930000
|
| 28 |
+
0.18933159,21.199425,1.8921646,-154.74217,-203.27805,0.9025653,-1.0687853,62.997604,935000
|
| 29 |
+
0.21640593,21.786642,-19.800322,-147.42317,-203.63905,0.8115125,-0.79783255,58.721764,940000
|
| 30 |
+
0.174616,21.751755,-20.36728,-152.57722,-204.28996,4.354339,-6.211622,128.87491,945000
|
| 31 |
+
0.18863282,17.136255,-1.5790136,-152.37602,-205.6054,0.65898466,-0.64215994,48.11245,950000
|
| 32 |
+
0.17783253,14.1343565,-8.742115,-148.35466,-207.21323,0.47238922,-0.7907025,41.193626,955000
|
| 33 |
+
0.16733003,18.488981,-7.2000227,-149.33748,-205.63675,0.5108047,-0.38816804,47.10669,960000
|
| 34 |
+
0.1789094,14.782559,-3.363383,-149.0581,-205.28802,0.7774256,-0.68689835,38.37953,965000
|
| 35 |
+
0.17809284,15.275153,-12.297973,-147.19275,-204.06505,0.47355586,-0.52409434,43.20215,970000
|
| 36 |
+
0.1696537,14.041457,-7.2465405,-150.04253,-205.54099,0.39492053,-0.66098464,49.471737,975000
|
| 37 |
+
0.16975015,20.481232,0.8035289,-149.10794,-204.90855,0.8549061,-1.6622858,63.99198,980000
|
| 38 |
+
0.17105651,18.117441,-11.342842,-149.3637,-204.74326,1.0308651,-0.90075433,65.80948,985000
|
| 39 |
+
0.15810251,18.076914,-5.3629537,-146.81834,-206.4077,0.6090453,-0.42226472,51.323185,990000
|
| 40 |
+
0.20511845,16.73802,-0.28137732,-147.23853,-204.61414,0.7392179,-0.72151244,68.94312,995000
|
| 41 |
+
0.14965379,10.6398535,-26.425014,-149.29933,-205.49408,0.6171757,-0.59480125,39.60276,1000000
|
| 42 |
+
0.15731752,27.519077,-14.180409,-146.47607,-204.43114,0.85756904,-0.77976817,64.69421,1005000
|
| 43 |
+
0.15921767,18.86062,-7.3245015,-147.12823,-206.50945,0.58542114,-0.5542049,47.451122,1010000
|
| 44 |
+
0.16905905,12.624014,-6.7701325,-144.17342,-203.97144,0.49889705,-0.62741214,49.778736,1015000
|
| 45 |
+
0.18545161,22.525137,-5.408343,-147.16731,-204.39279,0.6993448,-0.66177064,53.236893,1020000
|
| 46 |
+
0.19785307,24.351088,-7.1167936,-143.97704,-204.80576,0.92024636,-0.8272266,74.56436,1025000
|
| 47 |
+
0.18370232,13.545804,-0.09209582,-144.69685,-205.84154,1.2040262,-1.3043759,56.09876,1030000
|
| 48 |
+
0.20267029,20.254576,2.4070392,-139.96468,-204.1063,1.1987478,-1.1418129,77.31898,1035000
|
| 49 |
+
0.13334583,18.215527,-5.143928,-144.20148,-203.78194,1.3822793,-1.3817767,67.72133,1040000
|
| 50 |
+
0.17690292,16.206114,-4.775739,-142.88835,-206.145,1.5328859,-2.1311948,69.94844,1045000
|
| 51 |
+
0.15658183,16.787134,-6.8602767,-135.31621,-205.99231,0.81117296,-0.7226322,56.396366,1050000
|
| 52 |
+
0.15240595,17.76365,-2.6573296,-143.06519,-204.23506,1.8375157,-1.4359926,57.871246,1055000
|
| 53 |
+
0.17416984,17.027536,2.7934651,-142.17455,-206.0853,0.87300044,-0.8392278,46.88498,1060000
|
| 54 |
+
0.17464201,24.37073,-4.6002436,-144.61766,-204.46474,2.525474,-2.542672,78.960236,1065000
|
| 55 |
+
0.19395038,16.973204,-0.09160593,-140.59392,-204.30322,0.59762764,-0.7666816,51.10031,1070000
|
| 56 |
+
0.1828544,25.052662,-12.607353,-140.1961,-204.19386,1.0196748,-0.9931431,56.725998,1075000
|
| 57 |
+
0.18718445,12.038123,1.7966727,-141.13638,-205.0957,1.0896536,-0.970424,44.60383,1080000
|
| 58 |
+
0.16780493,13.462778,1.5886917,-138.2436,-204.27675,0.7288219,-1.2104937,58.954613,1085000
|
| 59 |
+
0.14756969,21.840885,2.5855722,-133.467,-204.68384,1.8535074,-2.077314,83.867805,1090000
|
| 60 |
+
0.15361436,27.42775,2.9968953,-135.41321,-205.11176,4.0266666,-3.1980472,107.109375,1095000
|
| 61 |
+
0.16415507,14.692209,-10.302925,-138.98328,-203.32494,0.47497964,-0.51940393,38.48414,1100000
|
| 62 |
+
0.18947148,19.937195,-6.334673,-141.41931,-203.91121,0.409286,-0.42615205,41.68306,1105000
|
| 63 |
+
0.15527219,16.677444,-9.798074,-137.03178,-204.43163,0.72023904,-0.71319807,46.6004,1110000
|
| 64 |
+
0.13739914,15.514816,1.0275265,-136.16887,-203.1357,1.2480527,-1.4006593,64.89555,1115000
|
| 65 |
+
0.16729328,19.118479,-10.601808,-137.3438,-203.48616,0.6869195,-1.3107257,66.68603,1120000
|
| 66 |
+
0.18025342,28.60259,-9.811867,-139.8452,-204.98076,3.264272,-3.2921903,85.20741,1125000
|
| 67 |
+
0.1634078,16.807302,-2.0892384,-134.95836,-204.15869,0.7092155,-0.7494135,46.946358,1130000
|
| 68 |
+
0.17495596,15.24809,4.374434,-140.06909,-205.72256,1.5286187,-1.4275043,61.154564,1135000
|
| 69 |
+
0.1856824,30.826918,-0.4679095,-137.41727,-204.18214,1.1271417,-1.1284374,72.60702,1140000
|
| 70 |
+
0.17355108,19.56673,-7.4275055,-142.68384,-204.7733,1.8295041,-1.6733404,57.928665,1145000
|
| 71 |
+
0.15618396,14.530588,1.8895048,-133.54033,-205.42479,1.0591004,-1.639343,71.62099,1150000
|
| 72 |
+
0.17349805,20.024717,-10.915146,-141.46028,-204.48926,0.48151633,-0.63168,49.549957,1155000
|
| 73 |
+
0.18547598,16.964796,1.1494305,-133.03516,-207.58632,0.61920416,-0.8049648,55.79588,1160000
|
| 74 |
+
0.1920405,19.273289,-4.101992,-139.78899,-204.45648,1.5227253,-0.7360604,58.417435,1165000
|
| 75 |
+
0.13097595,21.72232,1.3701007,-138.84387,-204.08298,1.7438239,-1.7526248,54.53219,1170000
|
| 76 |
+
0.13861366,26.9698,0.8902358,-132.68018,-204.23927,0.6161068,-0.5610276,50.22919,1175000
|
| 77 |
+
0.18220311,9.373388,5.4802756,-131.91277,-205.31177,0.6429295,-0.6181268,45.651566,1180000
|
| 78 |
+
0.16291884,22.30477,-3.2483304,-137.5695,-204.52182,1.2470182,-1.2232312,54.15845,1185000
|
| 79 |
+
0.1602237,14.604668,-6.749087,-136.75476,-204.59897,0.9593741,-0.74818087,62.527737,1190000
|
| 80 |
+
0.16792516,16.274387,-3.47189,-138.56126,-203.82433,0.46189052,-0.58345544,51.104015,1195000
|
| 81 |
+
0.15029117,14.625856,3.241666,-131.05888,-204.68013,1.592909,-1.5711684,71.36868,1200000
|
| 82 |
+
0.14161444,19.353195,-3.1919322,-136.53241,-204.67456,0.838689,-0.840996,52.354935,1205000
|
| 83 |
+
0.1683988,15.534362,-2.2670913,-138.21236,-204.384,0.7729328,-0.60827535,41.7293,1210000
|
| 84 |
+
0.17360994,26.07736,0.40532762,-130.36473,-205.93802,3.7432404,-3.6807697,132.47565,1215000
|
| 85 |
+
0.20748639,17.427362,-10.107617,-138.5313,-203.73378,1.2832019,-1.4784558,65.46312,1220000
|
| 86 |
+
0.1717824,8.87088,-2.033472,-132.57059,-206.32999,6.964064,-8.732254,112.70442,1225000
|
| 87 |
+
0.16744193,15.553255,-5.87613,-130.42978,-204.14008,0.669633,-0.6729018,52.057602,1230000
|
| 88 |
+
0.18163669,16.635944,9.162799,-135.83733,-205.61433,0.7255026,-0.87982345,46.43923,1235000
|
| 89 |
+
0.16588852,19.966341,5.515588,-131.311,-205.14398,2.2906704,-2.2482827,65.92576,1240000
|
| 90 |
+
0.15831614,13.542414,-4.187847,-134.98466,-204.20116,0.84853506,-0.6773904,48.25647,1245000
|
| 91 |
+
0.15597862,24.916,-5.213908,-127.26377,-203.88597,0.8429725,-0.74871504,63.97934,1250000
|
| 92 |
+
0.17827255,10.46835,2.314133,-134.38672,-203.58289,1.4655261,-1.219285,44.949654,1255000
|
| 93 |
+
0.15824288,19.889265,-0.27049896,-133.052,-204.94693,0.65346706,-0.537415,39.6315,1260000
|
| 94 |
+
0.16860507,22.946096,1.2511687,-130.88567,-204.38545,2.2891157,-3.613165,110.63397,1265000
|
| 95 |
+
0.14066926,29.362226,-0.14089715,-130.47221,-205.4651,3.1765583,-2.2446198,83.8238,1270000
|
| 96 |
+
0.19983312,45.94797,-2.429355,-129.4088,-204.50946,3.9307196,-2.8941274,122.34256,1275000
|
| 97 |
+
0.17177022,16.605116,3.6775484,-129.7658,-203.83942,3.4372573,-6.5797057,112.45616,1280000
|
| 98 |
+
0.1615827,16.768194,-2.0011957,-130.28773,-202.30699,3.860466,-3.3275135,77.22124,1285000
|
| 99 |
+
0.15667114,14.644324,7.0928226,-126.05338,-203.63075,0.42761925,-0.3913635,38.409485,1290000
|
| 100 |
+
0.17991875,11.763688,1.2886019,-121.57708,-205.36113,1.2308215,-1.2024912,60.266277,1295000
|
| 101 |
+
0.165813,24.008991,-3.0335212,-125.20862,-205.32379,1.8774577,-0.80214775,72.57019,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.19163115,5.4860816,-65.41156,-179.21597,-203.38411,0.15292308,-0.3364205,23.40784,805000
|
| 3 |
+
0.1990489,12.147468,-65.06758,-175.69025,-202.83069,1.9529915,-2.1699572,48.966057,810000
|
| 4 |
+
0.19627969,10.275043,-58.25093,-173.09874,-202.89688,0.48070687,-0.28851038,27.959702,815000
|
| 5 |
+
0.16838402,12.674997,-43.609287,-170.68323,-203.2387,0.8095621,-0.6069069,45.464073,820000
|
| 6 |
+
0.1667155,13.549662,-68.03748,-171.61992,-203.5886,1.0048846,-1.1577011,40.322163,825000
|
| 7 |
+
0.17544317,15.803561,-48.5852,-169.73445,-203.21309,0.5677552,-0.5486258,32.97197,830000
|
| 8 |
+
0.17893624,12.616503,-74.173,-168.4823,-203.09692,0.35286537,-0.374383,29.365097,835000
|
| 9 |
+
0.18574941,13.056,-64.56665,-170.59074,-203.3541,0.3865687,-0.3973379,28.420738,840000
|
| 10 |
+
0.17160892,14.590924,-8.245461,-167.72124,-204.08583,0.6546803,-0.7213175,41.164112,845000
|
| 11 |
+
0.17477486,19.98483,-19.216795,-167.16924,-203.92732,1.1248447,-1.1558326,46.42296,850000
|
| 12 |
+
0.18163717,22.718012,-19.855923,-165.05783,-204.32697,1.4335797,-1.5846692,81.43682,855000
|
| 13 |
+
0.19211537,20.999817,-49.020336,-165.26794,-205.10857,0.47924903,-0.6523689,43.93007,860000
|
| 14 |
+
0.17977603,14.79975,-46.364594,-164.03606,-204.7577,1.1745778,-1.1244776,50.5031,865000
|
| 15 |
+
0.15849096,15.400049,-22.203169,-160.19623,-203.94156,0.3099309,-0.40358943,31.2959,870000
|
| 16 |
+
0.16000983,14.744242,-13.230563,-163.09073,-204.54314,0.6567961,-0.6723865,44.86216,875000
|
| 17 |
+
0.16651414,18.748552,-46.170868,-164.26736,-204.23035,0.76245713,-0.58303076,45.892456,880000
|
| 18 |
+
0.14049016,27.938185,-38.740578,-160.87144,-205.24687,0.6517787,-0.8649406,63.329933,885000
|
| 19 |
+
0.1786808,14.163048,-29.86051,-158.76868,-205.80464,0.4860505,-0.6653072,39.582092,890000
|
| 20 |
+
0.15179606,11.448034,-49.66014,-161.61758,-203.9703,0.5922028,-0.5196074,33.41645,895000
|
| 21 |
+
0.20717937,25.618326,-33.93301,-155.83012,-205.35954,0.6297391,-0.6817681,65.123405,900000
|
| 22 |
+
0.17922929,24.72885,-38.420723,-158.96153,-205.25406,0.78222215,-0.82017756,54.116066,905000
|
| 23 |
+
0.16577333,15.721422,-17.726217,-153.43037,-204.86523,0.50530374,-0.63591325,55.230797,910000
|
| 24 |
+
0.20382972,15.670525,2.2476401,-152.311,-203.48805,2.1319332,-1.8801454,78.28584,915000
|
| 25 |
+
0.17388734,13.362697,-35.713432,-153.17789,-204.0599,0.6603566,-0.65831465,45.959293,920000
|
| 26 |
+
0.18057923,17.327057,-8.712413,-154.1237,-204.23317,0.429153,-0.4965472,39.560997,925000
|
| 27 |
+
0.17297077,23.141449,-19.394371,-153.48352,-204.34747,0.85873044,-0.9374865,54.96856,930000
|
| 28 |
+
0.18933159,21.199425,1.8921646,-154.74217,-203.27805,0.9025653,-1.0687853,62.997604,935000
|
| 29 |
+
0.21640593,21.786642,-19.800322,-147.42317,-203.63905,0.8115125,-0.79783255,58.721764,940000
|
| 30 |
+
0.174616,21.751755,-20.36728,-152.57722,-204.28996,4.354339,-6.211622,128.87491,945000
|
| 31 |
+
0.18863282,17.136255,-1.5790136,-152.37602,-205.6054,0.65898466,-0.64215994,48.11245,950000
|
| 32 |
+
0.17783253,14.1343565,-8.742115,-148.35466,-207.21323,0.47238922,-0.7907025,41.193626,955000
|
| 33 |
+
0.16733003,18.488981,-7.2000227,-149.33748,-205.63675,0.5108047,-0.38816804,47.10669,960000
|
| 34 |
+
0.1789094,14.782559,-3.363383,-149.0581,-205.28802,0.7774256,-0.68689835,38.37953,965000
|
| 35 |
+
0.17809284,15.275153,-12.297973,-147.19275,-204.06505,0.47355586,-0.52409434,43.20215,970000
|
| 36 |
+
0.1696537,14.041457,-7.2465405,-150.04253,-205.54099,0.39492053,-0.66098464,49.471737,975000
|
| 37 |
+
0.16975015,20.481232,0.8035289,-149.10794,-204.90855,0.8549061,-1.6622858,63.99198,980000
|
| 38 |
+
0.17105651,18.117441,-11.342842,-149.3637,-204.74326,1.0308651,-0.90075433,65.80948,985000
|
| 39 |
+
0.15810251,18.076914,-5.3629537,-146.81834,-206.4077,0.6090453,-0.42226472,51.323185,990000
|
| 40 |
+
0.20511845,16.73802,-0.28137732,-147.23853,-204.61414,0.7392179,-0.72151244,68.94312,995000
|
| 41 |
+
0.14965379,10.6398535,-26.425014,-149.29933,-205.49408,0.6171757,-0.59480125,39.60276,1000000
|
| 42 |
+
0.15731752,27.519077,-14.180409,-146.47607,-204.43114,0.85756904,-0.77976817,64.69421,1005000
|
| 43 |
+
0.15921767,18.86062,-7.3245015,-147.12823,-206.50945,0.58542114,-0.5542049,47.451122,1010000
|
| 44 |
+
0.16905905,12.624014,-6.7701325,-144.17342,-203.97144,0.49889705,-0.62741214,49.778736,1015000
|
| 45 |
+
0.18545161,22.525137,-5.408343,-147.16731,-204.39279,0.6993448,-0.66177064,53.236893,1020000
|
| 46 |
+
0.19785307,24.351088,-7.1167936,-143.97704,-204.80576,0.92024636,-0.8272266,74.56436,1025000
|
| 47 |
+
0.18370232,13.545804,-0.09209582,-144.69685,-205.84154,1.2040262,-1.3043759,56.09876,1030000
|
| 48 |
+
0.20267029,20.254576,2.4070392,-139.96468,-204.1063,1.1987478,-1.1418129,77.31898,1035000
|
| 49 |
+
0.13334583,18.215527,-5.143928,-144.20148,-203.78194,1.3822793,-1.3817767,67.72133,1040000
|
| 50 |
+
0.17690292,16.206114,-4.775739,-142.88835,-206.145,1.5328859,-2.1311948,69.94844,1045000
|
| 51 |
+
0.15658183,16.787134,-6.8602767,-135.31621,-205.99231,0.81117296,-0.7226322,56.396366,1050000
|
| 52 |
+
0.15240595,17.76365,-2.6573296,-143.06519,-204.23506,1.8375157,-1.4359926,57.871246,1055000
|
| 53 |
+
0.17416984,17.027536,2.7934651,-142.17455,-206.0853,0.87300044,-0.8392278,46.88498,1060000
|
| 54 |
+
0.17464201,24.37073,-4.6002436,-144.61766,-204.46474,2.525474,-2.542672,78.960236,1065000
|
| 55 |
+
0.19395038,16.973204,-0.09160593,-140.59392,-204.30322,0.59762764,-0.7666816,51.10031,1070000
|
| 56 |
+
0.1828544,25.052662,-12.607353,-140.1961,-204.19386,1.0196748,-0.9931431,56.725998,1075000
|
| 57 |
+
0.18718445,12.038123,1.7966727,-141.13638,-205.0957,1.0896536,-0.970424,44.60383,1080000
|
| 58 |
+
0.16780493,13.462778,1.5886917,-138.2436,-204.27675,0.7288219,-1.2104937,58.954613,1085000
|
| 59 |
+
0.14756969,21.840885,2.5855722,-133.467,-204.68384,1.8535074,-2.077314,83.867805,1090000
|
| 60 |
+
0.15361436,27.42775,2.9968953,-135.41321,-205.11176,4.0266666,-3.1980472,107.109375,1095000
|
| 61 |
+
0.16415507,14.692209,-10.302925,-138.98328,-203.32494,0.47497964,-0.51940393,38.48414,1100000
|
| 62 |
+
0.18947148,19.937195,-6.334673,-141.41931,-203.91121,0.409286,-0.42615205,41.68306,1105000
|
| 63 |
+
0.15527219,16.677444,-9.798074,-137.03178,-204.43163,0.72023904,-0.71319807,46.6004,1110000
|
| 64 |
+
0.13739914,15.514816,1.0275265,-136.16887,-203.1357,1.2480527,-1.4006593,64.89555,1115000
|
| 65 |
+
0.16729328,19.118479,-10.601808,-137.3438,-203.48616,0.6869195,-1.3107257,66.68603,1120000
|
| 66 |
+
0.18025342,28.60259,-9.811867,-139.8452,-204.98076,3.264272,-3.2921903,85.20741,1125000
|
| 67 |
+
0.1634078,16.807302,-2.0892384,-134.95836,-204.15869,0.7092155,-0.7494135,46.946358,1130000
|
| 68 |
+
0.17495596,15.24809,4.374434,-140.06909,-205.72256,1.5286187,-1.4275043,61.154564,1135000
|
| 69 |
+
0.1856824,30.826918,-0.4679095,-137.41727,-204.18214,1.1271417,-1.1284374,72.60702,1140000
|
| 70 |
+
0.17355108,19.56673,-7.4275055,-142.68384,-204.7733,1.8295041,-1.6733404,57.928665,1145000
|
| 71 |
+
0.15618396,14.530588,1.8895048,-133.54033,-205.42479,1.0591004,-1.639343,71.62099,1150000
|
| 72 |
+
0.17349805,20.024717,-10.915146,-141.46028,-204.48926,0.48151633,-0.63168,49.549957,1155000
|
| 73 |
+
0.18547598,16.964796,1.1494305,-133.03516,-207.58632,0.61920416,-0.8049648,55.79588,1160000
|
| 74 |
+
0.1920405,19.273289,-4.101992,-139.78899,-204.45648,1.5227253,-0.7360604,58.417435,1165000
|
| 75 |
+
0.13097595,21.72232,1.3701007,-138.84387,-204.08298,1.7438239,-1.7526248,54.53219,1170000
|
| 76 |
+
0.13861366,26.9698,0.8902358,-132.68018,-204.23927,0.6161068,-0.5610276,50.22919,1175000
|
| 77 |
+
0.18220311,9.373388,5.4802756,-131.91277,-205.31177,0.6429295,-0.6181268,45.651566,1180000
|
| 78 |
+
0.16291884,22.30477,-3.2483304,-137.5695,-204.52182,1.2470182,-1.2232312,54.15845,1185000
|
| 79 |
+
0.1602237,14.604668,-6.749087,-136.75476,-204.59897,0.9593741,-0.74818087,62.527737,1190000
|
| 80 |
+
0.16792516,16.274387,-3.47189,-138.56126,-203.82433,0.46189052,-0.58345544,51.104015,1195000
|
| 81 |
+
0.15029117,14.625856,3.241666,-131.05888,-204.68013,1.592909,-1.5711684,71.36868,1200000
|
| 82 |
+
0.14161444,19.353195,-3.1919322,-136.53241,-204.67456,0.838689,-0.840996,52.354935,1205000
|
| 83 |
+
0.1683988,15.534362,-2.2670913,-138.21236,-204.384,0.7729328,-0.60827535,41.7293,1210000
|
| 84 |
+
0.17360994,26.07736,0.40532762,-130.36473,-205.93802,3.7432404,-3.6807697,132.47565,1215000
|
| 85 |
+
0.20748639,17.427362,-10.107617,-138.5313,-203.73378,1.2832019,-1.4784558,65.46312,1220000
|
| 86 |
+
0.1717824,8.87088,-2.033472,-132.57059,-206.32999,6.964064,-8.732254,112.70442,1225000
|
| 87 |
+
0.16744193,15.553255,-5.87613,-130.42978,-204.14008,0.669633,-0.6729018,52.057602,1230000
|
| 88 |
+
0.18163669,16.635944,9.162799,-135.83733,-205.61433,0.7255026,-0.87982345,46.43923,1235000
|
| 89 |
+
0.16588852,19.966341,5.515588,-131.311,-205.14398,2.2906704,-2.2482827,65.92576,1240000
|
| 90 |
+
0.15831614,13.542414,-4.187847,-134.98466,-204.20116,0.84853506,-0.6773904,48.25647,1245000
|
| 91 |
+
0.15597862,24.916,-5.213908,-127.26377,-203.88597,0.8429725,-0.74871504,63.97934,1250000
|
| 92 |
+
0.17827255,10.46835,2.314133,-134.38672,-203.58289,1.4655261,-1.219285,44.949654,1255000
|
| 93 |
+
0.15824288,19.889265,-0.27049896,-133.052,-204.94693,0.65346706,-0.537415,39.6315,1260000
|
| 94 |
+
0.16860507,22.946096,1.2511687,-130.88567,-204.38545,2.2891157,-3.613165,110.63397,1265000
|
| 95 |
+
0.14066926,29.362226,-0.14089715,-130.47221,-205.4651,3.1765583,-2.2446198,83.8238,1270000
|
| 96 |
+
0.19983312,45.94797,-2.429355,-129.4088,-204.50946,3.9307196,-2.8941274,122.34256,1275000
|
| 97 |
+
0.17177022,16.605116,3.6775484,-129.7658,-203.83942,3.4372573,-6.5797057,112.45616,1280000
|
| 98 |
+
0.1615827,16.768194,-2.0011957,-130.28773,-202.30699,3.860466,-3.3275135,77.22124,1285000
|
| 99 |
+
0.15667114,14.644324,7.0928226,-126.05338,-203.63075,0.42761925,-0.3913635,38.409485,1290000
|
| 100 |
+
0.17991875,11.763688,1.2886019,-121.57708,-205.36113,1.2308215,-1.2024912,60.266277,1295000
|
| 101 |
+
0.165813,24.008991,-3.0335212,-125.20862,-205.32379,1.8774577,-0.80214775,72.57019,1300000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08874faa79bfe1eff33279af8ad136f1e24b421ae94f17a288a509bed5be69c1
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0196bb5490853c204487a5f7a1fc15d5db8ce4aca27ebb2785978ce1d3f22649
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac3fc559aeccca3860963aca5dc7cd5f2c8c9ccced75f6cc69df33ce3b6db23a
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c240bdbfff5c511407b5d21d04ede2cbaddef0a6b7a6864853ee9f126fa8ae16
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56cd7396c588939e983e54513c8c7f7d9d534a0ff9ae5d878ddb0d1e6f122a74
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3cd5c9173e8b6370c7aec28503d0b590c3c07cc775b6ad04d769a61d82f6a70
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_1300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7cd79775f52b7c5dfa34cd9d2b6c1e64336baba8468744d1679e3587447a54b5
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f3eff4618f52bfaa5cc60a6ce6455e229d7b223fdf273583106e8efe4fbd5ab
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e7258ed685682ca2a9139ca779bdf8c70dcff31644ba5fae1eb3c82df1d2a02
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c96bb03d8df48a30230d99d2e3fbb9f36cf33e529864250e222cb20a61c993c9
|
| 3 |
+
size 218098303
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/cgql/20260319_075529/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/de8t9kjm
|