Upload folder using huggingface_hub
Browse files- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/env.csv +0 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/env_sv.csv +0 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/eval.csv +31 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/eval_sv.csv +31 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/flags.json +1 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/offline_agent.csv +201 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/offline_agent_sv.csv +201 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/online_agent.csv +101 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/online_agent_sv.csv +101 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_100000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1000000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1050000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1100000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1150000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1200000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1250000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1300000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1350000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1400000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1450000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_150000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1500000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_200000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_250000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_300000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_350000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_400000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_450000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_50000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_500000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_550000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_600000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_650000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_700000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_750000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_800000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_850000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_900000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_950000.pkl +3 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/progress.tk +1 -0
- pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/token.tk +1 -0
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/eval.csv
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.007092571333430182,0.006535812169901588,-0.006628165615930318,0.011192009575508807,26.971514117663528,25.099999999996967,0.0,12750.0,-1.9,-976.66,500.0,1.6885305261611938,50000
|
| 3 |
+
0.0,0.0,-0.04126623978012787,-0.00908897314551282,-0.04155017897920883,-0.0036517791311925915,21.361326379713443,24.806999999997032,0.02,38539.04,-1.68,-901.0,494.14,1.5461155223846434,100000
|
| 4 |
+
0.0,0.0,-0.03310060261779639,-0.0022762730731864422,-0.033446359855859475,-0.004084015236061084,19.8296621291261,23.747999999997386,0.14,63831.0,-1.38,-841.6,472.96,1.524410653114319,150000
|
| 5 |
+
0.0,0.0,-0.04086084850577247,0.0021804842144520146,-0.04083318357150081,0.00042442465485515064,20.455850299987457,22.679999999997616,0.2,87669.54,-1.14,-726.76,451.6,1.4597340440750122,200000
|
| 6 |
+
0.0,0.0,-0.03802323205092513,0.002777256817215113,-0.03827220616376559,-0.0055142283171202575,20.776273429111505,21.881999999998165,0.34,111204.8,-1.04,-719.98,435.64,1.4487226963043214,250000
|
| 7 |
+
0.0,0.0,-0.04801493852027212,-0.005902096475538104,-0.048554655799281324,-0.013380565432910734,19.442659651600756,21.67399999999793,0.34,133876.0,-0.84,-669.04,431.48,1.434865379333496,300000
|
| 8 |
+
0.0,0.0,-0.038124407461665115,-0.006998066515511824,-0.038008074119664205,-0.004536820446996554,22.077022226698467,20.042999999998116,0.4,155749.72,-0.8,-619.8,398.86,1.3541836643218994,350000
|
| 9 |
+
0.0,0.0,-0.03345637192652937,-0.0022286345076493646,-0.033494263951137214,0.021616097902505533,20.91185260940168,19.966999999998595,0.46,176156.84,-0.64,-557.52,397.34,1.365433735847473,400000
|
| 10 |
+
0.0,0.0,-0.03084894221014221,0.003939330986733625,-0.03090160943240284,-0.006714410663128717,26.31898937067327,18.701999999998797,0.54,195434.54,-0.56,-529.84,372.04,1.258940634727478,450000
|
| 11 |
+
0.0,0.0,-0.031548819859780426,0.006595820104173663,-0.03159527057488044,0.005308280536329282,24.605611112928905,20.31799999999832,0.5,216236.18,-0.7,-636.46,404.36,1.3672734594345093,500000
|
| 12 |
+
0.0,0.0,-0.03015917762159371,-0.00038405222664962356,-0.029847663193762343,0.002665286567114333,28.363565372613,17.350999999998987,0.66,235529.86,-0.5,-523.26,345.02,1.1592978143692017,550000
|
| 13 |
+
0.0,0.0,-0.027638468610540902,-0.00934211704212021,-0.028142246932158586,-0.00841665121442485,23.524672007372896,20.159999999998423,0.44,254513.62,-0.74,-571.76,401.2,1.3588572883605956,600000
|
| 14 |
+
0.0,0.0,-0.05235866038298862,0.008720530697466377,-0.05301325959710397,-0.009585054197107739,19.08666738744678,19.43099999999837,0.44,274369.44,-0.74,-573.2,386.62,1.2976602268218995,650000
|
| 15 |
+
0.0,0.0,-0.05599909640151238,0.001291984666573486,-0.0560314791292305,0.013842303988476674,22.593847101535445,19.5779999999985,0.52,295804.82,-0.52,-554.68,389.56,1.30934250831604,700000
|
| 16 |
+
0.0,0.0,-0.06855224402560235,0.002766607128325533,-0.06834916099664208,0.005674673144820889,18.196885001879576,20.99799999999805,0.36,316075.88,-0.86,-625.36,417.96,1.4336480808258056,750000
|
| 17 |
+
0.0,0.0,-0.04024337968345896,-0.0022791178333897216,-0.04077377470649759,-0.019307207715772524,24.898595868360104,18.65199999999878,0.58,336534.96,-0.5,-540.66,371.04,1.2804498815536498,800000
|
| 18 |
+
0.0,0.0,-0.06548739816600033,-0.007551686038511211,-0.06566181093607495,-0.005366620098398802,26.77337179684326,19.550999999998695,0.5,355529.3,-0.64,-551.06,389.02,1.3232181119918822,850000
|
| 19 |
+
0.0,0.0,-0.025592282896719887,-0.00573298610801595,-0.025634663350138157,-0.004492060032157158,21.79267682997177,20.391999999998443,0.46,375886.26,-0.72,-622.02,405.84,1.3856129598617555,900000
|
| 20 |
+
0.0,0.0,-0.020261845748336497,-0.015870967877013163,-0.019737308678507873,0.01678506520418315,25.89828180572503,19.17499999999865,0.58,397377.32,-0.6,-574.86,381.5,1.3036764240264893,950000
|
| 21 |
+
0.0,0.0,-0.023326746520758154,-0.005248394661360728,-0.023588934709998243,0.0033736258976645424,20.20171825592734,20.429999999998305,0.38,418183.86,-0.84,-606.52,406.6,1.3701397323608397,1000000
|
| 22 |
+
0.0,0.0,-0.014381120067268868,0.00626377078365232,-0.014019014980963813,0.007657983128004196,26.734618188135272,16.571999999999083,0.7,437276.02,-0.48,-523.0,329.44,1.151287136077881,1050000
|
| 23 |
+
0.0,0.0,0.00713979649574249,-0.011708484674966177,0.006728154957348494,-0.012760279955315153,31.81359006477484,12.206999999999775,0.9,451956.96,-0.1,-356.52,242.14,0.8663182401657105,1100000
|
| 24 |
+
0.0,0.0,0.020364889092126727,-0.026486076095780985,0.01942759395548365,-0.020847718115773187,32.8704883097447,10.833999999999563,0.92,464528.78,-0.1,-321.44,214.68,0.7552194213867187,1150000
|
| 25 |
+
0.0,0.0,0.025238347773322387,-0.02869863904144255,0.02429584185127888,-0.004882375896527791,33.87775321337977,10.618999999999403,0.92,475228.14,-0.12,-333.24,210.38,0.745708236694336,1200000
|
| 26 |
+
0.0,0.0,0.04158206370489101,-0.04287489129273211,0.040132590740749936,-0.04383140714614061,35.711028265484366,9.340999999999807,0.98,486070.88,-0.02,-276.04,184.82,0.6631600332260131,1250000
|
| 27 |
+
0.0,0.0,0.03279914666937594,-0.03819842359005565,0.03152105308979359,-0.043658871973237846,33.639823858183355,9.938999999999636,0.92,495740.74,-0.08,-286.88,196.78,0.6976651525497437,1300000
|
| 28 |
+
0.0,0.0,0.05209774922701304,-0.04852581082197604,0.050071701977629134,-0.05036436032110841,35.82515357382583,7.4969999999996695,1.0,504835.82,0.0,-213.28,147.94,0.5361687183380127,1350000
|
| 29 |
+
0.0,0.0,0.03837796482565551,-0.05385657406740703,0.0365277208903335,-0.0497424345536498,36.013196246434006,7.00799999999957,1.0,512273.32,0.0,-198.48,138.16,0.5058957004547119,1400000
|
| 30 |
+
0.0,0.0,0.046385770601066696,-0.053134102752241924,0.04473121968066555,-0.054107361802741116,35.73502312892364,6.8469999999995705,1.0,519296.06,0.0,-193.52,134.94,0.49196084022521974,1450000
|
| 31 |
+
0.0,0.0,0.06467102856644003,-0.054221044721832354,0.06263469716863476,-0.04795067968950092,36.050303475465185,6.601999999999532,1.0,526274.86,0.0,-186.7,130.04,0.4784649658203125,1500000
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/eval_sv.csv
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.007092571333430182,0.006535812169901588,-0.006628165615930318,0.011192009575508807,26.971514117663528,25.099999999996967,0.0,12750.0,-1.9,-976.66,500.0,1.6885305261611938,50000
|
| 3 |
+
0.0,0.0,-0.04126623978012787,-0.00908897314551282,-0.04155017897920883,-0.0036517791311925915,21.361326379713443,24.806999999997032,0.02,38539.04,-1.68,-901.0,494.14,1.5461155223846434,100000
|
| 4 |
+
0.0,0.0,-0.03310060261779639,-0.0022762730731864422,-0.033446359855859475,-0.004084015236061084,19.8296621291261,23.747999999997386,0.14,63831.0,-1.38,-841.6,472.96,1.524410653114319,150000
|
| 5 |
+
0.0,0.0,-0.04086084850577247,0.0021804842144520146,-0.04083318357150081,0.00042442465485515064,20.455850299987457,22.679999999997616,0.2,87669.54,-1.14,-726.76,451.6,1.4597340440750122,200000
|
| 6 |
+
0.0,0.0,-0.03802323205092513,0.002777256817215113,-0.03827220616376559,-0.0055142283171202575,20.776273429111505,21.881999999998165,0.34,111204.8,-1.04,-719.98,435.64,1.4487226963043214,250000
|
| 7 |
+
0.0,0.0,-0.04801493852027212,-0.005902096475538104,-0.048554655799281324,-0.013380565432910734,19.442659651600756,21.67399999999793,0.34,133876.0,-0.84,-669.04,431.48,1.434865379333496,300000
|
| 8 |
+
0.0,0.0,-0.038124407461665115,-0.006998066515511824,-0.038008074119664205,-0.004536820446996554,22.077022226698467,20.042999999998116,0.4,155749.72,-0.8,-619.8,398.86,1.3541836643218994,350000
|
| 9 |
+
0.0,0.0,-0.03345637192652937,-0.0022286345076493646,-0.033494263951137214,0.021616097902505533,20.91185260940168,19.966999999998595,0.46,176156.84,-0.64,-557.52,397.34,1.365433735847473,400000
|
| 10 |
+
0.0,0.0,-0.03084894221014221,0.003939330986733625,-0.03090160943240284,-0.006714410663128717,26.31898937067327,18.701999999998797,0.54,195434.54,-0.56,-529.84,372.04,1.258940634727478,450000
|
| 11 |
+
0.0,0.0,-0.031548819859780426,0.006595820104173663,-0.03159527057488044,0.005308280536329282,24.605611112928905,20.31799999999832,0.5,216236.18,-0.7,-636.46,404.36,1.3672734594345093,500000
|
| 12 |
+
0.0,0.0,-0.03015917762159371,-0.00038405222664962356,-0.029847663193762343,0.002665286567114333,28.363565372613,17.350999999998987,0.66,235529.86,-0.5,-523.26,345.02,1.1592978143692017,550000
|
| 13 |
+
0.0,0.0,-0.027638468610540902,-0.00934211704212021,-0.028142246932158586,-0.00841665121442485,23.524672007372896,20.159999999998423,0.44,254513.62,-0.74,-571.76,401.2,1.3588572883605956,600000
|
| 14 |
+
0.0,0.0,-0.05235866038298862,0.008720530697466377,-0.05301325959710397,-0.009585054197107739,19.08666738744678,19.43099999999837,0.44,274369.44,-0.74,-573.2,386.62,1.2976602268218995,650000
|
| 15 |
+
0.0,0.0,-0.05599909640151238,0.001291984666573486,-0.0560314791292305,0.013842303988476674,22.593847101535445,19.5779999999985,0.52,295804.82,-0.52,-554.68,389.56,1.30934250831604,700000
|
| 16 |
+
0.0,0.0,-0.06855224402560235,0.002766607128325533,-0.06834916099664208,0.005674673144820889,18.196885001879576,20.99799999999805,0.36,316075.88,-0.86,-625.36,417.96,1.4336480808258056,750000
|
| 17 |
+
0.0,0.0,-0.04024337968345896,-0.0022791178333897216,-0.04077377470649759,-0.019307207715772524,24.898595868360104,18.65199999999878,0.58,336534.96,-0.5,-540.66,371.04,1.2804498815536498,800000
|
| 18 |
+
0.0,0.0,-0.06548739816600033,-0.007551686038511211,-0.06566181093607495,-0.005366620098398802,26.77337179684326,19.550999999998695,0.5,355529.3,-0.64,-551.06,389.02,1.3232181119918822,850000
|
| 19 |
+
0.0,0.0,-0.025592282896719887,-0.00573298610801595,-0.025634663350138157,-0.004492060032157158,21.79267682997177,20.391999999998443,0.46,375886.26,-0.72,-622.02,405.84,1.3856129598617555,900000
|
| 20 |
+
0.0,0.0,-0.020261845748336497,-0.015870967877013163,-0.019737308678507873,0.01678506520418315,25.89828180572503,19.17499999999865,0.58,397377.32,-0.6,-574.86,381.5,1.3036764240264893,950000
|
| 21 |
+
0.0,0.0,-0.023326746520758154,-0.005248394661360728,-0.023588934709998243,0.0033736258976645424,20.20171825592734,20.429999999998305,0.38,418183.86,-0.84,-606.52,406.6,1.3701397323608397,1000000
|
| 22 |
+
0.0,0.0,-0.014381120067268868,0.00626377078365232,-0.014019014980963813,0.007657983128004196,26.734618188135272,16.571999999999083,0.7,437276.02,-0.48,-523.0,329.44,1.151287136077881,1050000
|
| 23 |
+
0.0,0.0,0.00713979649574249,-0.011708484674966177,0.006728154957348494,-0.012760279955315153,31.81359006477484,12.206999999999775,0.9,451956.96,-0.1,-356.52,242.14,0.8663182401657105,1100000
|
| 24 |
+
0.0,0.0,0.020364889092126727,-0.026486076095780985,0.01942759395548365,-0.020847718115773187,32.8704883097447,10.833999999999563,0.92,464528.78,-0.1,-321.44,214.68,0.7552194213867187,1150000
|
| 25 |
+
0.0,0.0,0.025238347773322387,-0.02869863904144255,0.02429584185127888,-0.004882375896527791,33.87775321337977,10.618999999999403,0.92,475228.14,-0.12,-333.24,210.38,0.745708236694336,1200000
|
| 26 |
+
0.0,0.0,0.04158206370489101,-0.04287489129273211,0.040132590740749936,-0.04383140714614061,35.711028265484366,9.340999999999807,0.98,486070.88,-0.02,-276.04,184.82,0.6631600332260131,1250000
|
| 27 |
+
0.0,0.0,0.03279914666937594,-0.03819842359005565,0.03152105308979359,-0.043658871973237846,33.639823858183355,9.938999999999636,0.92,495740.74,-0.08,-286.88,196.78,0.6976651525497437,1300000
|
| 28 |
+
0.0,0.0,0.05209774922701304,-0.04852581082197604,0.050071701977629134,-0.05036436032110841,35.82515357382583,7.4969999999996695,1.0,504835.82,0.0,-213.28,147.94,0.5361687183380127,1350000
|
| 29 |
+
0.0,0.0,0.03837796482565551,-0.05385657406740703,0.0365277208903335,-0.0497424345536498,36.013196246434006,7.00799999999957,1.0,512273.32,0.0,-198.48,138.16,0.5058957004547119,1400000
|
| 30 |
+
0.0,0.0,0.046385770601066696,-0.053134102752241924,0.04473121968066555,-0.054107361802741116,35.73502312892364,6.8469999999995705,1.0,519296.06,0.0,-193.52,134.94,0.49196084022521974,1450000
|
| 31 |
+
0.0,0.0,0.06467102856644003,-0.054221044721832354,0.06263469716863476,-0.04795067968950092,36.050303475465185,6.601999999999532,1.0,526274.86,0.0,-186.7,130.04,0.4784649658203125,1500000
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"logtostderr": false, "alsologtostderr": false, "log_dir": "", "v": 0, "verbosity": 0, "logger_levels": {}, "stderrthreshold": "fatal", "showprefixforinfo": true, "run_with_pdb": false, "pdb_post_mortem": false, "pdb": false, "run_with_profiling": false, "profile_file": null, "use_cprofile_for_profiling": true, "only_check_args": false, "pymjcf_debug": false, "pymjcf_debug_full_dump_dir": "", "pymjcf_log_xml": false, "timeout": true, "chex_n_cpu_devices": 1, "chex_assert_multiple_cpu_devices": false, "test_srcdir": "", "test_tmpdir": "/tmp/absl_testing", "test_random_seed": 301, "test_randomize_ordering_seed": "", "xml_output_file": "", "chex_skip_pmap_variant_if_single_device": true, "run_group": "main-experiments", "tags": "CGQL", "seed": 10001, "env_name": "cube-double-play-singletask-task2-v0", "save_dir": "exp/qam-reproduce/main-experiments/cube-double-play-singletask-task2-v0/20260307_005755", "offline_steps": 1000000, "online_steps": 500000, "buffer_size": 1000000, "log_interval": 5000, "eval_interval": 50000, "save_interval": 50000, "start_training": 5000, "utd_ratio": 1, "eval_episodes": 50, "video_episodes": 2, "video_frame_skip": 3, "agent": {"action_chunking": true, "action_dim": 5, "actor_hidden_dims": [512, 512, 512, 512], "actor_layer_norm": false, "agent_name": "cgql", "batch_size": 256, "best_of_n": 1, "discount": 0.99, "flow_steps": 10, "guidance_coef": 0.01, "horizon_length": 5, "inv_temp": 10.0, "isd_clip": 5.0, "lr": 0.0003, "mode": "simple", "noisy_coef": 0.001, "num_qs": 10, "ob_dims": [37], "rho": 0.5, "separate": false, "target_guidance": true, "tau": 0.005, "value_hidden_dims": [512, 512, 512, 512], "value_layer_norm": true}, "dataset_proportion": 1.0, "dataset_replace_interval": 1000, "ogbench_dataset_dir": null, "horizon_length": 5, "sparse": false, "save_all_online_states": false, "save_last_checkpoint": false, "save_replay_buffer": false, "balanced_sampling": false, "?": false, "help": false, "helpshort": false, "helpfull": false, "helpxml": false}
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/offline_agent.csv
ADDED
|
@@ -0,0 +1,201 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.25540215,10.974189,-51.310406,-134.86209,-149.63945,1.0857989,-0.9795562,101.62308,5000
|
| 3 |
+
0.238886,13.487701,-45.120064,-146.16504,-175.55173,2.978727,-3.3418326,198.96143,10000
|
| 4 |
+
0.2434863,16.339731,2.842378,-158.4334,-190.37859,2.837904,-2.7242897,165.41515,15000
|
| 5 |
+
0.22942467,17.516342,-72.94863,-162.07031,-199.11548,3.596026,-3.7701676,195.49704,20000
|
| 6 |
+
0.22063157,10.888938,-81.05209,-169.08699,-195.72134,3.5196416,-4.06929,124.45003,25000
|
| 7 |
+
0.23476799,14.907798,4.7973976,-166.32263,-204.00536,7.6574993,-8.382183,273.2664,30000
|
| 8 |
+
0.19571728,15.314038,-35.305454,-168.17877,-202.35619,3.1402278,-2.7660816,152.43547,35000
|
| 9 |
+
0.21247646,15.560771,-74.41953,-169.05826,-204.03201,0.8477313,-0.70746315,91.43347,40000
|
| 10 |
+
0.21187393,10.761474,-69.903725,-171.46257,-203.24084,1.788118,-1.9197057,83.78401,45000
|
| 11 |
+
0.20850892,16.165735,-61.800583,-171.58778,-205.28502,1.0094855,-1.1396629,85.853935,50000
|
| 12 |
+
0.2409667,10.392382,-46.024055,-172.61172,-203.50204,1.0816896,-1.1937099,68.07026,55000
|
| 13 |
+
0.19807824,11.886193,-47.30768,-171.58931,-204.88792,0.45869732,-0.4865485,62.97229,60000
|
| 14 |
+
0.2002394,13.8417635,-74.85866,-174.89543,-204.86415,0.86080545,-0.9346077,74.132225,65000
|
| 15 |
+
0.23985295,6.632146,-65.03468,-173.74532,-205.17479,0.25249428,-0.36034226,40.08827,70000
|
| 16 |
+
0.19657654,8.901059,-84.86313,-173.78833,-203.68088,0.5138353,-0.4604865,61.967728,75000
|
| 17 |
+
0.17855644,11.720831,-13.429113,-174.718,-204.66193,0.4056168,-0.37693188,51.72174,80000
|
| 18 |
+
0.23821905,10.835658,-58.2096,-176.23041,-206.17693,0.31579083,-0.40894398,51.00181,85000
|
| 19 |
+
0.20860054,10.0476885,-16.45339,-174.36806,-204.30087,0.49631196,-0.41993272,44.99784,90000
|
| 20 |
+
0.19105145,10.022347,-42.95629,-174.10376,-205.26166,0.2995714,-0.33619702,47.351738,95000
|
| 21 |
+
0.21118313,6.408134,-24.462456,-174.40758,-205.04608,0.62183946,-0.6007043,52.10521,100000
|
| 22 |
+
0.22108328,13.210605,-15.524338,-174.6458,-205.19838,2.117079,-2.1060612,73.40668,105000
|
| 23 |
+
0.22795461,11.383198,2.2797587,-175.33475,-203.61235,5.406445,-5.447198,140.15085,110000
|
| 24 |
+
0.18094668,10.537711,1.7294505,-175.97147,-204.93631,0.41404408,-0.38606802,48.81413,115000
|
| 25 |
+
0.20840031,14.568932,-10.738529,-176.24393,-204.53252,0.9881698,-1.1944283,66.68321,120000
|
| 26 |
+
0.18375123,12.059062,-9.280594,-174.40842,-204.95195,5.003008,-4.242748,107.6398,125000
|
| 27 |
+
0.20164472,9.292851,2.5677543,-174.06255,-205.80476,0.33271137,-0.2723577,46.347954,130000
|
| 28 |
+
0.19098242,9.601527,-83.889534,-177.22008,-204.55998,0.48418817,-0.44966847,45.462254,135000
|
| 29 |
+
0.19499543,6.50782,-49.43894,-173.11617,-205.25748,0.3984913,-0.39350155,39.363297,140000
|
| 30 |
+
0.20537147,30.484247,-59.69584,-172.1532,-205.30418,1.5080892,-1.5029309,93.09696,145000
|
| 31 |
+
0.16680363,9.127662,-17.210823,-173.20773,-204.51819,0.25971246,-0.25133267,36.314423,150000
|
| 32 |
+
0.20190442,12.986679,-12.524004,-172.819,-204.77634,2.1801443,-1.6011753,58.862835,155000
|
| 33 |
+
0.18755482,11.956634,-97.60718,-175.48097,-204.19115,0.2769315,-0.37583068,39.593525,160000
|
| 34 |
+
0.18515027,8.692528,2.237268,-174.92413,-203.93483,1.5857209,-1.7179826,45.079033,165000
|
| 35 |
+
0.20941195,9.499224,-65.74033,-175.0416,-205.0735,0.35822284,-0.31277177,39.765358,170000
|
| 36 |
+
0.21535347,7.09039,-34.96859,-175.17276,-205.13516,0.23423736,-0.22946641,33.54837,175000
|
| 37 |
+
0.2008887,12.346757,-63.91099,-174.4281,-204.76788,0.4465866,-0.43599522,39.355663,180000
|
| 38 |
+
0.20915869,10.656283,-87.16193,-174.3223,-204.62358,0.50644976,-0.4802368,41.408447,185000
|
| 39 |
+
0.18619436,8.898512,-60.371918,-176.73882,-203.45851,0.36278498,-0.35838374,43.241543,190000
|
| 40 |
+
0.18762627,9.508407,-0.4343899,-177.361,-203.99606,0.2762337,-0.26653308,30.430433,195000
|
| 41 |
+
0.20323114,7.466835,-69.70901,-176.06212,-204.45634,0.43752846,-0.31933892,48.47429,200000
|
| 42 |
+
0.149149,8.72137,-71.69821,-175.92441,-204.91231,0.28449756,-0.33796155,36.465256,205000
|
| 43 |
+
0.21693437,11.013214,9.617605,-175.90817,-204.07083,0.4408687,-0.38326004,34.807076,210000
|
| 44 |
+
0.16310221,8.086323,-44.038647,-177.63438,-204.8523,0.2781485,-0.56449175,50.1952,215000
|
| 45 |
+
0.18480477,14.997312,3.6649992,-176.11674,-204.64165,0.48845285,-0.51833814,40.4987,220000
|
| 46 |
+
0.19855438,15.625043,-78.96751,-177.41434,-204.49408,0.536582,-0.53602564,46.924194,225000
|
| 47 |
+
0.18435363,15.741793,-31.86943,-174.56174,-204.3722,0.32132497,-0.477739,50.353996,230000
|
| 48 |
+
0.18302897,10.163614,-15.155638,-175.39832,-203.91628,0.310676,-0.30418682,32.975597,235000
|
| 49 |
+
0.17074169,10.666033,-54.93844,-174.59154,-204.2583,0.39192992,-0.3883174,34.97396,240000
|
| 50 |
+
0.22462136,10.256366,-78.193,-178.51389,-203.75601,0.35951412,-0.33460158,32.95401,245000
|
| 51 |
+
0.17855287,10.678003,-74.39879,-175.60118,-203.8619,0.8643082,-1.0243653,44.399002,250000
|
| 52 |
+
0.18033496,8.600341,-65.015274,-175.14507,-204.23727,0.30660152,-0.3148681,27.240978,255000
|
| 53 |
+
0.20033854,16.335545,-104.81373,-177.44077,-203.45596,0.34542868,-0.39387253,38.580883,260000
|
| 54 |
+
0.17611212,8.570842,-59.99251,-177.70596,-204.47925,0.6681185,-0.7233949,44.489777,265000
|
| 55 |
+
0.19722468,12.228405,-64.58595,-175.81438,-203.83583,2.8526893,-2.5207944,55.607323,270000
|
| 56 |
+
0.15080622,12.216154,-78.5184,-176.56688,-203.85136,0.54123867,-0.44015995,51.417202,275000
|
| 57 |
+
0.181729,8.055255,-45.50894,-175.71382,-203.84756,0.33569494,-0.26509184,31.899084,280000
|
| 58 |
+
0.18201496,10.74344,-57.31417,-176.14606,-204.61707,0.6530031,-0.67076063,38.11831,285000
|
| 59 |
+
0.18609384,9.043329,-68.50747,-176.99817,-203.72507,3.1292114,-2.7779293,59.57299,290000
|
| 60 |
+
0.18487953,9.149382,-64.40253,-178.29034,-204.4731,0.38540998,-0.45007154,33.791756,295000
|
| 61 |
+
0.1659853,10.961419,-68.96994,-176.20398,-204.86537,0.37394455,-0.28137177,31.967884,300000
|
| 62 |
+
0.19489208,9.967456,-75.37551,-175.0072,-203.57115,0.2885093,-0.25662684,30.887424,305000
|
| 63 |
+
0.1786471,8.580081,-76.09501,-175.1045,-203.67293,0.5026161,-0.71852833,53.348183,310000
|
| 64 |
+
0.1747536,9.727026,-46.331203,-175.98534,-203.8734,0.37464824,-0.38114658,37.315487,315000
|
| 65 |
+
0.20842317,6.3737907,-82.89411,-179.5978,-204.20189,0.23013249,-0.23184882,21.751581,320000
|
| 66 |
+
0.16623078,8.716532,-51.253788,-174.1461,-203.65283,0.34073305,-0.3351776,29.21607,325000
|
| 67 |
+
0.19954458,11.422931,-57.723885,-176.21062,-204.01224,0.33332935,-0.3794353,31.6975,330000
|
| 68 |
+
0.1993344,14.702046,-6.403887,-172.98393,-204.01909,0.49393123,-0.52635866,34.586,335000
|
| 69 |
+
0.18502632,5.9707885,-44.615,-176.7638,-204.16078,0.13301742,-0.1927584,18.461548,340000
|
| 70 |
+
0.19235294,7.947454,-83.1322,-176.13753,-204.11761,0.3326626,-0.47231954,39.085293,345000
|
| 71 |
+
0.19504118,9.65188,-103.671036,-178.18257,-203.94449,0.35701528,-0.37312052,32.11786,350000
|
| 72 |
+
0.18084197,10.214626,-59.491447,-174.79884,-204.18803,0.23678471,-0.3493546,29.694084,355000
|
| 73 |
+
0.1826394,10.411242,-37.16139,-175.06265,-204.1485,0.37160683,-0.30059543,37.771763,360000
|
| 74 |
+
0.18597266,8.776676,1.3264477,-176.35722,-204.27435,0.45543388,-0.32944667,43.130028,365000
|
| 75 |
+
0.1865386,14.644762,-3.0635018,-174.89801,-203.60727,0.56479883,-0.66281766,41.157833,370000
|
| 76 |
+
0.2007168,7.900989,-43.98884,-174.02432,-203.878,0.377675,-0.31602502,30.287308,375000
|
| 77 |
+
0.16263497,10.409789,-10.44767,-174.74841,-203.62936,0.5006024,-0.3564423,33.285095,380000
|
| 78 |
+
0.17019355,7.8283663,-62.6827,-178.68384,-203.50333,0.24290428,-0.2995929,28.36991,385000
|
| 79 |
+
0.18800713,16.039133,-97.08411,-175.3778,-203.49069,4.6168466,-5.788005,140.10515,390000
|
| 80 |
+
0.1621884,8.175971,0.574664,-177.0053,-204.29678,0.3496675,-0.2341836,23.723028,395000
|
| 81 |
+
0.20187888,7.4770103,-70.87141,-177.35452,-203.76915,0.3232386,-0.29282138,28.242332,400000
|
| 82 |
+
0.20800614,8.942917,0.33533615,-175.78238,-203.50003,0.6467213,-0.6154228,28.404411,405000
|
| 83 |
+
0.18236774,8.681981,-68.225975,-175.13947,-204.17096,0.20659342,-0.38781953,32.189842,410000
|
| 84 |
+
0.18214078,9.452962,-75.18308,-177.27036,-203.48239,0.5225291,-0.21480225,40.187458,415000
|
| 85 |
+
0.17526864,9.006652,-70.76112,-175.79492,-203.95653,0.33445737,-0.3587155,28.740881,420000
|
| 86 |
+
0.17456919,14.652041,-102.572876,-176.85942,-203.96109,2.2507203,-1.7145798,62.233883,425000
|
| 87 |
+
0.20711625,12.709131,1.2175183,-174.9163,-203.37875,1.5218834,-1.6583734,64.66237,430000
|
| 88 |
+
0.17329527,10.782718,-47.29656,-176.58646,-203.40923,0.32239044,-0.20959924,29.168133,435000
|
| 89 |
+
0.17125738,7.262764,-73.422195,-177.12495,-203.55421,0.3278833,-0.17248656,26.447132,440000
|
| 90 |
+
0.18168183,14.086484,-64.99694,-177.5575,-203.8996,0.8533774,-1.1266291,61.042694,445000
|
| 91 |
+
0.2101819,10.9659,-81.92206,-179.24681,-203.63045,0.32431543,-0.29455855,28.798256,450000
|
| 92 |
+
0.17863376,7.5683975,-96.87289,-180.87817,-203.54599,0.3371074,-0.32175097,27.6495,455000
|
| 93 |
+
0.1991334,9.952606,-43.718815,-174.21947,-202.97144,0.5642773,-0.27643144,26.83507,460000
|
| 94 |
+
0.18019494,9.603603,1.9194007,-175.86833,-203.68808,2.22195,-2.0727642,56.075775,465000
|
| 95 |
+
0.19479692,7.4485855,-45.995792,-172.25116,-203.38925,0.31049466,-0.2845689,28.203503,470000
|
| 96 |
+
0.20131885,12.662799,-53.051834,-172.64838,-204.12212,0.556581,-0.57661504,29.343002,475000
|
| 97 |
+
0.20042014,6.9539895,-53.09674,-175.63936,-203.61186,0.3758329,-0.4219207,30.115482,480000
|
| 98 |
+
0.19108993,9.440498,-67.77108,-177.97472,-205.33353,0.35064584,-0.41115624,37.54677,485000
|
| 99 |
+
0.19145632,5.7101383,-63.732777,-176.53185,-204.05122,0.28346556,-0.17327559,21.628132,490000
|
| 100 |
+
0.22412857,7.590519,-65.48031,-178.12634,-204.02579,0.21912844,-0.4339251,34.587692,495000
|
| 101 |
+
0.20809504,5.6422677,-74.8663,-178.93973,-204.54053,0.11741142,-0.27536625,22.479395,500000
|
| 102 |
+
0.17983408,5.9542713,-63.35095,-178.18948,-204.8549,0.26684695,-0.2867067,23.999868,505000
|
| 103 |
+
0.1791244,12.710341,-82.30557,-177.82957,-203.16441,0.38618758,-0.35122076,26.877563,510000
|
| 104 |
+
0.2016632,7.921678,1.9119928,-176.10228,-203.7279,1.9592754,-3.0847511,65.2014,515000
|
| 105 |
+
0.17117189,10.601939,1.323573,-174.0894,-203.5431,0.5357702,-0.35093594,40.373398,520000
|
| 106 |
+
0.1955184,13.821261,-82.80296,-172.9385,-203.7862,3.310864,-3.6234572,66.2062,525000
|
| 107 |
+
0.18308201,20.33069,-97.10309,-178.72057,-203.83197,0.5148756,-0.40725213,40.349606,530000
|
| 108 |
+
0.16661021,10.353349,-37.70305,-176.66496,-203.5977,0.47808212,-0.50937736,30.3852,535000
|
| 109 |
+
0.19834371,8.5529375,0.8800143,-177.1328,-202.86003,0.44981736,-0.42036676,25.796131,540000
|
| 110 |
+
0.20935127,12.4011755,-72.86931,-174.38516,-203.10408,0.3373635,-0.4372619,31.678923,545000
|
| 111 |
+
0.19310363,9.234894,-48.057312,-176.73566,-203.06471,0.5064757,-0.20498134,21.886612,550000
|
| 112 |
+
0.17149091,8.53102,-74.65598,-174.95244,-203.27145,0.33652544,-0.4112741,22.547543,555000
|
| 113 |
+
0.20834485,11.1471405,-70.893295,-177.02837,-203.62126,0.9492786,-0.96698165,27.572254,560000
|
| 114 |
+
0.19884428,11.309203,-83.26866,-177.8103,-203.28601,0.455847,-0.31816268,33.279278,565000
|
| 115 |
+
0.18764558,10.024457,-69.68084,-173.39456,-202.72337,0.51733017,-0.5346291,28.596342,570000
|
| 116 |
+
0.16744545,9.589742,-85.23643,-176.06775,-203.3087,0.2660019,-0.3060756,25.912086,575000
|
| 117 |
+
0.18209806,9.392828,-76.41639,-178.49825,-203.5883,0.31857222,-0.3911255,26.91999,580000
|
| 118 |
+
0.17296046,9.247537,-86.131256,-178.65056,-203.6136,0.3537409,-0.18543923,23.278214,585000
|
| 119 |
+
0.1416823,7.8934073,-95.29657,-177.11339,-203.49,0.35222116,-0.38819164,25.741001,590000
|
| 120 |
+
0.16364354,13.406894,-75.43007,-175.99773,-203.17441,0.3397001,-0.5786744,28.65539,595000
|
| 121 |
+
0.19178584,14.1234045,-31.915878,-175.85153,-203.19176,0.4741148,-0.51731896,36.26206,600000
|
| 122 |
+
0.18353903,12.300928,-61.678112,-176.16862,-203.03154,1.6873281,-1.6272165,35.79017,605000
|
| 123 |
+
0.16485739,9.501182,-64.53064,-177.29771,-203.47067,0.6109389,-0.50918585,34.42812,610000
|
| 124 |
+
0.1558181,10.551704,2.1070507,-173.24113,-202.4765,0.26961997,-0.2529044,27.71278,615000
|
| 125 |
+
0.1783495,11.571052,-52.795013,-173.42348,-202.57703,0.48861352,-0.4369563,33.280354,620000
|
| 126 |
+
0.21134442,11.379229,-71.5627,-175.6222,-203.82458,1.1612065,-1.3439969,39.483215,625000
|
| 127 |
+
0.21542525,7.13398,-63.363552,-178.78716,-203.1557,0.33497152,-0.33824283,22.09592,630000
|
| 128 |
+
0.1725318,17.185179,-41.065006,-173.8333,-204.2577,0.3358809,-0.5341474,45.43016,635000
|
| 129 |
+
0.19532631,7.030933,-104.3283,-179.71342,-203.3166,1.0401255,-0.9294013,28.228909,640000
|
| 130 |
+
0.19826803,11.443084,-75.819,-174.60677,-203.44028,0.47424817,-0.2710683,27.012983,645000
|
| 131 |
+
0.17010707,10.711202,-81.6013,-180.70232,-203.77034,0.20232691,-0.44657215,33.199886,650000
|
| 132 |
+
0.17809609,11.737411,-71.1387,-176.04173,-203.13628,0.22177032,-0.18313825,24.093052,655000
|
| 133 |
+
0.16658844,13.641986,-41.180046,-176.04175,-202.81815,0.5683535,-0.41895932,38.545662,660000
|
| 134 |
+
0.21062283,9.804014,-63.81216,-173.82945,-203.64883,0.39297634,-0.3766547,30.608707,665000
|
| 135 |
+
0.19701226,10.565572,-32.633976,-176.32886,-203.08926,0.48114738,-0.5161284,29.695581,670000
|
| 136 |
+
0.18618184,12.048018,-101.52612,-177.63301,-204.01222,0.21825413,-0.20717955,24.707483,675000
|
| 137 |
+
0.15344617,8.952672,-68.48101,-174.41043,-204.20752,0.26614317,-0.32660607,30.058659,680000
|
| 138 |
+
0.16749488,7.6905055,-54.37334,-177.97234,-204.19432,0.12781537,-0.21798995,17.578716,685000
|
| 139 |
+
0.1898359,7.172278,-56.811264,-178.77849,-203.7864,0.16589817,-0.23359782,20.58165,690000
|
| 140 |
+
0.19481382,5.8471913,-67.5818,-176.8985,-203.04558,0.1354344,-0.17261837,18.409264,695000
|
| 141 |
+
0.18433763,17.525358,-46.541264,-177.3024,-203.33763,0.4119636,-0.23354362,31.87931,700000
|
| 142 |
+
0.18537292,11.137821,-3.8852925,-175.04306,-204.07028,0.27921864,-0.6453871,33.27543,705000
|
| 143 |
+
0.16982934,16.07414,2.6440024,-175.33995,-202.89905,0.3665095,-0.32109278,33.182312,710000
|
| 144 |
+
0.19421667,8.458293,-61.890205,-178.1659,-203.44757,0.3206222,-0.3245213,27.014622,715000
|
| 145 |
+
0.21625805,18.186567,-71.338844,-175.5203,-203.261,0.62988615,-0.57491845,40.63931,720000
|
| 146 |
+
0.16456164,7.604412,-90.71314,-177.91924,-203.41147,2.2395306,-2.269694,34.51136,725000
|
| 147 |
+
0.19586705,6.4284067,-75.81182,-179.28764,-203.84978,0.42892164,-0.3542689,24.498144,730000
|
| 148 |
+
0.19537929,14.818248,-58.250824,-179.83868,-204.09189,0.68647844,-0.67601764,36.169067,735000
|
| 149 |
+
0.16433044,8.262046,-37.566708,-176.84988,-203.0474,0.6030815,-0.25808105,26.844566,740000
|
| 150 |
+
0.20389801,8.609985,-91.76918,-178.12039,-204.01172,0.58710957,-0.5150835,37.19711,745000
|
| 151 |
+
0.14932854,20.293379,-73.2633,-176.31505,-202.73451,1.0744755,-1.0807639,52.10396,750000
|
| 152 |
+
0.17994343,17.076424,-40.651516,-178.72737,-203.5938,0.5592246,-0.39011645,37.475193,755000
|
| 153 |
+
0.21013075,8.119754,-80.57041,-177.22203,-203.08658,0.42089373,-0.2555741,25.980528,760000
|
| 154 |
+
0.17699379,20.796125,0.6790317,-175.08955,-203.4231,0.60283697,-0.5392834,46.59005,765000
|
| 155 |
+
0.18541014,16.57103,-67.66742,-178.88283,-203.26283,0.35717332,-0.35141,26.898758,770000
|
| 156 |
+
0.17163801,14.091037,-42.3174,-176.30136,-203.35449,0.35948148,-0.28304803,28.172668,775000
|
| 157 |
+
0.19974089,14.091771,-70.957794,-178.5283,-203.5635,0.461352,-0.50068015,32.15514,780000
|
| 158 |
+
0.18929888,23.404638,-11.739143,-176.75821,-203.21808,0.47534198,-0.4313756,36.389008,785000
|
| 159 |
+
0.17992416,8.618688,-73.39999,-177.05228,-202.92485,0.2569378,-0.2422928,21.381367,790000
|
| 160 |
+
0.16669992,39.57182,-68.2278,-177.4837,-203.52676,0.8014647,-0.599663,57.07411,795000
|
| 161 |
+
0.22184645,6.4670024,-65.67699,-179.63953,-203.18764,0.21850312,-0.16734204,22.307976,800000
|
| 162 |
+
0.19708456,11.665452,-10.557921,-174.92647,-203.0007,0.59088016,-0.2598145,38.318413,805000
|
| 163 |
+
0.20474786,7.8969855,-6.743909,-175.99991,-202.85736,0.33975035,-0.34594113,26.696884,810000
|
| 164 |
+
0.16486734,9.897898,-72.33111,-178.27483,-203.59271,0.2507502,-0.22966091,21.816359,815000
|
| 165 |
+
0.17501412,11.130804,-59.756325,-178.62816,-203.05255,0.30275416,-0.20521145,22.527536,820000
|
| 166 |
+
0.17853147,7.4163704,-101.91772,-180.9396,-203.00537,0.7358666,-0.7350613,35.52002,825000
|
| 167 |
+
0.18389918,14.636246,-79.69357,-177.71266,-203.44832,0.6074297,-0.20698142,36.13571,830000
|
| 168 |
+
0.19573191,9.317721,-91.723236,-178.49702,-203.24501,0.17878549,-0.46021965,28.71059,835000
|
| 169 |
+
0.16223106,8.761571,-40.76166,-178.6514,-203.03497,1.5373362,-1.7807736,34.17866,840000
|
| 170 |
+
0.19353628,7.0670776,-91.712006,-177.45918,-203.32869,0.30027068,-0.28412616,18.533554,845000
|
| 171 |
+
0.18411365,11.303052,-22.235828,-176.19788,-202.74065,0.21807301,-0.23986627,24.295721,850000
|
| 172 |
+
0.17856139,9.591498,-33.208538,-176.52243,-202.96979,0.31685352,-0.32390782,26.777267,855000
|
| 173 |
+
0.18469197,6.256099,1.026981,-178.13535,-203.71577,0.32762295,-0.30785954,21.339245,860000
|
| 174 |
+
0.17590055,9.375567,-84.88081,-175.40466,-202.96619,0.34743083,-0.47419137,26.347094,865000
|
| 175 |
+
0.1620523,12.150607,-73.870735,-179.8535,-203.2777,0.29588714,-0.5470557,30.55983,870000
|
| 176 |
+
0.1800977,16.39172,-77.871735,-177.92972,-203.26929,0.48615974,-0.55690056,35.918037,875000
|
| 177 |
+
0.17042303,7.2322974,-95.204735,-180.7122,-204.11195,0.20124082,-0.59035957,32.701202,880000
|
| 178 |
+
0.19218528,14.248908,-81.78551,-179.69083,-203.28839,0.29612112,-0.24637285,26.612545,885000
|
| 179 |
+
0.18052623,11.284881,-57.685654,-178.52196,-203.61478,0.42033178,-0.6678503,41.05313,890000
|
| 180 |
+
0.17466336,14.608185,-62.374836,-177.8851,-203.37189,0.49522328,-0.6901214,33.864555,895000
|
| 181 |
+
0.18055347,22.719696,-91.20747,-176.98586,-203.26039,0.6601001,-0.6331504,43.723694,900000
|
| 182 |
+
0.18953308,18.114645,-22.640364,-175.14635,-203.12727,0.8940666,-0.814749,40.20027,905000
|
| 183 |
+
0.17470433,8.481158,-92.515434,-178.66023,-203.37123,0.5888612,-0.5107118,28.072943,910000
|
| 184 |
+
0.17402588,7.05832,-7.4578004,-176.56718,-203.70238,0.3681615,-0.22545142,26.853588,915000
|
| 185 |
+
0.21146473,7.44305,-76.826195,-177.66115,-203.12166,0.1536905,-0.27790952,21.435902,920000
|
| 186 |
+
0.19336364,8.784098,-97.72967,-178.37254,-203.16191,0.4060213,-0.28592318,29.733473,925000
|
| 187 |
+
0.18147945,7.573009,-83.0376,-180.97307,-203.48549,0.2837768,-0.2635515,19.305643,930000
|
| 188 |
+
0.17937857,11.017553,-3.5259583,-179.187,-203.15067,0.3436123,-0.35364234,30.372026,935000
|
| 189 |
+
0.18078054,10.327917,-73.78657,-176.72952,-203.3846,0.4664162,-0.49225008,26.690582,940000
|
| 190 |
+
0.17969218,7.220001,-74.313065,-175.75589,-202.9745,0.3364722,-0.35966638,24.738325,945000
|
| 191 |
+
0.19654562,16.844511,-43.34753,-173.44057,-203.01697,0.37875795,-0.36540884,33.914314,950000
|
| 192 |
+
0.16110492,14.329569,-79.73295,-177.09537,-202.91437,0.22135824,-0.33609667,26.710361,955000
|
| 193 |
+
0.20876661,15.805875,-64.01766,-176.03192,-203.21722,0.4924379,-0.5183765,32.49788,960000
|
| 194 |
+
0.1941939,14.070063,0.7983184,-178.95735,-203.14268,0.21343291,-0.47956648,34.02712,965000
|
| 195 |
+
0.1799463,18.940178,-3.91785,-177.89815,-203.48817,0.33064157,-0.33677244,30.144667,970000
|
| 196 |
+
0.16496721,7.598241,-58.31274,-178.66917,-203.1901,0.22558054,-0.25666,20.138487,975000
|
| 197 |
+
0.21446556,11.647531,-96.66001,-176.00443,-202.4876,0.5250865,-0.3577407,34.529663,980000
|
| 198 |
+
0.16609342,10.979478,-100.81739,-176.26205,-203.24489,0.5349783,-0.569991,44.990177,985000
|
| 199 |
+
0.17175654,6.5255694,-57.88425,-175.15457,-202.69514,0.4399467,-0.16720355,24.377169,990000
|
| 200 |
+
0.19219038,6.967776,-64.30135,-178.49791,-203.90947,0.28859782,-0.26273203,20.119186,995000
|
| 201 |
+
0.15500735,6.2614727,-67.7509,-178.0753,-203.52426,0.3378133,-0.3072808,19.489933,1000000
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/offline_agent_sv.csv
ADDED
|
@@ -0,0 +1,201 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.25540215,10.974189,-51.310406,-134.86209,-149.63945,1.0857989,-0.9795562,101.62308,5000
|
| 3 |
+
0.238886,13.487701,-45.120064,-146.16504,-175.55173,2.978727,-3.3418326,198.96143,10000
|
| 4 |
+
0.2434863,16.339731,2.842378,-158.4334,-190.37859,2.837904,-2.7242897,165.41515,15000
|
| 5 |
+
0.22942467,17.516342,-72.94863,-162.07031,-199.11548,3.596026,-3.7701676,195.49704,20000
|
| 6 |
+
0.22063157,10.888938,-81.05209,-169.08699,-195.72134,3.5196416,-4.06929,124.45003,25000
|
| 7 |
+
0.23476799,14.907798,4.7973976,-166.32263,-204.00536,7.6574993,-8.382183,273.2664,30000
|
| 8 |
+
0.19571728,15.314038,-35.305454,-168.17877,-202.35619,3.1402278,-2.7660816,152.43547,35000
|
| 9 |
+
0.21247646,15.560771,-74.41953,-169.05826,-204.03201,0.8477313,-0.70746315,91.43347,40000
|
| 10 |
+
0.21187393,10.761474,-69.903725,-171.46257,-203.24084,1.788118,-1.9197057,83.78401,45000
|
| 11 |
+
0.20850892,16.165735,-61.800583,-171.58778,-205.28502,1.0094855,-1.1396629,85.853935,50000
|
| 12 |
+
0.2409667,10.392382,-46.024055,-172.61172,-203.50204,1.0816896,-1.1937099,68.07026,55000
|
| 13 |
+
0.19807824,11.886193,-47.30768,-171.58931,-204.88792,0.45869732,-0.4865485,62.97229,60000
|
| 14 |
+
0.2002394,13.8417635,-74.85866,-174.89543,-204.86415,0.86080545,-0.9346077,74.132225,65000
|
| 15 |
+
0.23985295,6.632146,-65.03468,-173.74532,-205.17479,0.25249428,-0.36034226,40.08827,70000
|
| 16 |
+
0.19657654,8.901059,-84.86313,-173.78833,-203.68088,0.5138353,-0.4604865,61.967728,75000
|
| 17 |
+
0.17855644,11.720831,-13.429113,-174.718,-204.66193,0.4056168,-0.37693188,51.72174,80000
|
| 18 |
+
0.23821905,10.835658,-58.2096,-176.23041,-206.17693,0.31579083,-0.40894398,51.00181,85000
|
| 19 |
+
0.20860054,10.0476885,-16.45339,-174.36806,-204.30087,0.49631196,-0.41993272,44.99784,90000
|
| 20 |
+
0.19105145,10.022347,-42.95629,-174.10376,-205.26166,0.2995714,-0.33619702,47.351738,95000
|
| 21 |
+
0.21118313,6.408134,-24.462456,-174.40758,-205.04608,0.62183946,-0.6007043,52.10521,100000
|
| 22 |
+
0.22108328,13.210605,-15.524338,-174.6458,-205.19838,2.117079,-2.1060612,73.40668,105000
|
| 23 |
+
0.22795461,11.383198,2.2797587,-175.33475,-203.61235,5.406445,-5.447198,140.15085,110000
|
| 24 |
+
0.18094668,10.537711,1.7294505,-175.97147,-204.93631,0.41404408,-0.38606802,48.81413,115000
|
| 25 |
+
0.20840031,14.568932,-10.738529,-176.24393,-204.53252,0.9881698,-1.1944283,66.68321,120000
|
| 26 |
+
0.18375123,12.059062,-9.280594,-174.40842,-204.95195,5.003008,-4.242748,107.6398,125000
|
| 27 |
+
0.20164472,9.292851,2.5677543,-174.06255,-205.80476,0.33271137,-0.2723577,46.347954,130000
|
| 28 |
+
0.19098242,9.601527,-83.889534,-177.22008,-204.55998,0.48418817,-0.44966847,45.462254,135000
|
| 29 |
+
0.19499543,6.50782,-49.43894,-173.11617,-205.25748,0.3984913,-0.39350155,39.363297,140000
|
| 30 |
+
0.20537147,30.484247,-59.69584,-172.1532,-205.30418,1.5080892,-1.5029309,93.09696,145000
|
| 31 |
+
0.16680363,9.127662,-17.210823,-173.20773,-204.51819,0.25971246,-0.25133267,36.314423,150000
|
| 32 |
+
0.20190442,12.986679,-12.524004,-172.819,-204.77634,2.1801443,-1.6011753,58.862835,155000
|
| 33 |
+
0.18755482,11.956634,-97.60718,-175.48097,-204.19115,0.2769315,-0.37583068,39.593525,160000
|
| 34 |
+
0.18515027,8.692528,2.237268,-174.92413,-203.93483,1.5857209,-1.7179826,45.079033,165000
|
| 35 |
+
0.20941195,9.499224,-65.74033,-175.0416,-205.0735,0.35822284,-0.31277177,39.765358,170000
|
| 36 |
+
0.21535347,7.09039,-34.96859,-175.17276,-205.13516,0.23423736,-0.22946641,33.54837,175000
|
| 37 |
+
0.2008887,12.346757,-63.91099,-174.4281,-204.76788,0.4465866,-0.43599522,39.355663,180000
|
| 38 |
+
0.20915869,10.656283,-87.16193,-174.3223,-204.62358,0.50644976,-0.4802368,41.408447,185000
|
| 39 |
+
0.18619436,8.898512,-60.371918,-176.73882,-203.45851,0.36278498,-0.35838374,43.241543,190000
|
| 40 |
+
0.18762627,9.508407,-0.4343899,-177.361,-203.99606,0.2762337,-0.26653308,30.430433,195000
|
| 41 |
+
0.20323114,7.466835,-69.70901,-176.06212,-204.45634,0.43752846,-0.31933892,48.47429,200000
|
| 42 |
+
0.149149,8.72137,-71.69821,-175.92441,-204.91231,0.28449756,-0.33796155,36.465256,205000
|
| 43 |
+
0.21693437,11.013214,9.617605,-175.90817,-204.07083,0.4408687,-0.38326004,34.807076,210000
|
| 44 |
+
0.16310221,8.086323,-44.038647,-177.63438,-204.8523,0.2781485,-0.56449175,50.1952,215000
|
| 45 |
+
0.18480477,14.997312,3.6649992,-176.11674,-204.64165,0.48845285,-0.51833814,40.4987,220000
|
| 46 |
+
0.19855438,15.625043,-78.96751,-177.41434,-204.49408,0.536582,-0.53602564,46.924194,225000
|
| 47 |
+
0.18435363,15.741793,-31.86943,-174.56174,-204.3722,0.32132497,-0.477739,50.353996,230000
|
| 48 |
+
0.18302897,10.163614,-15.155638,-175.39832,-203.91628,0.310676,-0.30418682,32.975597,235000
|
| 49 |
+
0.17074169,10.666033,-54.93844,-174.59154,-204.2583,0.39192992,-0.3883174,34.97396,240000
|
| 50 |
+
0.22462136,10.256366,-78.193,-178.51389,-203.75601,0.35951412,-0.33460158,32.95401,245000
|
| 51 |
+
0.17855287,10.678003,-74.39879,-175.60118,-203.8619,0.8643082,-1.0243653,44.399002,250000
|
| 52 |
+
0.18033496,8.600341,-65.015274,-175.14507,-204.23727,0.30660152,-0.3148681,27.240978,255000
|
| 53 |
+
0.20033854,16.335545,-104.81373,-177.44077,-203.45596,0.34542868,-0.39387253,38.580883,260000
|
| 54 |
+
0.17611212,8.570842,-59.99251,-177.70596,-204.47925,0.6681185,-0.7233949,44.489777,265000
|
| 55 |
+
0.19722468,12.228405,-64.58595,-175.81438,-203.83583,2.8526893,-2.5207944,55.607323,270000
|
| 56 |
+
0.15080622,12.216154,-78.5184,-176.56688,-203.85136,0.54123867,-0.44015995,51.417202,275000
|
| 57 |
+
0.181729,8.055255,-45.50894,-175.71382,-203.84756,0.33569494,-0.26509184,31.899084,280000
|
| 58 |
+
0.18201496,10.74344,-57.31417,-176.14606,-204.61707,0.6530031,-0.67076063,38.11831,285000
|
| 59 |
+
0.18609384,9.043329,-68.50747,-176.99817,-203.72507,3.1292114,-2.7779293,59.57299,290000
|
| 60 |
+
0.18487953,9.149382,-64.40253,-178.29034,-204.4731,0.38540998,-0.45007154,33.791756,295000
|
| 61 |
+
0.1659853,10.961419,-68.96994,-176.20398,-204.86537,0.37394455,-0.28137177,31.967884,300000
|
| 62 |
+
0.19489208,9.967456,-75.37551,-175.0072,-203.57115,0.2885093,-0.25662684,30.887424,305000
|
| 63 |
+
0.1786471,8.580081,-76.09501,-175.1045,-203.67293,0.5026161,-0.71852833,53.348183,310000
|
| 64 |
+
0.1747536,9.727026,-46.331203,-175.98534,-203.8734,0.37464824,-0.38114658,37.315487,315000
|
| 65 |
+
0.20842317,6.3737907,-82.89411,-179.5978,-204.20189,0.23013249,-0.23184882,21.751581,320000
|
| 66 |
+
0.16623078,8.716532,-51.253788,-174.1461,-203.65283,0.34073305,-0.3351776,29.21607,325000
|
| 67 |
+
0.19954458,11.422931,-57.723885,-176.21062,-204.01224,0.33332935,-0.3794353,31.6975,330000
|
| 68 |
+
0.1993344,14.702046,-6.403887,-172.98393,-204.01909,0.49393123,-0.52635866,34.586,335000
|
| 69 |
+
0.18502632,5.9707885,-44.615,-176.7638,-204.16078,0.13301742,-0.1927584,18.461548,340000
|
| 70 |
+
0.19235294,7.947454,-83.1322,-176.13753,-204.11761,0.3326626,-0.47231954,39.085293,345000
|
| 71 |
+
0.19504118,9.65188,-103.671036,-178.18257,-203.94449,0.35701528,-0.37312052,32.11786,350000
|
| 72 |
+
0.18084197,10.214626,-59.491447,-174.79884,-204.18803,0.23678471,-0.3493546,29.694084,355000
|
| 73 |
+
0.1826394,10.411242,-37.16139,-175.06265,-204.1485,0.37160683,-0.30059543,37.771763,360000
|
| 74 |
+
0.18597266,8.776676,1.3264477,-176.35722,-204.27435,0.45543388,-0.32944667,43.130028,365000
|
| 75 |
+
0.1865386,14.644762,-3.0635018,-174.89801,-203.60727,0.56479883,-0.66281766,41.157833,370000
|
| 76 |
+
0.2007168,7.900989,-43.98884,-174.02432,-203.878,0.377675,-0.31602502,30.287308,375000
|
| 77 |
+
0.16263497,10.409789,-10.44767,-174.74841,-203.62936,0.5006024,-0.3564423,33.285095,380000
|
| 78 |
+
0.17019355,7.8283663,-62.6827,-178.68384,-203.50333,0.24290428,-0.2995929,28.36991,385000
|
| 79 |
+
0.18800713,16.039133,-97.08411,-175.3778,-203.49069,4.6168466,-5.788005,140.10515,390000
|
| 80 |
+
0.1621884,8.175971,0.574664,-177.0053,-204.29678,0.3496675,-0.2341836,23.723028,395000
|
| 81 |
+
0.20187888,7.4770103,-70.87141,-177.35452,-203.76915,0.3232386,-0.29282138,28.242332,400000
|
| 82 |
+
0.20800614,8.942917,0.33533615,-175.78238,-203.50003,0.6467213,-0.6154228,28.404411,405000
|
| 83 |
+
0.18236774,8.681981,-68.225975,-175.13947,-204.17096,0.20659342,-0.38781953,32.189842,410000
|
| 84 |
+
0.18214078,9.452962,-75.18308,-177.27036,-203.48239,0.5225291,-0.21480225,40.187458,415000
|
| 85 |
+
0.17526864,9.006652,-70.76112,-175.79492,-203.95653,0.33445737,-0.3587155,28.740881,420000
|
| 86 |
+
0.17456919,14.652041,-102.572876,-176.85942,-203.96109,2.2507203,-1.7145798,62.233883,425000
|
| 87 |
+
0.20711625,12.709131,1.2175183,-174.9163,-203.37875,1.5218834,-1.6583734,64.66237,430000
|
| 88 |
+
0.17329527,10.782718,-47.29656,-176.58646,-203.40923,0.32239044,-0.20959924,29.168133,435000
|
| 89 |
+
0.17125738,7.262764,-73.422195,-177.12495,-203.55421,0.3278833,-0.17248656,26.447132,440000
|
| 90 |
+
0.18168183,14.086484,-64.99694,-177.5575,-203.8996,0.8533774,-1.1266291,61.042694,445000
|
| 91 |
+
0.2101819,10.9659,-81.92206,-179.24681,-203.63045,0.32431543,-0.29455855,28.798256,450000
|
| 92 |
+
0.17863376,7.5683975,-96.87289,-180.87817,-203.54599,0.3371074,-0.32175097,27.6495,455000
|
| 93 |
+
0.1991334,9.952606,-43.718815,-174.21947,-202.97144,0.5642773,-0.27643144,26.83507,460000
|
| 94 |
+
0.18019494,9.603603,1.9194007,-175.86833,-203.68808,2.22195,-2.0727642,56.075775,465000
|
| 95 |
+
0.19479692,7.4485855,-45.995792,-172.25116,-203.38925,0.31049466,-0.2845689,28.203503,470000
|
| 96 |
+
0.20131885,12.662799,-53.051834,-172.64838,-204.12212,0.556581,-0.57661504,29.343002,475000
|
| 97 |
+
0.20042014,6.9539895,-53.09674,-175.63936,-203.61186,0.3758329,-0.4219207,30.115482,480000
|
| 98 |
+
0.19108993,9.440498,-67.77108,-177.97472,-205.33353,0.35064584,-0.41115624,37.54677,485000
|
| 99 |
+
0.19145632,5.7101383,-63.732777,-176.53185,-204.05122,0.28346556,-0.17327559,21.628132,490000
|
| 100 |
+
0.22412857,7.590519,-65.48031,-178.12634,-204.02579,0.21912844,-0.4339251,34.587692,495000
|
| 101 |
+
0.20809504,5.6422677,-74.8663,-178.93973,-204.54053,0.11741142,-0.27536625,22.479395,500000
|
| 102 |
+
0.17983408,5.9542713,-63.35095,-178.18948,-204.8549,0.26684695,-0.2867067,23.999868,505000
|
| 103 |
+
0.1791244,12.710341,-82.30557,-177.82957,-203.16441,0.38618758,-0.35122076,26.877563,510000
|
| 104 |
+
0.2016632,7.921678,1.9119928,-176.10228,-203.7279,1.9592754,-3.0847511,65.2014,515000
|
| 105 |
+
0.17117189,10.601939,1.323573,-174.0894,-203.5431,0.5357702,-0.35093594,40.373398,520000
|
| 106 |
+
0.1955184,13.821261,-82.80296,-172.9385,-203.7862,3.310864,-3.6234572,66.2062,525000
|
| 107 |
+
0.18308201,20.33069,-97.10309,-178.72057,-203.83197,0.5148756,-0.40725213,40.349606,530000
|
| 108 |
+
0.16661021,10.353349,-37.70305,-176.66496,-203.5977,0.47808212,-0.50937736,30.3852,535000
|
| 109 |
+
0.19834371,8.5529375,0.8800143,-177.1328,-202.86003,0.44981736,-0.42036676,25.796131,540000
|
| 110 |
+
0.20935127,12.4011755,-72.86931,-174.38516,-203.10408,0.3373635,-0.4372619,31.678923,545000
|
| 111 |
+
0.19310363,9.234894,-48.057312,-176.73566,-203.06471,0.5064757,-0.20498134,21.886612,550000
|
| 112 |
+
0.17149091,8.53102,-74.65598,-174.95244,-203.27145,0.33652544,-0.4112741,22.547543,555000
|
| 113 |
+
0.20834485,11.1471405,-70.893295,-177.02837,-203.62126,0.9492786,-0.96698165,27.572254,560000
|
| 114 |
+
0.19884428,11.309203,-83.26866,-177.8103,-203.28601,0.455847,-0.31816268,33.279278,565000
|
| 115 |
+
0.18764558,10.024457,-69.68084,-173.39456,-202.72337,0.51733017,-0.5346291,28.596342,570000
|
| 116 |
+
0.16744545,9.589742,-85.23643,-176.06775,-203.3087,0.2660019,-0.3060756,25.912086,575000
|
| 117 |
+
0.18209806,9.392828,-76.41639,-178.49825,-203.5883,0.31857222,-0.3911255,26.91999,580000
|
| 118 |
+
0.17296046,9.247537,-86.131256,-178.65056,-203.6136,0.3537409,-0.18543923,23.278214,585000
|
| 119 |
+
0.1416823,7.8934073,-95.29657,-177.11339,-203.49,0.35222116,-0.38819164,25.741001,590000
|
| 120 |
+
0.16364354,13.406894,-75.43007,-175.99773,-203.17441,0.3397001,-0.5786744,28.65539,595000
|
| 121 |
+
0.19178584,14.1234045,-31.915878,-175.85153,-203.19176,0.4741148,-0.51731896,36.26206,600000
|
| 122 |
+
0.18353903,12.300928,-61.678112,-176.16862,-203.03154,1.6873281,-1.6272165,35.79017,605000
|
| 123 |
+
0.16485739,9.501182,-64.53064,-177.29771,-203.47067,0.6109389,-0.50918585,34.42812,610000
|
| 124 |
+
0.1558181,10.551704,2.1070507,-173.24113,-202.4765,0.26961997,-0.2529044,27.71278,615000
|
| 125 |
+
0.1783495,11.571052,-52.795013,-173.42348,-202.57703,0.48861352,-0.4369563,33.280354,620000
|
| 126 |
+
0.21134442,11.379229,-71.5627,-175.6222,-203.82458,1.1612065,-1.3439969,39.483215,625000
|
| 127 |
+
0.21542525,7.13398,-63.363552,-178.78716,-203.1557,0.33497152,-0.33824283,22.09592,630000
|
| 128 |
+
0.1725318,17.185179,-41.065006,-173.8333,-204.2577,0.3358809,-0.5341474,45.43016,635000
|
| 129 |
+
0.19532631,7.030933,-104.3283,-179.71342,-203.3166,1.0401255,-0.9294013,28.228909,640000
|
| 130 |
+
0.19826803,11.443084,-75.819,-174.60677,-203.44028,0.47424817,-0.2710683,27.012983,645000
|
| 131 |
+
0.17010707,10.711202,-81.6013,-180.70232,-203.77034,0.20232691,-0.44657215,33.199886,650000
|
| 132 |
+
0.17809609,11.737411,-71.1387,-176.04173,-203.13628,0.22177032,-0.18313825,24.093052,655000
|
| 133 |
+
0.16658844,13.641986,-41.180046,-176.04175,-202.81815,0.5683535,-0.41895932,38.545662,660000
|
| 134 |
+
0.21062283,9.804014,-63.81216,-173.82945,-203.64883,0.39297634,-0.3766547,30.608707,665000
|
| 135 |
+
0.19701226,10.565572,-32.633976,-176.32886,-203.08926,0.48114738,-0.5161284,29.695581,670000
|
| 136 |
+
0.18618184,12.048018,-101.52612,-177.63301,-204.01222,0.21825413,-0.20717955,24.707483,675000
|
| 137 |
+
0.15344617,8.952672,-68.48101,-174.41043,-204.20752,0.26614317,-0.32660607,30.058659,680000
|
| 138 |
+
0.16749488,7.6905055,-54.37334,-177.97234,-204.19432,0.12781537,-0.21798995,17.578716,685000
|
| 139 |
+
0.1898359,7.172278,-56.811264,-178.77849,-203.7864,0.16589817,-0.23359782,20.58165,690000
|
| 140 |
+
0.19481382,5.8471913,-67.5818,-176.8985,-203.04558,0.1354344,-0.17261837,18.409264,695000
|
| 141 |
+
0.18433763,17.525358,-46.541264,-177.3024,-203.33763,0.4119636,-0.23354362,31.87931,700000
|
| 142 |
+
0.18537292,11.137821,-3.8852925,-175.04306,-204.07028,0.27921864,-0.6453871,33.27543,705000
|
| 143 |
+
0.16982934,16.07414,2.6440024,-175.33995,-202.89905,0.3665095,-0.32109278,33.182312,710000
|
| 144 |
+
0.19421667,8.458293,-61.890205,-178.1659,-203.44757,0.3206222,-0.3245213,27.014622,715000
|
| 145 |
+
0.21625805,18.186567,-71.338844,-175.5203,-203.261,0.62988615,-0.57491845,40.63931,720000
|
| 146 |
+
0.16456164,7.604412,-90.71314,-177.91924,-203.41147,2.2395306,-2.269694,34.51136,725000
|
| 147 |
+
0.19586705,6.4284067,-75.81182,-179.28764,-203.84978,0.42892164,-0.3542689,24.498144,730000
|
| 148 |
+
0.19537929,14.818248,-58.250824,-179.83868,-204.09189,0.68647844,-0.67601764,36.169067,735000
|
| 149 |
+
0.16433044,8.262046,-37.566708,-176.84988,-203.0474,0.6030815,-0.25808105,26.844566,740000
|
| 150 |
+
0.20389801,8.609985,-91.76918,-178.12039,-204.01172,0.58710957,-0.5150835,37.19711,745000
|
| 151 |
+
0.14932854,20.293379,-73.2633,-176.31505,-202.73451,1.0744755,-1.0807639,52.10396,750000
|
| 152 |
+
0.17994343,17.076424,-40.651516,-178.72737,-203.5938,0.5592246,-0.39011645,37.475193,755000
|
| 153 |
+
0.21013075,8.119754,-80.57041,-177.22203,-203.08658,0.42089373,-0.2555741,25.980528,760000
|
| 154 |
+
0.17699379,20.796125,0.6790317,-175.08955,-203.4231,0.60283697,-0.5392834,46.59005,765000
|
| 155 |
+
0.18541014,16.57103,-67.66742,-178.88283,-203.26283,0.35717332,-0.35141,26.898758,770000
|
| 156 |
+
0.17163801,14.091037,-42.3174,-176.30136,-203.35449,0.35948148,-0.28304803,28.172668,775000
|
| 157 |
+
0.19974089,14.091771,-70.957794,-178.5283,-203.5635,0.461352,-0.50068015,32.15514,780000
|
| 158 |
+
0.18929888,23.404638,-11.739143,-176.75821,-203.21808,0.47534198,-0.4313756,36.389008,785000
|
| 159 |
+
0.17992416,8.618688,-73.39999,-177.05228,-202.92485,0.2569378,-0.2422928,21.381367,790000
|
| 160 |
+
0.16669992,39.57182,-68.2278,-177.4837,-203.52676,0.8014647,-0.599663,57.07411,795000
|
| 161 |
+
0.22184645,6.4670024,-65.67699,-179.63953,-203.18764,0.21850312,-0.16734204,22.307976,800000
|
| 162 |
+
0.19708456,11.665452,-10.557921,-174.92647,-203.0007,0.59088016,-0.2598145,38.318413,805000
|
| 163 |
+
0.20474786,7.8969855,-6.743909,-175.99991,-202.85736,0.33975035,-0.34594113,26.696884,810000
|
| 164 |
+
0.16486734,9.897898,-72.33111,-178.27483,-203.59271,0.2507502,-0.22966091,21.816359,815000
|
| 165 |
+
0.17501412,11.130804,-59.756325,-178.62816,-203.05255,0.30275416,-0.20521145,22.527536,820000
|
| 166 |
+
0.17853147,7.4163704,-101.91772,-180.9396,-203.00537,0.7358666,-0.7350613,35.52002,825000
|
| 167 |
+
0.18389918,14.636246,-79.69357,-177.71266,-203.44832,0.6074297,-0.20698142,36.13571,830000
|
| 168 |
+
0.19573191,9.317721,-91.723236,-178.49702,-203.24501,0.17878549,-0.46021965,28.71059,835000
|
| 169 |
+
0.16223106,8.761571,-40.76166,-178.6514,-203.03497,1.5373362,-1.7807736,34.17866,840000
|
| 170 |
+
0.19353628,7.0670776,-91.712006,-177.45918,-203.32869,0.30027068,-0.28412616,18.533554,845000
|
| 171 |
+
0.18411365,11.303052,-22.235828,-176.19788,-202.74065,0.21807301,-0.23986627,24.295721,850000
|
| 172 |
+
0.17856139,9.591498,-33.208538,-176.52243,-202.96979,0.31685352,-0.32390782,26.777267,855000
|
| 173 |
+
0.18469197,6.256099,1.026981,-178.13535,-203.71577,0.32762295,-0.30785954,21.339245,860000
|
| 174 |
+
0.17590055,9.375567,-84.88081,-175.40466,-202.96619,0.34743083,-0.47419137,26.347094,865000
|
| 175 |
+
0.1620523,12.150607,-73.870735,-179.8535,-203.2777,0.29588714,-0.5470557,30.55983,870000
|
| 176 |
+
0.1800977,16.39172,-77.871735,-177.92972,-203.26929,0.48615974,-0.55690056,35.918037,875000
|
| 177 |
+
0.17042303,7.2322974,-95.204735,-180.7122,-204.11195,0.20124082,-0.59035957,32.701202,880000
|
| 178 |
+
0.19218528,14.248908,-81.78551,-179.69083,-203.28839,0.29612112,-0.24637285,26.612545,885000
|
| 179 |
+
0.18052623,11.284881,-57.685654,-178.52196,-203.61478,0.42033178,-0.6678503,41.05313,890000
|
| 180 |
+
0.17466336,14.608185,-62.374836,-177.8851,-203.37189,0.49522328,-0.6901214,33.864555,895000
|
| 181 |
+
0.18055347,22.719696,-91.20747,-176.98586,-203.26039,0.6601001,-0.6331504,43.723694,900000
|
| 182 |
+
0.18953308,18.114645,-22.640364,-175.14635,-203.12727,0.8940666,-0.814749,40.20027,905000
|
| 183 |
+
0.17470433,8.481158,-92.515434,-178.66023,-203.37123,0.5888612,-0.5107118,28.072943,910000
|
| 184 |
+
0.17402588,7.05832,-7.4578004,-176.56718,-203.70238,0.3681615,-0.22545142,26.853588,915000
|
| 185 |
+
0.21146473,7.44305,-76.826195,-177.66115,-203.12166,0.1536905,-0.27790952,21.435902,920000
|
| 186 |
+
0.19336364,8.784098,-97.72967,-178.37254,-203.16191,0.4060213,-0.28592318,29.733473,925000
|
| 187 |
+
0.18147945,7.573009,-83.0376,-180.97307,-203.48549,0.2837768,-0.2635515,19.305643,930000
|
| 188 |
+
0.17937857,11.017553,-3.5259583,-179.187,-203.15067,0.3436123,-0.35364234,30.372026,935000
|
| 189 |
+
0.18078054,10.327917,-73.78657,-176.72952,-203.3846,0.4664162,-0.49225008,26.690582,940000
|
| 190 |
+
0.17969218,7.220001,-74.313065,-175.75589,-202.9745,0.3364722,-0.35966638,24.738325,945000
|
| 191 |
+
0.19654562,16.844511,-43.34753,-173.44057,-203.01697,0.37875795,-0.36540884,33.914314,950000
|
| 192 |
+
0.16110492,14.329569,-79.73295,-177.09537,-202.91437,0.22135824,-0.33609667,26.710361,955000
|
| 193 |
+
0.20876661,15.805875,-64.01766,-176.03192,-203.21722,0.4924379,-0.5183765,32.49788,960000
|
| 194 |
+
0.1941939,14.070063,0.7983184,-178.95735,-203.14268,0.21343291,-0.47956648,34.02712,965000
|
| 195 |
+
0.1799463,18.940178,-3.91785,-177.89815,-203.48817,0.33064157,-0.33677244,30.144667,970000
|
| 196 |
+
0.16496721,7.598241,-58.31274,-178.66917,-203.1901,0.22558054,-0.25666,20.138487,975000
|
| 197 |
+
0.21446556,11.647531,-96.66001,-176.00443,-202.4876,0.5250865,-0.3577407,34.529663,980000
|
| 198 |
+
0.16609342,10.979478,-100.81739,-176.26205,-203.24489,0.5349783,-0.569991,44.990177,985000
|
| 199 |
+
0.17175654,6.5255694,-57.88425,-175.15457,-202.69514,0.4399467,-0.16720355,24.377169,990000
|
| 200 |
+
0.19219038,6.967776,-64.30135,-178.49791,-203.90947,0.28859782,-0.26273203,20.119186,995000
|
| 201 |
+
0.15500735,6.2614727,-67.7509,-178.0753,-203.52426,0.3378133,-0.3072808,19.489933,1000000
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.17085159,7.049066,-98.62268,-179.60777,-203.11652,0.37404484,-0.16007937,21.474182,1005000
|
| 3 |
+
0.1674996,10.488468,2.4964795,-174.81204,-202.84143,0.35853243,-0.35811862,23.793812,1010000
|
| 4 |
+
0.17929062,13.328577,1.9811965,-175.51746,-202.91972,0.4647814,-0.4076433,33.793674,1015000
|
| 5 |
+
0.18806346,8.9897585,-48.111897,-173.75041,-203.64546,0.38026544,-0.33368474,21.937578,1020000
|
| 6 |
+
0.2019521,8.458796,-3.6485577,-176.2535,-203.44928,0.28485933,-0.27029225,22.636356,1025000
|
| 7 |
+
0.16885883,20.599798,-6.8061886,-173.04837,-203.30188,0.5027918,-0.4696217,32.28173,1030000
|
| 8 |
+
0.19943741,15.522296,-39.20431,-172.05603,-204.29662,0.4934651,-0.62153727,46.992325,1035000
|
| 9 |
+
0.13795003,15.7675295,-54.08349,-173.64304,-204.15675,1.3723758,-1.3054451,41.306313,1040000
|
| 10 |
+
0.17240436,17.0584,-53.29777,-170.44566,-203.91562,1.4081193,-1.223259,51.920624,1045000
|
| 11 |
+
0.19355497,13.710713,3.4528742,-168.0985,-204.73875,1.1129904,-1.064931,38.382168,1050000
|
| 12 |
+
0.1589807,13.944994,-7.241106,-166.66808,-204.7057,0.46478295,-0.42065367,33.695065,1055000
|
| 13 |
+
0.17736647,15.521802,-24.714521,-162.07707,-203.95978,0.6083757,-0.70036125,39.59772,1060000
|
| 14 |
+
0.19334781,16.193682,2.3434896,-162.79588,-203.99742,0.36130404,-0.3429139,32.95153,1065000
|
| 15 |
+
0.1942471,15.904495,-13.391419,-159.79881,-203.49149,1.3141446,-0.475943,56.23722,1070000
|
| 16 |
+
0.20149288,11.752619,-55.57696,-161.91895,-203.86203,0.7162124,-0.48754835,37.40966,1075000
|
| 17 |
+
0.20833175,18.460068,-30.930662,-160.12256,-204.04475,1.060346,-1.0614203,71.926414,1080000
|
| 18 |
+
0.18795499,12.137467,-39.47185,-161.24632,-203.83986,0.7162008,-0.41444817,43.44589,1085000
|
| 19 |
+
0.1699501,18.17118,2.9841492,-160.6889,-205.00726,0.77985483,-0.7484192,51.79985,1090000
|
| 20 |
+
0.16853565,18.90743,-16.436184,-158.20338,-204.75342,0.5847015,-0.76732004,52.238716,1095000
|
| 21 |
+
0.17540412,16.746878,-17.701103,-155.41978,-203.99304,0.5345089,-0.53310907,37.89046,1100000
|
| 22 |
+
0.18603742,14.220888,-12.581635,-160.81572,-204.67928,0.8830935,-0.81120616,50.676468,1105000
|
| 23 |
+
0.14273325,19.407522,-38.712193,-151.11707,-203.9958,0.82738304,-0.7503944,58.22881,1110000
|
| 24 |
+
0.16257146,20.868301,-48.76262,-162.10588,-203.92148,0.93872213,-0.9203777,62.550972,1115000
|
| 25 |
+
0.17259376,21.578121,-29.482885,-157.66612,-205.58742,0.6178165,-0.5853679,45.594086,1120000
|
| 26 |
+
0.19412565,17.490479,0.9215142,-155.07759,-204.54848,0.5960144,-0.6216169,42.16543,1125000
|
| 27 |
+
0.15198582,20.7857,-11.790196,-154.4433,-204.58704,0.7796531,-1.195922,49.29669,1130000
|
| 28 |
+
0.19312522,17.213203,-9.775461,-150.70293,-203.89165,1.034475,-0.916951,57.87069,1135000
|
| 29 |
+
0.19745278,28.679358,-26.303251,-152.39061,-204.0561,0.71985567,-0.67050153,55.504715,1140000
|
| 30 |
+
0.1884682,20.802595,-24.155268,-149.91084,-204.15236,1.8560101,-1.8049226,61.42866,1145000
|
| 31 |
+
0.156563,10.343387,-18.532064,-150.26817,-204.27058,0.7220731,-0.90935105,41.87323,1150000
|
| 32 |
+
0.20646226,12.305564,-0.10874537,-152.47331,-204.34912,0.5359289,-0.3114549,41.995007,1155000
|
| 33 |
+
0.19667408,12.275653,-12.036504,-150.95354,-204.01682,0.2903188,-0.2906937,32.092262,1160000
|
| 34 |
+
0.20859885,20.689293,-18.72668,-147.03378,-204.25461,1.2401322,-1.200809,64.27071,1165000
|
| 35 |
+
0.14928228,15.406657,-22.287046,-150.78447,-203.4478,0.6404385,-1.2415981,66.596565,1170000
|
| 36 |
+
0.15776226,23.853958,-12.625277,-147.1321,-203.16731,0.9634579,-0.6510385,57.342834,1175000
|
| 37 |
+
0.19890618,16.446295,-6.346376,-145.1372,-204.91931,1.7139525,-1.5235136,78.74505,1180000
|
| 38 |
+
0.18074624,24.84938,-21.26873,-150.6147,-205.60849,1.9811676,-1.9042488,57.33509,1185000
|
| 39 |
+
0.16104245,20.156034,-21.227335,-149.78386,-204.71599,0.9085499,-0.8922582,61.979034,1190000
|
| 40 |
+
0.17609052,20.412703,-6.7767773,-148.91386,-204.87694,0.7356924,-0.54957175,49.357395,1195000
|
| 41 |
+
0.16623107,16.04174,2.8574297,-143.56032,-203.6013,1.1050996,-1.0979363,47.329712,1200000
|
| 42 |
+
0.15732834,17.493027,-4.724691,-148.3929,-204.20369,0.46382234,-0.50957984,42.175865,1205000
|
| 43 |
+
0.16920963,13.493955,-18.060785,-147.12386,-205.15291,1.5506321,-1.7456461,63.31932,1210000
|
| 44 |
+
0.20368403,21.178806,-7.568404,-143.76378,-204.1027,1.1936176,-0.94255304,61.000114,1215000
|
| 45 |
+
0.19328734,20.978933,-7.260867,-147.69951,-204.19029,1.7797039,-1.6481978,101.32681,1220000
|
| 46 |
+
0.1732368,25.62653,-12.183862,-139.5557,-203.63103,1.1369307,-0.8425873,55.45881,1225000
|
| 47 |
+
0.18826458,16.930517,-7.334058,-142.10152,-204.36394,0.7874187,-1.4805477,81.65501,1230000
|
| 48 |
+
0.2097635,15.200614,-8.966545,-143.9854,-203.01639,0.46038124,-0.86460716,46.81363,1235000
|
| 49 |
+
0.20075685,12.500431,1.7335777,-145.87201,-204.97809,0.45466506,-0.8156587,48.482708,1240000
|
| 50 |
+
0.16856696,15.302246,2.4408662,-144.41928,-202.96945,0.9846677,-0.9530217,49.500603,1245000
|
| 51 |
+
0.16692284,15.02489,-1.0679471,-142.32005,-203.5852,0.5271589,-0.48710543,40.49189,1250000
|
| 52 |
+
0.20121396,15.860654,3.158265,-143.9351,-203.6586,2.3829927,-2.5515509,87.65158,1255000
|
| 53 |
+
0.17514801,25.146868,-4.031881,-141.07271,-200.05165,3.6442034,-3.4508696,116.641014,1260000
|
| 54 |
+
0.16894248,13.118003,-7.768355,-143.81796,-204.92207,0.39634356,-0.4357768,37.03411,1265000
|
| 55 |
+
0.14479363,25.693373,-7.6264696,-139.18155,-203.76492,0.70583045,-0.7011504,54.953575,1270000
|
| 56 |
+
0.21877772,11.354787,-3.408588,-143.75542,-205.1413,0.73722243,-0.83112216,40.04397,1275000
|
| 57 |
+
0.19850266,19.94318,-1.649093,-134.01402,-204.02783,0.41649723,-0.8585996,54.553135,1280000
|
| 58 |
+
0.18868537,13.10483,-10.914517,-138.4415,-203.93376,1.1048626,-1.4491599,57.73112,1285000
|
| 59 |
+
0.1804268,17.593237,-10.496693,-137.81169,-203.46353,0.67144424,-1.3708477,63.42978,1290000
|
| 60 |
+
0.20180252,14.463702,-14.316689,-141.05052,-204.2304,1.8637507,-1.7851158,47.904785,1295000
|
| 61 |
+
0.18130608,13.141129,-3.307333,-143.0512,-203.34691,0.5100179,-0.50149673,37.31802,1300000
|
| 62 |
+
0.17048292,37.984398,-8.86422,-137.6168,-200.799,1.0498763,-1.3286752,66.99131,1305000
|
| 63 |
+
0.16556256,14.847821,1.1811603,-135.82796,-204.95856,0.68895435,-0.8519776,44.442238,1310000
|
| 64 |
+
0.1798667,22.779585,1.6487138,-137.19559,-202.79626,0.6118388,-0.77371633,54.43265,1315000
|
| 65 |
+
0.17433557,27.580328,-10.967104,-136.36287,-203.89284,1.1495152,-1.1917517,73.4247,1320000
|
| 66 |
+
0.17691365,16.941675,-2.3269894,-140.1233,-205.48308,0.87559384,-0.8285228,57.442947,1325000
|
| 67 |
+
0.19343072,11.861135,-2.3013113,-136.9041,-202.89417,0.4583947,-0.6226856,43.354362,1330000
|
| 68 |
+
0.20249288,13.071088,1.9506289,-136.47046,-204.40344,0.33541262,-0.4878722,39.360622,1335000
|
| 69 |
+
0.18850358,12.769602,-13.124337,-136.58597,-202.47374,0.61011547,-0.9946127,58.459206,1340000
|
| 70 |
+
0.17605399,13.55157,-2.0455666,-132.15645,-202.61984,1.1151556,-1.2088608,47.903152,1345000
|
| 71 |
+
0.16767037,10.501389,-5.7719383,-134.20764,-204.23828,0.38624504,-1.2439176,40.683212,1350000
|
| 72 |
+
0.19042969,28.32469,-0.14893296,-129.59402,-203.56296,0.73533744,-0.6991777,51.5915,1355000
|
| 73 |
+
0.17469698,16.15526,1.3339843,-132.25996,-203.94902,0.7096558,-1.7018589,59.27542,1360000
|
| 74 |
+
0.18538254,17.731644,-9.66579,-136.10173,-204.07454,0.56428957,-0.9988655,51.78803,1365000
|
| 75 |
+
0.18844831,15.362925,0.47621718,-128.76518,-204.59404,1.0618224,-0.99344647,49.08532,1370000
|
| 76 |
+
0.1794591,20.205626,0.16661945,-130.71834,-201.29388,1.1696436,-0.8315272,58.9606,1375000
|
| 77 |
+
0.12697402,10.8396635,2.0278559,-128.59256,-201.68924,0.41533506,-0.4643523,35.50453,1380000
|
| 78 |
+
0.151325,24.113157,2.0364635,-136.679,-202.78539,0.9430205,-0.53150773,55.581783,1385000
|
| 79 |
+
0.14865588,20.747189,-12.342482,-130.35217,-204.31876,1.6020198,-2.8733659,68.37834,1390000
|
| 80 |
+
0.16377372,16.719069,-13.024376,-141.69717,-204.80995,0.58462226,-0.70051664,38.499615,1395000
|
| 81 |
+
0.15362185,14.342982,-10.77254,-132.8339,-203.76857,1.1232117,-1.3091458,50.92109,1400000
|
| 82 |
+
0.14255631,23.298084,-2.6110864,-131.9984,-201.22778,0.97839725,-0.94807506,71.08616,1405000
|
| 83 |
+
0.16319996,16.015963,1.1884358,-132.31673,-199.025,0.64064264,-1.4083385,67.14556,1410000
|
| 84 |
+
0.16841525,14.607767,-4.9186826,-129.52168,-202.75894,0.48639596,-1.0512253,53.22072,1415000
|
| 85 |
+
0.16169569,11.904765,3.529375,-129.32794,-203.01837,1.4989306,-1.3704357,69.7836,1420000
|
| 86 |
+
0.17537245,16.360174,-7.3683214,-130.13708,-202.15602,1.2486445,-0.98621815,60.71525,1425000
|
| 87 |
+
0.16337493,15.565186,-0.8249185,-126.85329,-204.9971,0.61653715,-0.73681974,43.034607,1430000
|
| 88 |
+
0.16202167,15.171503,2.7392318,-128.93307,-203.9332,2.7573535,-2.474969,74.37117,1435000
|
| 89 |
+
0.17366575,28.590199,2.296834,-126.87339,-203.16504,1.4433006,-1.6516006,79.64732,1440000
|
| 90 |
+
0.16957931,23.11216,-1.7351726,-128.97374,-199.32388,1.5314946,-0.7808566,50.583405,1445000
|
| 91 |
+
0.16750786,19.202518,-4.3292975,-131.89249,-203.7521,2.4780293,-2.765104,74.13431,1450000
|
| 92 |
+
0.14985475,13.95267,2.7505097,-131.45328,-204.25922,0.34470397,-0.659181,42.90908,1455000
|
| 93 |
+
0.1538345,14.859418,-3.3211017,-126.18047,-202.1669,0.7330548,-0.78662544,47.13583,1460000
|
| 94 |
+
0.15844785,22.811132,-6.9626603,-130.325,-202.84769,4.128011,-3.766036,93.825195,1465000
|
| 95 |
+
0.13953684,19.281681,-1.8400195,-129.24727,-203.30783,0.6995609,-0.8351497,54.293823,1470000
|
| 96 |
+
0.15487185,18.433676,-1.6091748,-130.8004,-202.8574,0.70479965,-0.678793,50.16637,1475000
|
| 97 |
+
0.15267289,15.237981,-0.8261657,-129.98375,-200.70447,0.80038035,-1.3094321,66.11626,1480000
|
| 98 |
+
0.13351944,11.186969,-6.029231,-132.02634,-202.9213,0.8598913,-0.39677283,41.406918,1485000
|
| 99 |
+
0.14290078,22.839794,-1.4702399,-125.6324,-204.51616,0.61196357,-0.6889965,50.50095,1490000
|
| 100 |
+
0.16251379,29.46639,0.12553546,-124.888466,-203.94048,1.463575,-1.5300245,78.53082,1495000
|
| 101 |
+
0.17200536,23.92192,-6.1842484,-121.42336,-204.03441,7.291288,-5.438014,179.91748,1500000
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.17085159,7.049066,-98.62268,-179.60777,-203.11652,0.37404484,-0.16007937,21.474182,1005000
|
| 3 |
+
0.1674996,10.488468,2.4964795,-174.81204,-202.84143,0.35853243,-0.35811862,23.793812,1010000
|
| 4 |
+
0.17929062,13.328577,1.9811965,-175.51746,-202.91972,0.4647814,-0.4076433,33.793674,1015000
|
| 5 |
+
0.18806346,8.9897585,-48.111897,-173.75041,-203.64546,0.38026544,-0.33368474,21.937578,1020000
|
| 6 |
+
0.2019521,8.458796,-3.6485577,-176.2535,-203.44928,0.28485933,-0.27029225,22.636356,1025000
|
| 7 |
+
0.16885883,20.599798,-6.8061886,-173.04837,-203.30188,0.5027918,-0.4696217,32.28173,1030000
|
| 8 |
+
0.19943741,15.522296,-39.20431,-172.05603,-204.29662,0.4934651,-0.62153727,46.992325,1035000
|
| 9 |
+
0.13795003,15.7675295,-54.08349,-173.64304,-204.15675,1.3723758,-1.3054451,41.306313,1040000
|
| 10 |
+
0.17240436,17.0584,-53.29777,-170.44566,-203.91562,1.4081193,-1.223259,51.920624,1045000
|
| 11 |
+
0.19355497,13.710713,3.4528742,-168.0985,-204.73875,1.1129904,-1.064931,38.382168,1050000
|
| 12 |
+
0.1589807,13.944994,-7.241106,-166.66808,-204.7057,0.46478295,-0.42065367,33.695065,1055000
|
| 13 |
+
0.17736647,15.521802,-24.714521,-162.07707,-203.95978,0.6083757,-0.70036125,39.59772,1060000
|
| 14 |
+
0.19334781,16.193682,2.3434896,-162.79588,-203.99742,0.36130404,-0.3429139,32.95153,1065000
|
| 15 |
+
0.1942471,15.904495,-13.391419,-159.79881,-203.49149,1.3141446,-0.475943,56.23722,1070000
|
| 16 |
+
0.20149288,11.752619,-55.57696,-161.91895,-203.86203,0.7162124,-0.48754835,37.40966,1075000
|
| 17 |
+
0.20833175,18.460068,-30.930662,-160.12256,-204.04475,1.060346,-1.0614203,71.926414,1080000
|
| 18 |
+
0.18795499,12.137467,-39.47185,-161.24632,-203.83986,0.7162008,-0.41444817,43.44589,1085000
|
| 19 |
+
0.1699501,18.17118,2.9841492,-160.6889,-205.00726,0.77985483,-0.7484192,51.79985,1090000
|
| 20 |
+
0.16853565,18.90743,-16.436184,-158.20338,-204.75342,0.5847015,-0.76732004,52.238716,1095000
|
| 21 |
+
0.17540412,16.746878,-17.701103,-155.41978,-203.99304,0.5345089,-0.53310907,37.89046,1100000
|
| 22 |
+
0.18603742,14.220888,-12.581635,-160.81572,-204.67928,0.8830935,-0.81120616,50.676468,1105000
|
| 23 |
+
0.14273325,19.407522,-38.712193,-151.11707,-203.9958,0.82738304,-0.7503944,58.22881,1110000
|
| 24 |
+
0.16257146,20.868301,-48.76262,-162.10588,-203.92148,0.93872213,-0.9203777,62.550972,1115000
|
| 25 |
+
0.17259376,21.578121,-29.482885,-157.66612,-205.58742,0.6178165,-0.5853679,45.594086,1120000
|
| 26 |
+
0.19412565,17.490479,0.9215142,-155.07759,-204.54848,0.5960144,-0.6216169,42.16543,1125000
|
| 27 |
+
0.15198582,20.7857,-11.790196,-154.4433,-204.58704,0.7796531,-1.195922,49.29669,1130000
|
| 28 |
+
0.19312522,17.213203,-9.775461,-150.70293,-203.89165,1.034475,-0.916951,57.87069,1135000
|
| 29 |
+
0.19745278,28.679358,-26.303251,-152.39061,-204.0561,0.71985567,-0.67050153,55.504715,1140000
|
| 30 |
+
0.1884682,20.802595,-24.155268,-149.91084,-204.15236,1.8560101,-1.8049226,61.42866,1145000
|
| 31 |
+
0.156563,10.343387,-18.532064,-150.26817,-204.27058,0.7220731,-0.90935105,41.87323,1150000
|
| 32 |
+
0.20646226,12.305564,-0.10874537,-152.47331,-204.34912,0.5359289,-0.3114549,41.995007,1155000
|
| 33 |
+
0.19667408,12.275653,-12.036504,-150.95354,-204.01682,0.2903188,-0.2906937,32.092262,1160000
|
| 34 |
+
0.20859885,20.689293,-18.72668,-147.03378,-204.25461,1.2401322,-1.200809,64.27071,1165000
|
| 35 |
+
0.14928228,15.406657,-22.287046,-150.78447,-203.4478,0.6404385,-1.2415981,66.596565,1170000
|
| 36 |
+
0.15776226,23.853958,-12.625277,-147.1321,-203.16731,0.9634579,-0.6510385,57.342834,1175000
|
| 37 |
+
0.19890618,16.446295,-6.346376,-145.1372,-204.91931,1.7139525,-1.5235136,78.74505,1180000
|
| 38 |
+
0.18074624,24.84938,-21.26873,-150.6147,-205.60849,1.9811676,-1.9042488,57.33509,1185000
|
| 39 |
+
0.16104245,20.156034,-21.227335,-149.78386,-204.71599,0.9085499,-0.8922582,61.979034,1190000
|
| 40 |
+
0.17609052,20.412703,-6.7767773,-148.91386,-204.87694,0.7356924,-0.54957175,49.357395,1195000
|
| 41 |
+
0.16623107,16.04174,2.8574297,-143.56032,-203.6013,1.1050996,-1.0979363,47.329712,1200000
|
| 42 |
+
0.15732834,17.493027,-4.724691,-148.3929,-204.20369,0.46382234,-0.50957984,42.175865,1205000
|
| 43 |
+
0.16920963,13.493955,-18.060785,-147.12386,-205.15291,1.5506321,-1.7456461,63.31932,1210000
|
| 44 |
+
0.20368403,21.178806,-7.568404,-143.76378,-204.1027,1.1936176,-0.94255304,61.000114,1215000
|
| 45 |
+
0.19328734,20.978933,-7.260867,-147.69951,-204.19029,1.7797039,-1.6481978,101.32681,1220000
|
| 46 |
+
0.1732368,25.62653,-12.183862,-139.5557,-203.63103,1.1369307,-0.8425873,55.45881,1225000
|
| 47 |
+
0.18826458,16.930517,-7.334058,-142.10152,-204.36394,0.7874187,-1.4805477,81.65501,1230000
|
| 48 |
+
0.2097635,15.200614,-8.966545,-143.9854,-203.01639,0.46038124,-0.86460716,46.81363,1235000
|
| 49 |
+
0.20075685,12.500431,1.7335777,-145.87201,-204.97809,0.45466506,-0.8156587,48.482708,1240000
|
| 50 |
+
0.16856696,15.302246,2.4408662,-144.41928,-202.96945,0.9846677,-0.9530217,49.500603,1245000
|
| 51 |
+
0.16692284,15.02489,-1.0679471,-142.32005,-203.5852,0.5271589,-0.48710543,40.49189,1250000
|
| 52 |
+
0.20121396,15.860654,3.158265,-143.9351,-203.6586,2.3829927,-2.5515509,87.65158,1255000
|
| 53 |
+
0.17514801,25.146868,-4.031881,-141.07271,-200.05165,3.6442034,-3.4508696,116.641014,1260000
|
| 54 |
+
0.16894248,13.118003,-7.768355,-143.81796,-204.92207,0.39634356,-0.4357768,37.03411,1265000
|
| 55 |
+
0.14479363,25.693373,-7.6264696,-139.18155,-203.76492,0.70583045,-0.7011504,54.953575,1270000
|
| 56 |
+
0.21877772,11.354787,-3.408588,-143.75542,-205.1413,0.73722243,-0.83112216,40.04397,1275000
|
| 57 |
+
0.19850266,19.94318,-1.649093,-134.01402,-204.02783,0.41649723,-0.8585996,54.553135,1280000
|
| 58 |
+
0.18868537,13.10483,-10.914517,-138.4415,-203.93376,1.1048626,-1.4491599,57.73112,1285000
|
| 59 |
+
0.1804268,17.593237,-10.496693,-137.81169,-203.46353,0.67144424,-1.3708477,63.42978,1290000
|
| 60 |
+
0.20180252,14.463702,-14.316689,-141.05052,-204.2304,1.8637507,-1.7851158,47.904785,1295000
|
| 61 |
+
0.18130608,13.141129,-3.307333,-143.0512,-203.34691,0.5100179,-0.50149673,37.31802,1300000
|
| 62 |
+
0.17048292,37.984398,-8.86422,-137.6168,-200.799,1.0498763,-1.3286752,66.99131,1305000
|
| 63 |
+
0.16556256,14.847821,1.1811603,-135.82796,-204.95856,0.68895435,-0.8519776,44.442238,1310000
|
| 64 |
+
0.1798667,22.779585,1.6487138,-137.19559,-202.79626,0.6118388,-0.77371633,54.43265,1315000
|
| 65 |
+
0.17433557,27.580328,-10.967104,-136.36287,-203.89284,1.1495152,-1.1917517,73.4247,1320000
|
| 66 |
+
0.17691365,16.941675,-2.3269894,-140.1233,-205.48308,0.87559384,-0.8285228,57.442947,1325000
|
| 67 |
+
0.19343072,11.861135,-2.3013113,-136.9041,-202.89417,0.4583947,-0.6226856,43.354362,1330000
|
| 68 |
+
0.20249288,13.071088,1.9506289,-136.47046,-204.40344,0.33541262,-0.4878722,39.360622,1335000
|
| 69 |
+
0.18850358,12.769602,-13.124337,-136.58597,-202.47374,0.61011547,-0.9946127,58.459206,1340000
|
| 70 |
+
0.17605399,13.55157,-2.0455666,-132.15645,-202.61984,1.1151556,-1.2088608,47.903152,1345000
|
| 71 |
+
0.16767037,10.501389,-5.7719383,-134.20764,-204.23828,0.38624504,-1.2439176,40.683212,1350000
|
| 72 |
+
0.19042969,28.32469,-0.14893296,-129.59402,-203.56296,0.73533744,-0.6991777,51.5915,1355000
|
| 73 |
+
0.17469698,16.15526,1.3339843,-132.25996,-203.94902,0.7096558,-1.7018589,59.27542,1360000
|
| 74 |
+
0.18538254,17.731644,-9.66579,-136.10173,-204.07454,0.56428957,-0.9988655,51.78803,1365000
|
| 75 |
+
0.18844831,15.362925,0.47621718,-128.76518,-204.59404,1.0618224,-0.99344647,49.08532,1370000
|
| 76 |
+
0.1794591,20.205626,0.16661945,-130.71834,-201.29388,1.1696436,-0.8315272,58.9606,1375000
|
| 77 |
+
0.12697402,10.8396635,2.0278559,-128.59256,-201.68924,0.41533506,-0.4643523,35.50453,1380000
|
| 78 |
+
0.151325,24.113157,2.0364635,-136.679,-202.78539,0.9430205,-0.53150773,55.581783,1385000
|
| 79 |
+
0.14865588,20.747189,-12.342482,-130.35217,-204.31876,1.6020198,-2.8733659,68.37834,1390000
|
| 80 |
+
0.16377372,16.719069,-13.024376,-141.69717,-204.80995,0.58462226,-0.70051664,38.499615,1395000
|
| 81 |
+
0.15362185,14.342982,-10.77254,-132.8339,-203.76857,1.1232117,-1.3091458,50.92109,1400000
|
| 82 |
+
0.14255631,23.298084,-2.6110864,-131.9984,-201.22778,0.97839725,-0.94807506,71.08616,1405000
|
| 83 |
+
0.16319996,16.015963,1.1884358,-132.31673,-199.025,0.64064264,-1.4083385,67.14556,1410000
|
| 84 |
+
0.16841525,14.607767,-4.9186826,-129.52168,-202.75894,0.48639596,-1.0512253,53.22072,1415000
|
| 85 |
+
0.16169569,11.904765,3.529375,-129.32794,-203.01837,1.4989306,-1.3704357,69.7836,1420000
|
| 86 |
+
0.17537245,16.360174,-7.3683214,-130.13708,-202.15602,1.2486445,-0.98621815,60.71525,1425000
|
| 87 |
+
0.16337493,15.565186,-0.8249185,-126.85329,-204.9971,0.61653715,-0.73681974,43.034607,1430000
|
| 88 |
+
0.16202167,15.171503,2.7392318,-128.93307,-203.9332,2.7573535,-2.474969,74.37117,1435000
|
| 89 |
+
0.17366575,28.590199,2.296834,-126.87339,-203.16504,1.4433006,-1.6516006,79.64732,1440000
|
| 90 |
+
0.16957931,23.11216,-1.7351726,-128.97374,-199.32388,1.5314946,-0.7808566,50.583405,1445000
|
| 91 |
+
0.16750786,19.202518,-4.3292975,-131.89249,-203.7521,2.4780293,-2.765104,74.13431,1450000
|
| 92 |
+
0.14985475,13.95267,2.7505097,-131.45328,-204.25922,0.34470397,-0.659181,42.90908,1455000
|
| 93 |
+
0.1538345,14.859418,-3.3211017,-126.18047,-202.1669,0.7330548,-0.78662544,47.13583,1460000
|
| 94 |
+
0.15844785,22.811132,-6.9626603,-130.325,-202.84769,4.128011,-3.766036,93.825195,1465000
|
| 95 |
+
0.13953684,19.281681,-1.8400195,-129.24727,-203.30783,0.6995609,-0.8351497,54.293823,1470000
|
| 96 |
+
0.15487185,18.433676,-1.6091748,-130.8004,-202.8574,0.70479965,-0.678793,50.16637,1475000
|
| 97 |
+
0.15267289,15.237981,-0.8261657,-129.98375,-200.70447,0.80038035,-1.3094321,66.11626,1480000
|
| 98 |
+
0.13351944,11.186969,-6.029231,-132.02634,-202.9213,0.8598913,-0.39677283,41.406918,1485000
|
| 99 |
+
0.14290078,22.839794,-1.4702399,-125.6324,-204.51616,0.61196357,-0.6889965,50.50095,1490000
|
| 100 |
+
0.16251379,29.46639,0.12553546,-124.888466,-203.94048,1.463575,-1.5300245,78.53082,1495000
|
| 101 |
+
0.17200536,23.92192,-6.1842484,-121.42336,-204.03441,7.291288,-5.438014,179.91748,1500000
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c7ce8dee31b1d71c732693479060dbbe530c0a1975ad7a13de72a57b0f73b45
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e089e8d5d6ab0a64eaf4a3d7f5c2f16de8d1ae11dfc28cbeb3c2d5c074813aac
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e8e0ca6c2ccb32518e532bfb8a635f5f5b5d78c0bda3dd06ed1676d19bc17e4
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9ee032a3c761b2a30ba29d535192add2218edb3b30b67c99e79142d43f0b217
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:301957bc63837f91f14abc832983a856729e733c880c1c66597bab16ca257767
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7d3580cc855b74658625150565005138a3839abbe33f3f1796fecb165c059ab
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b8117cc000dccdd84bed81893805d25d67504d2300ad2cbaace723dc4f30d57
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0dbf4982232fa516b9a68f26a24f4c3b59dbe915e01ee193d2cfe78f3f8421bb
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:275eff927e0a97cb3b9f5a2df950ade898904a0e9da24eb375e6c9bf970f2036
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe3d7e7a5c4f0061aae0166c340a91694a58a1dc1407f22cb05e025d1eb098b2
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac8929e5bc24cac5275ec9c6cfd451c86e8642068cc5c9018e4d43eb519f04f0
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:942c7e83d64b5224cb71d7ff13aeca9e47ef190d7b51831eef5ca44fdfc6c06d
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_1500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f88298384c86045e5805074ed8e05a92d309d0224dc75905c03bb8d78f936e8a
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aec5db0d982dadb5e583815ae4d791abef756fe53ec8e48486f081ea8f0b5b8e
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa629857d74c1c3a135b3e4d5802713a493e4f49e05261d1f4c2e8e1e0d83722
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48d42f82fcf13da4d69555f83c128c893b5f54b825a7e2d7bc51776e9c478095
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2bd072662f619e2a1eb289f2ce4f6d116745a0344d90a965cbbdba248d979926
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7fea7a1d604c5658a3479f3171a1cf07f3051d31bb0eeecfedf59fca47ac58a9
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5a5d88b05710b049bdc36939b0a751d80d5645530664e8bdabc695e3d71f679c
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_50000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6add634985a76c5aaba3db95a0b39c80d5e76756f54ce78db2ad7d3405e3edd7
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e4b03ef94fdfe7330b191b921fa77b555f860ad8a1d4dfbca7265401269b69ec
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6678a39b803dd75091fe1142a13dbf17ab2d11a3862cbeeb5c47c83e9c83856e
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd3f9cc37f203fe2dd14dccfc6f870d84f92dafd1eb15bb9c861880fbbeb8f50
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04c506af5f780e1fa6238b10ca7b56f8b20decd14a35eb90b43aecd65e0635e4
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:553fdda291c60e723bf8f24c9d192d8f96f012922858545728290971faff66f2
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32812f360d818e89b624bf78684cfc45061e023c5ed1a4f0d27ba7e07b375597
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd87b1b5bdbb3c3384d078eb33b35ccd91848169faeff7c133d4bfe918a08bfc
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:826958b7c600f8ad36058b6e4a6fdc4dd1d1bd96c1a6e0b8dc33f23b0ef1a941
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9b6887d9270717f6b02787942b5b1986e8b77e6c7ec9ba9ffc3105f8836b677
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c551133b22f8d82b82f41d54c170b01fd596abaf700c52a34c76a6fef42c89d
|
| 3 |
+
size 218098304
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
pretrained_models/cube-double-play-singletask-task2-v0/20260307_005755/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-reproduce/runs/yiyqaamq
|