Upload folder using huggingface_hub
Browse files- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/env.csv +0 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/env_sv.csv +0 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/eval.csv +31 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/eval_sv.csv +31 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/flags.json +1 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/offline_agent.csv +201 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/offline_agent_sv.csv +201 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/online_agent.csv +101 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/online_agent_sv.csv +101 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_100000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1000000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1050000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1100000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1150000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1200000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1250000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1300000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1350000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1400000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1450000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_150000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1500000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_200000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_250000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_300000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_350000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_400000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_450000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_50000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_500000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_550000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_600000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_650000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_700000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_750000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_800000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_850000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_900000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_950000.pkl +3 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/progress.tk +1 -0
- pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/token.tk +1 -0
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/eval.csv
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.1150905461173951,0.0017332581988431862,-0.11525977145642079,-0.0035016474425275334,33.35099185560882,50.10000000001527,0.0,25500.0,-1.0,-1000.0,1000.0,3.363956694602966,50000
|
| 3 |
+
0.0,0.0,-0.09207808826767427,-0.005129119163859791,-0.09253720330579768,-0.0102226637262386,28.264558431047377,50.10000000001527,0.0,77500.0,-1.02,-1003.36,1000.0,3.230590343475342,100000
|
| 4 |
+
0.0,0.0,-0.019155536193033715,-0.002650661131894152,-0.019504153007297634,-0.00766855890989474,32.59219804708132,50.10000000001527,0.0,129500.0,-1.02,-1000.74,1000.0,3.247565517425537,150000
|
| 5 |
+
0.0,0.0,-0.04095050645198984,-0.00122734743982585,-0.04146219186163449,-0.0036566878424692324,26.23427771714386,45.14600000001308,0.14,179121.6,-0.86,-900.78,900.92,2.852505931854248,200000
|
| 6 |
+
0.0,0.0,-0.12228792759746884,0.003657858449844202,-0.12275305612953363,-0.013827999283810115,22.746438035283216,48.0910000000141,0.08,226753.7,-0.92,-959.74,959.82,3.037530903816223,250000
|
| 7 |
+
0.0,0.0,-0.08596742998674785,0.006155352914636916,-0.08757578881723536,-0.005664103574225158,15.471002039542014,45.812000000013,0.16,274882.12,-0.84,-914.08,914.24,2.866514835357666,300000
|
| 8 |
+
0.0,0.0,-0.05238838121855234,0.008125851849213293,-0.05152207213646412,0.005121166531145143,25.016341705972238,44.70000000001275,0.18,321404.66,-0.86,-894.92,892.0,2.821347403526306,350000
|
| 9 |
+
0.0,0.0,-0.10156817602366032,-0.008044486846356036,-0.10119867692809813,-0.0071137823666803926,18.90352976538614,47.957000000014176,0.08,368874.88,-0.96,-974.02,957.14,3.003897957801819,400000
|
| 10 |
+
0.0,0.0,-0.07328948354079629,-0.0014148379996071448,-0.07345127027168019,0.002423871434391755,21.67878288523265,42.04500000001128,0.28,415293.74,-0.74,-840.56,838.9,2.681168942451477,450000
|
| 11 |
+
0.0,0.0,-0.0566330520626763,0.0008418457574799202,-0.057227849067335475,-0.014368473588949033,23.724442396127934,47.78500000001378,0.1,462442.86,-0.96,-993.72,953.7,3.0723362398147582,500000
|
| 12 |
+
0.0,0.0,-0.050394227032701924,-0.007173543764443009,-0.050774888812752016,-0.012973092865398056,19.284545353536373,43.35900000001165,0.22,508433.4,-0.8,-866.5,865.18,2.724212646484375,550000
|
| 13 |
+
0.0,0.0,-0.04080110020701557,-0.003762690805564969,-0.04054470984594845,-0.004596081460810824,21.662286807733587,41.46100000001063,0.34,552251.02,-0.76,-861.44,827.22,2.624824910163879,600000
|
| 14 |
+
0.0,0.0,-0.09028670845782735,-0.03665665989238124,-0.09183229540769967,-0.0522397102474347,17.529308194766756,38.38500000000876,0.42,593474.02,-0.66,-811.84,765.7,2.425058584213257,650000
|
| 15 |
+
0.0,0.0,-0.08933747354955664,-0.005229280103001981,-0.08927924387251199,0.002165567376824456,21.513614440317863,42.89000000001138,0.24,635659.9,-0.82,-893.04,855.8,2.7013267993927004,700000
|
| 16 |
+
0.0,0.0,-0.07163820605747732,-0.0041346119442908485,-0.07139980402346117,-0.008418317418150833,22.55120162100841,41.033000000011235,0.28,678484.86,-0.82,-847.82,818.66,2.597715287208557,750000
|
| 17 |
+
0.0,0.0,-0.07690805445809536,0.002093383680451455,-0.07649956758049727,-0.00982718683330774,20.425536024469785,45.27300000001169,0.24,723372.12,-0.82,-932.06,903.46,2.8480923318862916,800000
|
| 18 |
+
0.0,0.0,-0.04795898204548137,-0.006752431597094888,-0.04860572272801348,-0.030386106188075312,18.085399859838013,37.85300000001002,0.42,766879.12,-0.64,-789.62,755.06,2.433527669906616,850000
|
| 19 |
+
0.0,0.0,-0.06097959996017969,0.008158214378813068,-0.06096825763978981,0.01342914410787015,19.247663445364545,44.18200000001249,0.18,808520.62,-0.9,-902.96,881.64,2.7669228458404542,900000
|
| 20 |
+
0.0,0.0,-0.035977383070990646,0.011207230199813314,-0.03598704485603086,0.002275883133601839,15.269092652008439,40.583000000008845,0.42,852759.08,-0.64,-839.88,809.66,2.573007435798645,950000
|
| 21 |
+
0.0,0.0,-0.05276310042573295,-0.013450407575611086,-0.05277279733239095,-0.024565568666282584,22.524568683833525,41.186000000010736,0.34,894310.4,-0.8,-878.68,821.72,2.602993674278259,1000000
|
| 22 |
+
0.0,0.0,-0.07604023399077965,-0.0050759802382629995,-0.07772801314316186,-0.06240807418965222,23.29491360333276,15.387000000002843,0.8,924113.36,-0.36,-401.78,305.74,1.0172606468200684,1050000
|
| 23 |
+
0.0,0.0,-0.06712930202272302,0.021379822493552733,-0.06748229118242666,-0.007250035820931209,32.91197046540232,6.832000000000896,0.94,935097.86,-0.16,-180.32,134.64,0.46257604122161866,1100000
|
| 24 |
+
0.0,0.0,-0.06569131311157016,0.0165230539418911,-0.064928200728191,-0.011606114398804695,33.898402068415784,4.3040000000001895,0.98,940506.42,-0.02,-83.1,84.08,0.3002503442764282,1150000
|
| 25 |
+
0.0,0.0,-0.05810919885652289,0.01647319069993257,-0.057623216424308885,-0.012366883386901015,33.59462930274752,3.707000000000229,0.98,944346.56,-0.02,-71.16,72.14,0.24848686218261717,1200000
|
| 26 |
+
0.0,0.0,-0.05187683989384394,0.012142347450763303,-0.05343634932087491,-0.009625093026489015,29.352441714064998,4.38400000000023,1.0,948920.34,0.0,-84.68,85.68,0.29190471172332766,1250000
|
| 27 |
+
0.0,0.0,-0.05845263525835673,-0.015787321781359304,-0.05831179395708067,-0.004395669221992609,32.7870256917953,4.99900000000051,0.96,953457.26,-0.04,-97.12,97.98,0.3349006175994873,1300000
|
| 28 |
+
0.0,0.0,-0.07633844886214254,0.05225933102091029,-0.07498272395005003,0.0288751467990397,34.77639455242667,3.486000000000219,0.98,957833.88,-0.04,-81.92,67.72,0.23003596305847168,1350000
|
| 29 |
+
0.0,0.0,-0.06229638892899094,0.03776810563686425,-0.06201304018544996,0.04240976892051883,32.63082948221167,3.906000000000227,0.98,961483.58,-0.04,-85.2,76.12,0.26792253494262697,1400000
|
| 30 |
+
0.0,0.0,-0.07729664695067288,0.07389546751262788,-0.07747437424677284,0.003638183355397764,31.471909436797837,2.48699999999992,1.0,964649.42,0.0,-46.74,47.74,0.17328372955322266,1450000
|
| 31 |
+
0.0,0.0,-0.04252113461462094,0.01733253208961123,-0.043159981443649915,-0.09586668462421997,30.675502801603393,3.2369999999998704,1.0,967531.44,0.0,-61.74,62.74,0.23621900081634523,1500000
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/eval_sv.csv
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.1150905461173951,0.0017332581988431862,-0.11525977145642079,-0.0035016474425275334,33.35099185560882,50.10000000001527,0.0,25500.0,-1.0,-1000.0,1000.0,3.363956694602966,50000
|
| 3 |
+
0.0,0.0,-0.09207808826767427,-0.005129119163859791,-0.09253720330579768,-0.0102226637262386,28.264558431047377,50.10000000001527,0.0,77500.0,-1.02,-1003.36,1000.0,3.230590343475342,100000
|
| 4 |
+
0.0,0.0,-0.019155536193033715,-0.002650661131894152,-0.019504153007297634,-0.00766855890989474,32.59219804708132,50.10000000001527,0.0,129500.0,-1.02,-1000.74,1000.0,3.247565517425537,150000
|
| 5 |
+
0.0,0.0,-0.04095050645198984,-0.00122734743982585,-0.04146219186163449,-0.0036566878424692324,26.23427771714386,45.14600000001308,0.14,179121.6,-0.86,-900.78,900.92,2.852505931854248,200000
|
| 6 |
+
0.0,0.0,-0.12228792759746884,0.003657858449844202,-0.12275305612953363,-0.013827999283810115,22.746438035283216,48.0910000000141,0.08,226753.7,-0.92,-959.74,959.82,3.037530903816223,250000
|
| 7 |
+
0.0,0.0,-0.08596742998674785,0.006155352914636916,-0.08757578881723536,-0.005664103574225158,15.471002039542014,45.812000000013,0.16,274882.12,-0.84,-914.08,914.24,2.866514835357666,300000
|
| 8 |
+
0.0,0.0,-0.05238838121855234,0.008125851849213293,-0.05152207213646412,0.005121166531145143,25.016341705972238,44.70000000001275,0.18,321404.66,-0.86,-894.92,892.0,2.821347403526306,350000
|
| 9 |
+
0.0,0.0,-0.10156817602366032,-0.008044486846356036,-0.10119867692809813,-0.0071137823666803926,18.90352976538614,47.957000000014176,0.08,368874.88,-0.96,-974.02,957.14,3.003897957801819,400000
|
| 10 |
+
0.0,0.0,-0.07328948354079629,-0.0014148379996071448,-0.07345127027168019,0.002423871434391755,21.67878288523265,42.04500000001128,0.28,415293.74,-0.74,-840.56,838.9,2.681168942451477,450000
|
| 11 |
+
0.0,0.0,-0.0566330520626763,0.0008418457574799202,-0.057227849067335475,-0.014368473588949033,23.724442396127934,47.78500000001378,0.1,462442.86,-0.96,-993.72,953.7,3.0723362398147582,500000
|
| 12 |
+
0.0,0.0,-0.050394227032701924,-0.007173543764443009,-0.050774888812752016,-0.012973092865398056,19.284545353536373,43.35900000001165,0.22,508433.4,-0.8,-866.5,865.18,2.724212646484375,550000
|
| 13 |
+
0.0,0.0,-0.04080110020701557,-0.003762690805564969,-0.04054470984594845,-0.004596081460810824,21.662286807733587,41.46100000001063,0.34,552251.02,-0.76,-861.44,827.22,2.624824910163879,600000
|
| 14 |
+
0.0,0.0,-0.09028670845782735,-0.03665665989238124,-0.09183229540769967,-0.0522397102474347,17.529308194766756,38.38500000000876,0.42,593474.02,-0.66,-811.84,765.7,2.425058584213257,650000
|
| 15 |
+
0.0,0.0,-0.08933747354955664,-0.005229280103001981,-0.08927924387251199,0.002165567376824456,21.513614440317863,42.89000000001138,0.24,635659.9,-0.82,-893.04,855.8,2.7013267993927004,700000
|
| 16 |
+
0.0,0.0,-0.07163820605747732,-0.0041346119442908485,-0.07139980402346117,-0.008418317418150833,22.55120162100841,41.033000000011235,0.28,678484.86,-0.82,-847.82,818.66,2.597715287208557,750000
|
| 17 |
+
0.0,0.0,-0.07690805445809536,0.002093383680451455,-0.07649956758049727,-0.00982718683330774,20.425536024469785,45.27300000001169,0.24,723372.12,-0.82,-932.06,903.46,2.8480923318862916,800000
|
| 18 |
+
0.0,0.0,-0.04795898204548137,-0.006752431597094888,-0.04860572272801348,-0.030386106188075312,18.085399859838013,37.85300000001002,0.42,766879.12,-0.64,-789.62,755.06,2.433527669906616,850000
|
| 19 |
+
0.0,0.0,-0.06097959996017969,0.008158214378813068,-0.06096825763978981,0.01342914410787015,19.247663445364545,44.18200000001249,0.18,808520.62,-0.9,-902.96,881.64,2.7669228458404542,900000
|
| 20 |
+
0.0,0.0,-0.035977383070990646,0.011207230199813314,-0.03598704485603086,0.002275883133601839,15.269092652008439,40.583000000008845,0.42,852759.08,-0.64,-839.88,809.66,2.573007435798645,950000
|
| 21 |
+
0.0,0.0,-0.05276310042573295,-0.013450407575611086,-0.05277279733239095,-0.024565568666282584,22.524568683833525,41.186000000010736,0.34,894310.4,-0.8,-878.68,821.72,2.602993674278259,1000000
|
| 22 |
+
0.0,0.0,-0.07604023399077965,-0.0050759802382629995,-0.07772801314316186,-0.06240807418965222,23.29491360333276,15.387000000002843,0.8,924113.36,-0.36,-401.78,305.74,1.0172606468200684,1050000
|
| 23 |
+
0.0,0.0,-0.06712930202272302,0.021379822493552733,-0.06748229118242666,-0.007250035820931209,32.91197046540232,6.832000000000896,0.94,935097.86,-0.16,-180.32,134.64,0.46257604122161866,1100000
|
| 24 |
+
0.0,0.0,-0.06569131311157016,0.0165230539418911,-0.064928200728191,-0.011606114398804695,33.898402068415784,4.3040000000001895,0.98,940506.42,-0.02,-83.1,84.08,0.3002503442764282,1150000
|
| 25 |
+
0.0,0.0,-0.05810919885652289,0.01647319069993257,-0.057623216424308885,-0.012366883386901015,33.59462930274752,3.707000000000229,0.98,944346.56,-0.02,-71.16,72.14,0.24848686218261717,1200000
|
| 26 |
+
0.0,0.0,-0.05187683989384394,0.012142347450763303,-0.05343634932087491,-0.009625093026489015,29.352441714064998,4.38400000000023,1.0,948920.34,0.0,-84.68,85.68,0.29190471172332766,1250000
|
| 27 |
+
0.0,0.0,-0.05845263525835673,-0.015787321781359304,-0.05831179395708067,-0.004395669221992609,32.7870256917953,4.99900000000051,0.96,953457.26,-0.04,-97.12,97.98,0.3349006175994873,1300000
|
| 28 |
+
0.0,0.0,-0.07633844886214254,0.05225933102091029,-0.07498272395005003,0.0288751467990397,34.77639455242667,3.486000000000219,0.98,957833.88,-0.04,-81.92,67.72,0.23003596305847168,1350000
|
| 29 |
+
0.0,0.0,-0.06229638892899094,0.03776810563686425,-0.06201304018544996,0.04240976892051883,32.63082948221167,3.906000000000227,0.98,961483.58,-0.04,-85.2,76.12,0.26792253494262697,1400000
|
| 30 |
+
0.0,0.0,-0.07729664695067288,0.07389546751262788,-0.07747437424677284,0.003638183355397764,31.471909436797837,2.48699999999992,1.0,964649.42,0.0,-46.74,47.74,0.17328372955322266,1450000
|
| 31 |
+
0.0,0.0,-0.04252113461462094,0.01733253208961123,-0.043159981443649915,-0.09586668462421997,30.675502801603393,3.2369999999998704,1.0,967531.44,0.0,-61.74,62.74,0.23621900081634523,1500000
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/flags.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"logtostderr": false, "alsologtostderr": false, "log_dir": "", "v": 0, "verbosity": 0, "logger_levels": {}, "stderrthreshold": "fatal", "showprefixforinfo": true, "run_with_pdb": false, "pdb_post_mortem": false, "pdb": false, "run_with_profiling": false, "profile_file": null, "use_cprofile_for_profiling": true, "only_check_args": false, "pymjcf_debug": false, "pymjcf_debug_full_dump_dir": "", "pymjcf_log_xml": false, "timeout": true, "chex_n_cpu_devices": 1, "chex_assert_multiple_cpu_devices": false, "test_srcdir": "", "test_tmpdir": "/tmp/absl_testing", "test_random_seed": 301, "test_randomize_ordering_seed": "", "xml_output_file": "", "chex_skip_pmap_variant_if_single_device": true, "run_group": "main-experiments", "project_name": "qam-reproduce", "tags": "CGQL", "seed": 10001, "env_name": "cube-triple-play-singletask-task1-v0", "save_dir": "exp/qam-reproduce/main-experiments/cube-triple-play-singletask-task1-v0/cgql/20260320_222926", "offline_steps": 1000000, "online_steps": 500000, "buffer_size": 1000000, "log_interval": 5000, "eval_interval": 50000, "save_interval": 50000, "start_training": 5000, "utd_ratio": 1, "eval_episodes": 50, "video_episodes": 2, "video_frame_skip": 3, "agent": {"action_chunking": true, "action_dim": 5, "actor_hidden_dims": [512, 512, 512, 512], "actor_layer_norm": false, "agent_name": "cgql", "batch_size": 256, "best_of_n": 1, "discount": 0.99, "flow_steps": 10, "guidance_coef": 0.1, "horizon_length": 5, "inv_temp": 10.0, "isd_clip": 5.0, "lr": 0.0003, "mode": "simple", "noisy_coef": 0.001, "num_qs": 10, "ob_dims": [46], "rho": 0.5, "separate": false, "target_guidance": true, "tau": 0.005, "value_hidden_dims": [512, 512, 512, 512], "value_layer_norm": true}, "dataset_proportion": 1.0, "dataset_replace_interval": 1000, "ogbench_dataset_dir": null, "horizon_length": 5, "sparse": false, "save_all_online_states": false, "save_last_checkpoint": false, "save_replay_buffer": false, "balanced_sampling": false, "load_checkpoint": null, "skip_offline": false, "?": false, "help": false, "helpshort": false, "helpfull": false, "helpxml": false}
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/offline_agent.csv
ADDED
|
@@ -0,0 +1,201 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.24325898,7.017555,-109.12517,-161.67207,-183.5833,0.5223896,-0.5426802,82.92198,5000
|
| 3 |
+
0.24309711,11.137981,-115.25632,-190.20998,-219.43323,1.3415776,-1.1019359,127.85433,10000
|
| 4 |
+
0.23193483,8.222114,-106.50411,-192.87218,-226.0044,0.79603666,-0.7832624,114.68792,15000
|
| 5 |
+
0.24423806,11.89311,-59.222534,-187.97014,-217.72539,1.229686,-1.059076,125.60008,20000
|
| 6 |
+
0.2270502,10.963061,-108.25993,-188.28935,-223.01773,0.8475939,-0.9913928,118.45982,25000
|
| 7 |
+
0.23865066,15.116897,-60.036892,-194.61612,-231.90553,1.6650697,-1.5810593,161.05621,30000
|
| 8 |
+
0.18994169,9.062964,-53.014015,-193.47351,-226.1311,0.9755887,-1.162626,95.98425,35000
|
| 9 |
+
0.21543318,10.859412,-96.19734,-198.17004,-227.34784,0.8334055,-0.83562034,85.810165,40000
|
| 10 |
+
0.20565015,10.169051,-110.71258,-195.36528,-235.72186,0.7420294,-1.405011,100.15561,45000
|
| 11 |
+
0.20866802,10.55096,-122.7884,-201.26668,-236.73409,1.1418632,-1.1855738,96.25952,50000
|
| 12 |
+
0.23502512,9.680705,-91.23475,-201.11002,-239.30173,1.2375011,-0.75394523,91.51051,55000
|
| 13 |
+
0.21682465,10.520166,-77.99898,-200.88579,-241.49048,1.1174315,-1.1288075,82.80963,60000
|
| 14 |
+
0.217331,9.636312,-91.32104,-199.97449,-237.29773,0.6367143,-0.8297311,97.36511,65000
|
| 15 |
+
0.23458764,10.855138,-102.34822,-198.68503,-234.6798,0.67657685,-0.88260365,64.06746,70000
|
| 16 |
+
0.19264534,8.612869,-119.090096,-199.39693,-236.42746,0.8217063,-0.8627314,61.3376,75000
|
| 17 |
+
0.17934628,12.264003,-80.45716,-203.89424,-240.08069,0.8542338,-0.7108364,90.94657,80000
|
| 18 |
+
0.24839014,10.456427,-121.606,-204.65868,-243.25772,0.93321323,-0.93653363,66.185074,85000
|
| 19 |
+
0.23367862,16.174637,-97.0018,-206.42574,-245.81404,0.6237538,-0.7301478,82.38522,90000
|
| 20 |
+
0.19317403,10.869563,-97.72989,-204.29704,-239.44537,0.6160474,-0.6855877,62.33123,95000
|
| 21 |
+
0.22190738,12.494547,-106.647125,-204.69379,-242.7235,0.8461203,-0.7719591,62.368942,100000
|
| 22 |
+
0.20102403,10.090884,-90.559784,-207.1464,-244.17776,0.98480386,-1.0229977,69.46083,105000
|
| 23 |
+
0.22013153,9.934352,-111.55354,-208.07817,-241.92213,0.86805594,-0.7933478,77.88745,110000
|
| 24 |
+
0.1896081,8.486223,-119.42618,-212.73648,-252.39891,0.5602897,-0.5460216,50.52272,115000
|
| 25 |
+
0.20738861,12.536552,-115.898575,-209.45268,-255.62413,0.7453166,-0.80782306,83.94879,120000
|
| 26 |
+
0.17958131,9.772927,-110.352646,-206.8791,-243.33815,0.78259194,-0.84675455,57.920086,125000
|
| 27 |
+
0.20106998,14.537668,-68.95818,-208.39758,-250.84967,0.85281235,-0.888683,69.845604,130000
|
| 28 |
+
0.19072446,10.486742,-26.899237,-209.59546,-245.19803,0.73230225,-0.5237191,63.611313,135000
|
| 29 |
+
0.19233897,11.9998255,-88.42256,-207.36221,-247.94872,1.2441866,-1.3173326,107.6684,140000
|
| 30 |
+
0.2232614,12.426371,-100.97441,-210.72781,-249.2856,0.7845001,-0.7712689,66.9604,145000
|
| 31 |
+
0.18259324,14.128043,-115.836365,-211.18872,-253.09843,0.72319835,-0.6886332,57.087864,150000
|
| 32 |
+
0.18302101,12.298577,-103.69111,-210.65283,-246.23196,1.5886822,-1.6267091,65.59183,155000
|
| 33 |
+
0.20435844,10.924269,-121.86593,-209.98344,-246.31464,0.90350914,-1.2010026,78.671295,160000
|
| 34 |
+
0.19592261,8.180892,-131.4103,-213.44017,-247.78575,0.8259285,-0.8314739,58.119804,165000
|
| 35 |
+
0.21349698,12.585328,-130.60228,-208.07825,-245.36366,1.9447525,-1.8987011,76.6189,170000
|
| 36 |
+
0.21937321,11.508255,-114.09234,-205.66304,-246.74066,1.4422414,-1.5289853,70.65051,175000
|
| 37 |
+
0.20401987,9.375186,-134.5402,-212.5426,-243.86224,0.8111396,-0.6194407,50.107643,180000
|
| 38 |
+
0.21568364,11.930223,-105.30943,-210.11194,-248.94296,1.1863698,-1.2330837,80.423065,185000
|
| 39 |
+
0.21040925,8.828392,-96.43391,-214.84036,-246.9545,0.78831196,-0.84097004,50.928032,190000
|
| 40 |
+
0.20937926,11.313224,-132.60277,-212.75023,-253.47061,0.6060192,-0.594582,49.653687,195000
|
| 41 |
+
0.2123,10.950229,-83.44838,-213.34813,-252.439,0.66567576,-0.7824282,71.21142,200000
|
| 42 |
+
0.17552222,13.9439,-124.131966,-210.08492,-250.26773,0.7862737,-0.7675098,62.75676,205000
|
| 43 |
+
0.2129391,12.223796,-142.1778,-215.3621,-252.41362,0.8987439,-0.91376543,44.64213,210000
|
| 44 |
+
0.16684604,8.658037,-69.34779,-217.66173,-257.30988,0.48819816,-0.44870943,46.42199,215000
|
| 45 |
+
0.18345071,10.6889925,-126.70411,-213.97652,-263.0215,1.6019961,-1.7851497,64.3559,220000
|
| 46 |
+
0.17608798,8.749019,-63.626377,-218.21309,-253.20285,0.54749537,-0.5763707,39.39507,225000
|
| 47 |
+
0.1924884,9.267941,-73.567024,-215.33891,-246.98697,0.5065804,-0.56920177,44.431835,230000
|
| 48 |
+
0.18366522,8.343997,-121.39432,-214.2636,-252.10756,0.54501534,-0.5279212,39.149216,235000
|
| 49 |
+
0.18038501,11.69823,-82.528145,-216.88956,-254.38332,1.0919555,-0.72722137,60.582943,240000
|
| 50 |
+
0.24299452,10.614183,-44.452374,-217.43687,-250.72284,0.70604664,-0.74064434,52.566055,245000
|
| 51 |
+
0.18131153,10.876448,-119.09774,-219.68057,-257.94907,0.5995469,-0.7754848,58.28669,250000
|
| 52 |
+
0.19184737,7.847667,-69.59219,-216.7609,-258.68073,0.57447875,-0.66324794,59.25494,255000
|
| 53 |
+
0.19137546,8.999483,-122.07385,-218.13536,-255.7637,0.43202296,-0.43755063,35.640373,260000
|
| 54 |
+
0.19129542,8.629927,-145.55666,-219.1403,-256.61823,0.5613166,-0.5701859,46.18283,265000
|
| 55 |
+
0.18863517,9.222793,-137.82785,-221.58008,-261.30618,0.74390775,-0.7850413,39.99446,270000
|
| 56 |
+
0.17603165,10.818348,-85.77474,-221.7539,-264.54868,0.48316684,-0.5369025,45.3577,275000
|
| 57 |
+
0.18849707,9.813098,-85.95253,-223.77596,-265.97083,0.8306801,-0.8107069,50.627434,280000
|
| 58 |
+
0.18542157,10.557172,-96.015884,-220.92326,-261.1595,0.46490195,-0.45048708,40.196384,285000
|
| 59 |
+
0.177789,11.78584,-100.00244,-217.38394,-254.4527,0.94028705,-0.7990995,50.494736,290000
|
| 60 |
+
0.17875469,9.564857,-94.627396,-217.7277,-248.17026,1.1053475,-0.9771136,48.720734,295000
|
| 61 |
+
0.17349303,11.290439,-81.160286,-215.03087,-255.36443,0.64406663,-0.49679452,43.722794,300000
|
| 62 |
+
0.20760816,8.954771,-133.66061,-221.29446,-255.12555,1.1536723,-1.0702682,61.46151,305000
|
| 63 |
+
0.17031148,6.509813,-121.83524,-224.45605,-270.90054,0.52390635,-0.5476158,37.72037,310000
|
| 64 |
+
0.15995647,7.7443466,-133.24051,-222.04532,-269.34393,0.5195124,-0.63994914,42.406845,315000
|
| 65 |
+
0.20128646,9.869791,-137.06,-224.03853,-270.16306,0.48179573,-0.45472285,39.899933,320000
|
| 66 |
+
0.17378825,10.460022,-129.28954,-222.38582,-260.09192,0.6620989,-0.6582066,45.430103,325000
|
| 67 |
+
0.20274295,8.045503,-78.912605,-220.74571,-260.6876,0.7949773,-1.229708,44.236843,330000
|
| 68 |
+
0.21162072,10.384791,-85.55662,-221.17839,-268.9658,1.1639274,-0.9255958,41.718792,335000
|
| 69 |
+
0.21664417,12.099829,-97.90212,-223.63785,-263.7763,1.0997578,-1.1878428,59.705124,340000
|
| 70 |
+
0.18911737,10.983801,-28.348175,-218.00325,-259.91354,0.5488235,-0.57483405,40.554855,345000
|
| 71 |
+
0.20746198,9.421626,-85.67809,-222.44762,-256.8107,0.82070166,-0.5596283,46.834404,350000
|
| 72 |
+
0.21253964,8.709662,-142.92935,-225.42813,-259.655,0.5093336,-0.5447057,36.304977,355000
|
| 73 |
+
0.1970149,8.940036,-145.89038,-223.6809,-266.35556,0.59132206,-0.69086677,45.783463,360000
|
| 74 |
+
0.18665138,13.245627,-103.80241,-225.36104,-268.45505,0.4563611,-0.45954767,42.05386,365000
|
| 75 |
+
0.20731583,10.483699,-25.79157,-219.61295,-275.26233,0.8572612,-0.52659035,55.233658,370000
|
| 76 |
+
0.21556264,6.436271,-146.00156,-221.81389,-269.58575,0.5294118,-0.5045508,32.40307,375000
|
| 77 |
+
0.16543494,8.065038,-149.31015,-224.98584,-274.99643,0.37389976,-0.37178624,35.50104,380000
|
| 78 |
+
0.18708861,9.001831,-120.911385,-221.81848,-260.81116,1.5899514,-1.3185315,53.140198,385000
|
| 79 |
+
0.18635437,8.361488,-134.08067,-220.82642,-269.22348,0.38364035,-0.7588964,40.447666,390000
|
| 80 |
+
0.17110753,7.0890107,-136.20544,-224.22087,-265.36804,0.59099835,-0.62317383,40.424797,395000
|
| 81 |
+
0.18757331,10.639949,-138.62471,-223.01485,-269.99084,0.4714576,-0.6064214,50.616257,400000
|
| 82 |
+
0.2153258,8.837515,-105.46776,-220.727,-262.0533,0.39696425,-0.38176492,35.35353,405000
|
| 83 |
+
0.18855412,9.797674,-95.64657,-224.26236,-264.48532,1.9060394,-1.85989,64.82523,410000
|
| 84 |
+
0.19134249,8.029215,-95.71258,-224.3214,-276.09726,0.66051257,-0.4155552,42.615273,415000
|
| 85 |
+
0.17641376,7.0505753,-135.77365,-225.07176,-265.17194,0.370742,-0.428988,32.94096,420000
|
| 86 |
+
0.19773039,8.7032,-147.41373,-223.71031,-261.383,1.2376026,-0.8021884,73.74869,425000
|
| 87 |
+
0.21370703,7.594227,-47.329586,-221.15376,-264.5845,0.83094156,-0.87059134,41.515503,430000
|
| 88 |
+
0.19133976,7.252487,-155.05484,-226.93452,-261.77856,0.59243906,-0.47483832,33.05211,435000
|
| 89 |
+
0.17948982,14.654563,-133.73792,-224.45543,-268.32736,0.39347696,-0.6224559,41.642796,440000
|
| 90 |
+
0.19125013,8.157847,-142.16702,-223.92296,-266.4873,0.7723674,-0.70609754,39.088478,445000
|
| 91 |
+
0.2232902,11.743143,-146.29251,-222.96696,-273.00507,1.0315077,-1.0029215,44.091846,450000
|
| 92 |
+
0.18496168,8.1211,-141.13182,-221.19168,-259.35913,0.48637378,-0.56090647,31.617126,455000
|
| 93 |
+
0.18054429,12.192431,-108.301155,-223.51006,-266.5478,0.45391345,-0.515421,39.91213,460000
|
| 94 |
+
0.1899041,6.9340777,-129.75134,-222.6501,-257.77658,0.4218084,-0.6966147,42.8825,465000
|
| 95 |
+
0.19152439,10.503478,-138.24829,-221.86353,-260.6047,0.26930496,-0.5447179,34.671146,470000
|
| 96 |
+
0.20220146,8.706514,-128.26442,-223.32286,-274.91855,0.60252506,-0.60986555,43.59659,475000
|
| 97 |
+
0.1980375,11.170917,-127.84079,-224.38902,-271.62115,0.45383766,-0.453467,35.06036,480000
|
| 98 |
+
0.19698101,7.2770157,-82.95686,-222.51541,-260.20944,0.5789488,-0.68310726,47.38767,485000
|
| 99 |
+
0.19181086,9.985528,-91.911575,-226.37903,-268.26028,0.66358113,-0.63143945,43.226364,490000
|
| 100 |
+
0.22114924,9.392632,-127.18844,-223.08818,-271.86105,1.0476048,-0.39805943,50.518024,495000
|
| 101 |
+
0.21165647,6.475226,-140.60423,-221.91402,-270.5393,0.4487086,-0.45368803,35.40246,500000
|
| 102 |
+
0.18871504,9.393735,-88.30915,-224.11601,-279.553,0.62903863,-0.47730222,37.00487,505000
|
| 103 |
+
0.19306187,8.371185,-132.88336,-225.61812,-271.063,0.69388676,-0.7710937,44.387794,510000
|
| 104 |
+
0.21670592,8.57823,-134.76846,-225.19469,-263.88513,0.32548252,-0.5506112,41.20398,515000
|
| 105 |
+
0.18652192,7.3441253,-89.07858,-225.06355,-270.63657,0.30267376,-0.23504317,25.811543,520000
|
| 106 |
+
0.19420078,7.5827193,-101.69572,-223.25443,-272.63113,0.84261817,-0.5405459,48.754375,525000
|
| 107 |
+
0.20938173,6.8994536,-137.3854,-227.90962,-273.9012,0.34064287,-0.7294614,39.8303,530000
|
| 108 |
+
0.18375121,10.297299,-109.46889,-224.10645,-266.92123,0.69976354,-0.71678406,39.54781,535000
|
| 109 |
+
0.21801499,8.717917,-135.96375,-221.58784,-272.41714,0.8412359,-0.8843283,42.67382,540000
|
| 110 |
+
0.19777583,10.568057,-108.32284,-222.0562,-260.0082,0.49949136,-0.48737818,34.07876,545000
|
| 111 |
+
0.1988022,6.7675395,-86.05472,-224.91069,-268.02405,0.45737785,-0.53184277,34.20371,550000
|
| 112 |
+
0.18494368,9.009641,-101.538155,-226.3557,-270.87018,0.8543689,-0.87509173,37.920944,555000
|
| 113 |
+
0.19617574,7.571411,-98.13916,-226.40532,-264.9922,0.9174158,-1.9567398,34.081055,560000
|
| 114 |
+
0.20479065,10.414572,-149.08844,-225.42369,-270.35297,0.5121785,-0.49935132,37.56713,565000
|
| 115 |
+
0.18595727,7.8543015,-75.434525,-219.67537,-265.42178,0.4064096,-0.23954478,29.057884,570000
|
| 116 |
+
0.18429811,10.222348,-133.69872,-221.14714,-269.21658,0.62863785,-0.45382878,40.243317,575000
|
| 117 |
+
0.19612488,8.2424135,-100.860176,-220.27676,-270.85162,0.5012764,-0.42081186,35.42012,580000
|
| 118 |
+
0.17459498,10.139825,-141.9491,-222.86792,-276.8165,0.75413024,-0.8116324,47.254517,585000
|
| 119 |
+
0.16493383,9.21237,-91.657616,-218.23503,-267.54843,0.36289263,-0.5222965,37.02716,590000
|
| 120 |
+
0.17981683,11.093732,-96.132065,-224.67683,-266.90628,1.0073074,-0.7572815,40.252483,595000
|
| 121 |
+
0.20316513,12.1910095,-21.34335,-223.14214,-269.72064,1.1249113,-0.80031985,72.3134,600000
|
| 122 |
+
0.17478275,7.24369,-88.55317,-223.55655,-268.99103,0.32619974,-0.543095,36.527523,605000
|
| 123 |
+
0.18148243,9.195104,-129.67819,-225.08049,-275.83224,0.85283786,-0.72849435,41.734688,610000
|
| 124 |
+
0.168679,8.99886,-118.54783,-220.53116,-278.78616,0.6200656,-0.6056398,39.14865,615000
|
| 125 |
+
0.17400078,11.344863,-93.89439,-224.11324,-269.75882,0.60050505,-0.6036082,39.398182,620000
|
| 126 |
+
0.2294418,11.6514,-92.15868,-224.66594,-268.82404,1.0909288,-1.1904296,50.323532,625000
|
| 127 |
+
0.2169151,9.266731,-153.65291,-225.80127,-268.78793,0.4468769,-0.50400484,35.57542,630000
|
| 128 |
+
0.1565733,8.2516575,-117.31006,-223.6744,-272.81848,0.58374673,-0.5518483,39.48991,635000
|
| 129 |
+
0.20076267,8.971086,-112.32319,-227.87358,-266.87497,0.4400183,-0.390167,36.302917,640000
|
| 130 |
+
0.21508467,14.62948,-136.5587,-228.76982,-264.43524,0.6894461,-0.3744797,44.800793,645000
|
| 131 |
+
0.1838127,7.50283,-83.79567,-224.71007,-265.31784,0.5705951,-0.5225973,38.28475,650000
|
| 132 |
+
0.19103631,7.583416,-94.61482,-225.45316,-275.71555,0.31267935,-0.3541201,27.764612,655000
|
| 133 |
+
0.17504475,9.427108,-138.02821,-227.53653,-283.93408,1.6417423,-1.5578947,47.919952,660000
|
| 134 |
+
0.2161694,8.115671,-141.10094,-229.9414,-285.96378,0.55179477,-0.55629075,33.17598,665000
|
| 135 |
+
0.20403698,9.656182,-95.51994,-229.38086,-271.29898,0.65549374,-0.5189972,42.263153,670000
|
| 136 |
+
0.18177745,9.292236,-90.40679,-226.58727,-269.69708,0.55239797,-0.44907504,34.659023,675000
|
| 137 |
+
0.16111134,8.65143,-121.679596,-228.45097,-278.96378,0.7907002,-0.37997344,36.972923,680000
|
| 138 |
+
0.17358276,7.046249,-35.116425,-229.5937,-277.05392,0.2331679,-0.4604817,26.777855,685000
|
| 139 |
+
0.19188951,11.2282505,-109.77075,-224.21495,-268.8573,0.7610639,-0.7359022,52.0673,690000
|
| 140 |
+
0.19894075,10.280133,-31.106678,-226.5999,-284.1012,0.49825338,-0.3621758,38.926083,695000
|
| 141 |
+
0.19896297,9.597862,-100.61624,-226.26904,-271.7387,0.37163842,-0.2694836,30.797306,700000
|
| 142 |
+
0.19444934,10.847662,-140.78282,-225.43745,-277.85944,0.8266653,-0.8906216,52.59403,705000
|
| 143 |
+
0.17782743,9.623694,-119.54394,-226.35674,-269.97275,0.6669158,-0.9700729,40.610146,710000
|
| 144 |
+
0.21849903,9.032274,-94.788605,-223.28287,-272.10043,0.39621896,-0.5434016,35.2443,715000
|
| 145 |
+
0.22061402,10.74,-125.670105,-224.19914,-286.19934,0.7126702,-0.5493498,57.07851,720000
|
| 146 |
+
0.16724047,7.6794963,-117.717514,-221.40904,-272.02383,0.44447643,-0.624906,35.096092,725000
|
| 147 |
+
0.2329676,8.556323,-89.72178,-223.83353,-267.69135,0.4370642,-0.8740181,43.01361,730000
|
| 148 |
+
0.19615787,10.887412,-138.5165,-227.40706,-278.80524,0.3255184,-0.7220768,44.253407,735000
|
| 149 |
+
0.1888012,11.453775,-40.08868,-222.57893,-274.00748,0.41549462,-0.39268717,41.404343,740000
|
| 150 |
+
0.19319555,9.885478,-119.27017,-230.6816,-276.14713,0.40669364,-0.41367015,30.747868,745000
|
| 151 |
+
0.17311779,8.696192,-59.505486,-223.03447,-286.34433,0.9038705,-0.9141234,35.8812,750000
|
| 152 |
+
0.19813532,7.7336564,-126.69419,-226.48018,-266.5561,0.37660274,-0.33071607,29.113705,755000
|
| 153 |
+
0.23468421,9.071628,-75.496376,-224.53772,-277.80255,0.5997172,-1.0037875,42.583954,760000
|
| 154 |
+
0.19767386,7.799709,-125.228035,-227.65894,-273.99063,0.34937412,-0.67791986,39.6354,765000
|
| 155 |
+
0.19291633,6.5609164,-136.36969,-230.13548,-276.67108,0.48165622,-1.1698291,50.957043,770000
|
| 156 |
+
0.17809331,7.702523,-139.4167,-229.1733,-268.60025,0.32733342,-0.42149115,30.844212,775000
|
| 157 |
+
0.20752445,10.405594,-121.7719,-226.35918,-290.90198,0.524115,-0.49220085,39.9299,780000
|
| 158 |
+
0.17501177,10.904696,-92.36949,-221.79741,-278.30716,0.30374885,-0.26569128,30.941772,785000
|
| 159 |
+
0.18744424,14.540384,-74.178085,-221.29814,-271.45984,1.0166034,-0.998841,48.352806,790000
|
| 160 |
+
0.17733587,7.492161,-125.63378,-228.42485,-268.96362,0.5475403,-0.5761718,31.096792,795000
|
| 161 |
+
0.20867383,11.89835,-90.26174,-227.23997,-271.60272,1.9541284,-1.717692,57.3745,800000
|
| 162 |
+
0.18740301,9.990746,-103.39948,-226.13628,-276.8292,0.83518994,-0.5721465,33.858685,805000
|
| 163 |
+
0.20947386,10.58474,-107.79226,-226.44678,-274.09552,0.3712277,-0.57068497,32.363914,810000
|
| 164 |
+
0.17096171,9.402325,-141.21037,-226.49107,-273.6703,0.52919656,-0.7695571,37.884056,815000
|
| 165 |
+
0.16540036,10.411382,-131.3544,-227.39441,-279.26462,0.43669182,-0.33087146,29.826534,820000
|
| 166 |
+
0.18904775,9.323943,-121.3605,-223.96382,-264.2425,0.7009486,-0.40640298,35.110474,825000
|
| 167 |
+
0.19714399,8.303637,-117.6213,-230.10547,-264.4179,0.86866146,-0.909717,36.391468,830000
|
| 168 |
+
0.21160164,8.253382,-108.30426,-227.62862,-271.84088,0.3931369,-0.36556408,29.622353,835000
|
| 169 |
+
0.1775654,9.1042,-102.2103,-227.38045,-271.8151,0.8948517,-0.3747908,44.346153,840000
|
| 170 |
+
0.1984653,13.836043,-100.38373,-226.76277,-274.94827,0.3876205,-0.87551725,57.770683,845000
|
| 171 |
+
0.18653502,8.243118,-116.4825,-229.10889,-276.9422,0.7142146,-0.5731575,40.47457,850000
|
| 172 |
+
0.19414899,12.737536,-134.00104,-226.51924,-276.81375,0.52956045,-0.47431448,44.138683,855000
|
| 173 |
+
0.18461457,10.184387,-116.39657,-225.54007,-274.71326,0.53022516,-0.5773188,30.598864,860000
|
| 174 |
+
0.18096104,9.764244,-66.956696,-226.59029,-277.1239,0.45172244,-1.4214164,32.083786,865000
|
| 175 |
+
0.17140329,8.712367,-92.12612,-227.66064,-267.28778,0.65265757,-0.8693854,38.052025,870000
|
| 176 |
+
0.19066578,8.114482,-136.19803,-224.90538,-276.69974,0.4512553,-0.35681626,30.061255,875000
|
| 177 |
+
0.17642874,7.3640227,-133.99574,-229.2733,-277.98892,0.34712577,-0.16333126,25.730167,880000
|
| 178 |
+
0.19968808,6.939809,-139.45076,-231.62617,-274.29993,0.78227377,-1.2403927,31.485561,885000
|
| 179 |
+
0.18233234,10.240705,-102.908554,-227.29419,-280.2525,0.74982935,-0.37430263,44.20501,890000
|
| 180 |
+
0.1698552,8.976834,-145.3998,-227.27676,-275.47656,0.54306155,-0.34778413,31.62155,895000
|
| 181 |
+
0.18611985,14.863828,-106.19202,-226.6276,-272.3756,0.5158535,-0.4109513,43.03401,900000
|
| 182 |
+
0.17940767,6.49167,-83.77408,-224.72684,-284.3204,0.31172213,-0.7483107,34.46302,905000
|
| 183 |
+
0.21478757,7.214084,-97.34151,-224.51228,-284.65002,0.47880208,-0.7023082,36.079475,910000
|
| 184 |
+
0.16630587,9.289879,-124.01,-227.47911,-278.69073,0.5291576,-0.47269848,36.55186,915000
|
| 185 |
+
0.21877095,9.032126,-92.150566,-226.95845,-278.83582,1.964602,-2.0883484,74.76618,920000
|
| 186 |
+
0.18201931,11.159148,-96.628395,-225.06754,-274.6884,0.9538006,-1.0065885,48.929047,925000
|
| 187 |
+
0.20856276,8.49721,-124.22844,-230.65889,-284.6981,0.46762717,-0.22974196,33.3072,930000
|
| 188 |
+
0.18941043,9.903111,-141.82817,-226.90196,-272.55447,0.2686409,-0.42914706,27.175652,935000
|
| 189 |
+
0.19411522,8.551196,-115.33685,-227.05396,-274.92462,0.37043363,-0.3679828,28.197903,940000
|
| 190 |
+
0.17884019,9.010976,-90.1071,-227.89537,-284.54013,0.4973458,-0.52582884,35.956287,945000
|
| 191 |
+
0.20958069,7.2079425,-23.206318,-225.75723,-278.4291,0.35829136,-0.6266109,35.03846,950000
|
| 192 |
+
0.15972322,9.332461,-93.534004,-224.3455,-276.80975,0.40133744,-0.9229709,49.751152,955000
|
| 193 |
+
0.2080281,7.2531877,-113.95447,-225.70413,-276.0446,0.42135027,-0.73497504,39.88163,960000
|
| 194 |
+
0.21611968,8.862021,-116.481926,-224.07693,-267.1555,0.2857663,-0.38976467,28.616877,965000
|
| 195 |
+
0.16629836,7.0802855,-92.645546,-226.16711,-270.36166,0.68181574,-0.6968141,30.512634,970000
|
| 196 |
+
0.18609503,11.284785,-86.95836,-225.87833,-274.2793,1.2041609,-0.6461122,63.00088,975000
|
| 197 |
+
0.1989667,7.5919456,-91.64723,-227.54564,-286.07416,0.24423553,-0.23214877,24.710339,980000
|
| 198 |
+
0.17626268,11.76385,-108.25279,-224.41722,-270.7033,0.60627455,-0.5671794,36.159607,985000
|
| 199 |
+
0.17281452,7.1844707,-125.36101,-225.73933,-277.8669,0.36925632,-0.8750354,34.798615,990000
|
| 200 |
+
0.19433829,9.297838,-131.26054,-224.91133,-271.51587,0.7169211,-0.61874425,42.987427,995000
|
| 201 |
+
0.16345108,6.7871184,-145.84499,-226.61491,-281.87613,0.53663653,-0.56871134,30.229021,1000000
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/offline_agent_sv.csv
ADDED
|
@@ -0,0 +1,201 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.24325898,7.017555,-109.12517,-161.67207,-183.5833,0.5223896,-0.5426802,82.92198,5000
|
| 3 |
+
0.24309711,11.137981,-115.25632,-190.20998,-219.43323,1.3415776,-1.1019359,127.85433,10000
|
| 4 |
+
0.23193483,8.222114,-106.50411,-192.87218,-226.0044,0.79603666,-0.7832624,114.68792,15000
|
| 5 |
+
0.24423806,11.89311,-59.222534,-187.97014,-217.72539,1.229686,-1.059076,125.60008,20000
|
| 6 |
+
0.2270502,10.963061,-108.25993,-188.28935,-223.01773,0.8475939,-0.9913928,118.45982,25000
|
| 7 |
+
0.23865066,15.116897,-60.036892,-194.61612,-231.90553,1.6650697,-1.5810593,161.05621,30000
|
| 8 |
+
0.18994169,9.062964,-53.014015,-193.47351,-226.1311,0.9755887,-1.162626,95.98425,35000
|
| 9 |
+
0.21543318,10.859412,-96.19734,-198.17004,-227.34784,0.8334055,-0.83562034,85.810165,40000
|
| 10 |
+
0.20565015,10.169051,-110.71258,-195.36528,-235.72186,0.7420294,-1.405011,100.15561,45000
|
| 11 |
+
0.20866802,10.55096,-122.7884,-201.26668,-236.73409,1.1418632,-1.1855738,96.25952,50000
|
| 12 |
+
0.23502512,9.680705,-91.23475,-201.11002,-239.30173,1.2375011,-0.75394523,91.51051,55000
|
| 13 |
+
0.21682465,10.520166,-77.99898,-200.88579,-241.49048,1.1174315,-1.1288075,82.80963,60000
|
| 14 |
+
0.217331,9.636312,-91.32104,-199.97449,-237.29773,0.6367143,-0.8297311,97.36511,65000
|
| 15 |
+
0.23458764,10.855138,-102.34822,-198.68503,-234.6798,0.67657685,-0.88260365,64.06746,70000
|
| 16 |
+
0.19264534,8.612869,-119.090096,-199.39693,-236.42746,0.8217063,-0.8627314,61.3376,75000
|
| 17 |
+
0.17934628,12.264003,-80.45716,-203.89424,-240.08069,0.8542338,-0.7108364,90.94657,80000
|
| 18 |
+
0.24839014,10.456427,-121.606,-204.65868,-243.25772,0.93321323,-0.93653363,66.185074,85000
|
| 19 |
+
0.23367862,16.174637,-97.0018,-206.42574,-245.81404,0.6237538,-0.7301478,82.38522,90000
|
| 20 |
+
0.19317403,10.869563,-97.72989,-204.29704,-239.44537,0.6160474,-0.6855877,62.33123,95000
|
| 21 |
+
0.22190738,12.494547,-106.647125,-204.69379,-242.7235,0.8461203,-0.7719591,62.368942,100000
|
| 22 |
+
0.20102403,10.090884,-90.559784,-207.1464,-244.17776,0.98480386,-1.0229977,69.46083,105000
|
| 23 |
+
0.22013153,9.934352,-111.55354,-208.07817,-241.92213,0.86805594,-0.7933478,77.88745,110000
|
| 24 |
+
0.1896081,8.486223,-119.42618,-212.73648,-252.39891,0.5602897,-0.5460216,50.52272,115000
|
| 25 |
+
0.20738861,12.536552,-115.898575,-209.45268,-255.62413,0.7453166,-0.80782306,83.94879,120000
|
| 26 |
+
0.17958131,9.772927,-110.352646,-206.8791,-243.33815,0.78259194,-0.84675455,57.920086,125000
|
| 27 |
+
0.20106998,14.537668,-68.95818,-208.39758,-250.84967,0.85281235,-0.888683,69.845604,130000
|
| 28 |
+
0.19072446,10.486742,-26.899237,-209.59546,-245.19803,0.73230225,-0.5237191,63.611313,135000
|
| 29 |
+
0.19233897,11.9998255,-88.42256,-207.36221,-247.94872,1.2441866,-1.3173326,107.6684,140000
|
| 30 |
+
0.2232614,12.426371,-100.97441,-210.72781,-249.2856,0.7845001,-0.7712689,66.9604,145000
|
| 31 |
+
0.18259324,14.128043,-115.836365,-211.18872,-253.09843,0.72319835,-0.6886332,57.087864,150000
|
| 32 |
+
0.18302101,12.298577,-103.69111,-210.65283,-246.23196,1.5886822,-1.6267091,65.59183,155000
|
| 33 |
+
0.20435844,10.924269,-121.86593,-209.98344,-246.31464,0.90350914,-1.2010026,78.671295,160000
|
| 34 |
+
0.19592261,8.180892,-131.4103,-213.44017,-247.78575,0.8259285,-0.8314739,58.119804,165000
|
| 35 |
+
0.21349698,12.585328,-130.60228,-208.07825,-245.36366,1.9447525,-1.8987011,76.6189,170000
|
| 36 |
+
0.21937321,11.508255,-114.09234,-205.66304,-246.74066,1.4422414,-1.5289853,70.65051,175000
|
| 37 |
+
0.20401987,9.375186,-134.5402,-212.5426,-243.86224,0.8111396,-0.6194407,50.107643,180000
|
| 38 |
+
0.21568364,11.930223,-105.30943,-210.11194,-248.94296,1.1863698,-1.2330837,80.423065,185000
|
| 39 |
+
0.21040925,8.828392,-96.43391,-214.84036,-246.9545,0.78831196,-0.84097004,50.928032,190000
|
| 40 |
+
0.20937926,11.313224,-132.60277,-212.75023,-253.47061,0.6060192,-0.594582,49.653687,195000
|
| 41 |
+
0.2123,10.950229,-83.44838,-213.34813,-252.439,0.66567576,-0.7824282,71.21142,200000
|
| 42 |
+
0.17552222,13.9439,-124.131966,-210.08492,-250.26773,0.7862737,-0.7675098,62.75676,205000
|
| 43 |
+
0.2129391,12.223796,-142.1778,-215.3621,-252.41362,0.8987439,-0.91376543,44.64213,210000
|
| 44 |
+
0.16684604,8.658037,-69.34779,-217.66173,-257.30988,0.48819816,-0.44870943,46.42199,215000
|
| 45 |
+
0.18345071,10.6889925,-126.70411,-213.97652,-263.0215,1.6019961,-1.7851497,64.3559,220000
|
| 46 |
+
0.17608798,8.749019,-63.626377,-218.21309,-253.20285,0.54749537,-0.5763707,39.39507,225000
|
| 47 |
+
0.1924884,9.267941,-73.567024,-215.33891,-246.98697,0.5065804,-0.56920177,44.431835,230000
|
| 48 |
+
0.18366522,8.343997,-121.39432,-214.2636,-252.10756,0.54501534,-0.5279212,39.149216,235000
|
| 49 |
+
0.18038501,11.69823,-82.528145,-216.88956,-254.38332,1.0919555,-0.72722137,60.582943,240000
|
| 50 |
+
0.24299452,10.614183,-44.452374,-217.43687,-250.72284,0.70604664,-0.74064434,52.566055,245000
|
| 51 |
+
0.18131153,10.876448,-119.09774,-219.68057,-257.94907,0.5995469,-0.7754848,58.28669,250000
|
| 52 |
+
0.19184737,7.847667,-69.59219,-216.7609,-258.68073,0.57447875,-0.66324794,59.25494,255000
|
| 53 |
+
0.19137546,8.999483,-122.07385,-218.13536,-255.7637,0.43202296,-0.43755063,35.640373,260000
|
| 54 |
+
0.19129542,8.629927,-145.55666,-219.1403,-256.61823,0.5613166,-0.5701859,46.18283,265000
|
| 55 |
+
0.18863517,9.222793,-137.82785,-221.58008,-261.30618,0.74390775,-0.7850413,39.99446,270000
|
| 56 |
+
0.17603165,10.818348,-85.77474,-221.7539,-264.54868,0.48316684,-0.5369025,45.3577,275000
|
| 57 |
+
0.18849707,9.813098,-85.95253,-223.77596,-265.97083,0.8306801,-0.8107069,50.627434,280000
|
| 58 |
+
0.18542157,10.557172,-96.015884,-220.92326,-261.1595,0.46490195,-0.45048708,40.196384,285000
|
| 59 |
+
0.177789,11.78584,-100.00244,-217.38394,-254.4527,0.94028705,-0.7990995,50.494736,290000
|
| 60 |
+
0.17875469,9.564857,-94.627396,-217.7277,-248.17026,1.1053475,-0.9771136,48.720734,295000
|
| 61 |
+
0.17349303,11.290439,-81.160286,-215.03087,-255.36443,0.64406663,-0.49679452,43.722794,300000
|
| 62 |
+
0.20760816,8.954771,-133.66061,-221.29446,-255.12555,1.1536723,-1.0702682,61.46151,305000
|
| 63 |
+
0.17031148,6.509813,-121.83524,-224.45605,-270.90054,0.52390635,-0.5476158,37.72037,310000
|
| 64 |
+
0.15995647,7.7443466,-133.24051,-222.04532,-269.34393,0.5195124,-0.63994914,42.406845,315000
|
| 65 |
+
0.20128646,9.869791,-137.06,-224.03853,-270.16306,0.48179573,-0.45472285,39.899933,320000
|
| 66 |
+
0.17378825,10.460022,-129.28954,-222.38582,-260.09192,0.6620989,-0.6582066,45.430103,325000
|
| 67 |
+
0.20274295,8.045503,-78.912605,-220.74571,-260.6876,0.7949773,-1.229708,44.236843,330000
|
| 68 |
+
0.21162072,10.384791,-85.55662,-221.17839,-268.9658,1.1639274,-0.9255958,41.718792,335000
|
| 69 |
+
0.21664417,12.099829,-97.90212,-223.63785,-263.7763,1.0997578,-1.1878428,59.705124,340000
|
| 70 |
+
0.18911737,10.983801,-28.348175,-218.00325,-259.91354,0.5488235,-0.57483405,40.554855,345000
|
| 71 |
+
0.20746198,9.421626,-85.67809,-222.44762,-256.8107,0.82070166,-0.5596283,46.834404,350000
|
| 72 |
+
0.21253964,8.709662,-142.92935,-225.42813,-259.655,0.5093336,-0.5447057,36.304977,355000
|
| 73 |
+
0.1970149,8.940036,-145.89038,-223.6809,-266.35556,0.59132206,-0.69086677,45.783463,360000
|
| 74 |
+
0.18665138,13.245627,-103.80241,-225.36104,-268.45505,0.4563611,-0.45954767,42.05386,365000
|
| 75 |
+
0.20731583,10.483699,-25.79157,-219.61295,-275.26233,0.8572612,-0.52659035,55.233658,370000
|
| 76 |
+
0.21556264,6.436271,-146.00156,-221.81389,-269.58575,0.5294118,-0.5045508,32.40307,375000
|
| 77 |
+
0.16543494,8.065038,-149.31015,-224.98584,-274.99643,0.37389976,-0.37178624,35.50104,380000
|
| 78 |
+
0.18708861,9.001831,-120.911385,-221.81848,-260.81116,1.5899514,-1.3185315,53.140198,385000
|
| 79 |
+
0.18635437,8.361488,-134.08067,-220.82642,-269.22348,0.38364035,-0.7588964,40.447666,390000
|
| 80 |
+
0.17110753,7.0890107,-136.20544,-224.22087,-265.36804,0.59099835,-0.62317383,40.424797,395000
|
| 81 |
+
0.18757331,10.639949,-138.62471,-223.01485,-269.99084,0.4714576,-0.6064214,50.616257,400000
|
| 82 |
+
0.2153258,8.837515,-105.46776,-220.727,-262.0533,0.39696425,-0.38176492,35.35353,405000
|
| 83 |
+
0.18855412,9.797674,-95.64657,-224.26236,-264.48532,1.9060394,-1.85989,64.82523,410000
|
| 84 |
+
0.19134249,8.029215,-95.71258,-224.3214,-276.09726,0.66051257,-0.4155552,42.615273,415000
|
| 85 |
+
0.17641376,7.0505753,-135.77365,-225.07176,-265.17194,0.370742,-0.428988,32.94096,420000
|
| 86 |
+
0.19773039,8.7032,-147.41373,-223.71031,-261.383,1.2376026,-0.8021884,73.74869,425000
|
| 87 |
+
0.21370703,7.594227,-47.329586,-221.15376,-264.5845,0.83094156,-0.87059134,41.515503,430000
|
| 88 |
+
0.19133976,7.252487,-155.05484,-226.93452,-261.77856,0.59243906,-0.47483832,33.05211,435000
|
| 89 |
+
0.17948982,14.654563,-133.73792,-224.45543,-268.32736,0.39347696,-0.6224559,41.642796,440000
|
| 90 |
+
0.19125013,8.157847,-142.16702,-223.92296,-266.4873,0.7723674,-0.70609754,39.088478,445000
|
| 91 |
+
0.2232902,11.743143,-146.29251,-222.96696,-273.00507,1.0315077,-1.0029215,44.091846,450000
|
| 92 |
+
0.18496168,8.1211,-141.13182,-221.19168,-259.35913,0.48637378,-0.56090647,31.617126,455000
|
| 93 |
+
0.18054429,12.192431,-108.301155,-223.51006,-266.5478,0.45391345,-0.515421,39.91213,460000
|
| 94 |
+
0.1899041,6.9340777,-129.75134,-222.6501,-257.77658,0.4218084,-0.6966147,42.8825,465000
|
| 95 |
+
0.19152439,10.503478,-138.24829,-221.86353,-260.6047,0.26930496,-0.5447179,34.671146,470000
|
| 96 |
+
0.20220146,8.706514,-128.26442,-223.32286,-274.91855,0.60252506,-0.60986555,43.59659,475000
|
| 97 |
+
0.1980375,11.170917,-127.84079,-224.38902,-271.62115,0.45383766,-0.453467,35.06036,480000
|
| 98 |
+
0.19698101,7.2770157,-82.95686,-222.51541,-260.20944,0.5789488,-0.68310726,47.38767,485000
|
| 99 |
+
0.19181086,9.985528,-91.911575,-226.37903,-268.26028,0.66358113,-0.63143945,43.226364,490000
|
| 100 |
+
0.22114924,9.392632,-127.18844,-223.08818,-271.86105,1.0476048,-0.39805943,50.518024,495000
|
| 101 |
+
0.21165647,6.475226,-140.60423,-221.91402,-270.5393,0.4487086,-0.45368803,35.40246,500000
|
| 102 |
+
0.18871504,9.393735,-88.30915,-224.11601,-279.553,0.62903863,-0.47730222,37.00487,505000
|
| 103 |
+
0.19306187,8.371185,-132.88336,-225.61812,-271.063,0.69388676,-0.7710937,44.387794,510000
|
| 104 |
+
0.21670592,8.57823,-134.76846,-225.19469,-263.88513,0.32548252,-0.5506112,41.20398,515000
|
| 105 |
+
0.18652192,7.3441253,-89.07858,-225.06355,-270.63657,0.30267376,-0.23504317,25.811543,520000
|
| 106 |
+
0.19420078,7.5827193,-101.69572,-223.25443,-272.63113,0.84261817,-0.5405459,48.754375,525000
|
| 107 |
+
0.20938173,6.8994536,-137.3854,-227.90962,-273.9012,0.34064287,-0.7294614,39.8303,530000
|
| 108 |
+
0.18375121,10.297299,-109.46889,-224.10645,-266.92123,0.69976354,-0.71678406,39.54781,535000
|
| 109 |
+
0.21801499,8.717917,-135.96375,-221.58784,-272.41714,0.8412359,-0.8843283,42.67382,540000
|
| 110 |
+
0.19777583,10.568057,-108.32284,-222.0562,-260.0082,0.49949136,-0.48737818,34.07876,545000
|
| 111 |
+
0.1988022,6.7675395,-86.05472,-224.91069,-268.02405,0.45737785,-0.53184277,34.20371,550000
|
| 112 |
+
0.18494368,9.009641,-101.538155,-226.3557,-270.87018,0.8543689,-0.87509173,37.920944,555000
|
| 113 |
+
0.19617574,7.571411,-98.13916,-226.40532,-264.9922,0.9174158,-1.9567398,34.081055,560000
|
| 114 |
+
0.20479065,10.414572,-149.08844,-225.42369,-270.35297,0.5121785,-0.49935132,37.56713,565000
|
| 115 |
+
0.18595727,7.8543015,-75.434525,-219.67537,-265.42178,0.4064096,-0.23954478,29.057884,570000
|
| 116 |
+
0.18429811,10.222348,-133.69872,-221.14714,-269.21658,0.62863785,-0.45382878,40.243317,575000
|
| 117 |
+
0.19612488,8.2424135,-100.860176,-220.27676,-270.85162,0.5012764,-0.42081186,35.42012,580000
|
| 118 |
+
0.17459498,10.139825,-141.9491,-222.86792,-276.8165,0.75413024,-0.8116324,47.254517,585000
|
| 119 |
+
0.16493383,9.21237,-91.657616,-218.23503,-267.54843,0.36289263,-0.5222965,37.02716,590000
|
| 120 |
+
0.17981683,11.093732,-96.132065,-224.67683,-266.90628,1.0073074,-0.7572815,40.252483,595000
|
| 121 |
+
0.20316513,12.1910095,-21.34335,-223.14214,-269.72064,1.1249113,-0.80031985,72.3134,600000
|
| 122 |
+
0.17478275,7.24369,-88.55317,-223.55655,-268.99103,0.32619974,-0.543095,36.527523,605000
|
| 123 |
+
0.18148243,9.195104,-129.67819,-225.08049,-275.83224,0.85283786,-0.72849435,41.734688,610000
|
| 124 |
+
0.168679,8.99886,-118.54783,-220.53116,-278.78616,0.6200656,-0.6056398,39.14865,615000
|
| 125 |
+
0.17400078,11.344863,-93.89439,-224.11324,-269.75882,0.60050505,-0.6036082,39.398182,620000
|
| 126 |
+
0.2294418,11.6514,-92.15868,-224.66594,-268.82404,1.0909288,-1.1904296,50.323532,625000
|
| 127 |
+
0.2169151,9.266731,-153.65291,-225.80127,-268.78793,0.4468769,-0.50400484,35.57542,630000
|
| 128 |
+
0.1565733,8.2516575,-117.31006,-223.6744,-272.81848,0.58374673,-0.5518483,39.48991,635000
|
| 129 |
+
0.20076267,8.971086,-112.32319,-227.87358,-266.87497,0.4400183,-0.390167,36.302917,640000
|
| 130 |
+
0.21508467,14.62948,-136.5587,-228.76982,-264.43524,0.6894461,-0.3744797,44.800793,645000
|
| 131 |
+
0.1838127,7.50283,-83.79567,-224.71007,-265.31784,0.5705951,-0.5225973,38.28475,650000
|
| 132 |
+
0.19103631,7.583416,-94.61482,-225.45316,-275.71555,0.31267935,-0.3541201,27.764612,655000
|
| 133 |
+
0.17504475,9.427108,-138.02821,-227.53653,-283.93408,1.6417423,-1.5578947,47.919952,660000
|
| 134 |
+
0.2161694,8.115671,-141.10094,-229.9414,-285.96378,0.55179477,-0.55629075,33.17598,665000
|
| 135 |
+
0.20403698,9.656182,-95.51994,-229.38086,-271.29898,0.65549374,-0.5189972,42.263153,670000
|
| 136 |
+
0.18177745,9.292236,-90.40679,-226.58727,-269.69708,0.55239797,-0.44907504,34.659023,675000
|
| 137 |
+
0.16111134,8.65143,-121.679596,-228.45097,-278.96378,0.7907002,-0.37997344,36.972923,680000
|
| 138 |
+
0.17358276,7.046249,-35.116425,-229.5937,-277.05392,0.2331679,-0.4604817,26.777855,685000
|
| 139 |
+
0.19188951,11.2282505,-109.77075,-224.21495,-268.8573,0.7610639,-0.7359022,52.0673,690000
|
| 140 |
+
0.19894075,10.280133,-31.106678,-226.5999,-284.1012,0.49825338,-0.3621758,38.926083,695000
|
| 141 |
+
0.19896297,9.597862,-100.61624,-226.26904,-271.7387,0.37163842,-0.2694836,30.797306,700000
|
| 142 |
+
0.19444934,10.847662,-140.78282,-225.43745,-277.85944,0.8266653,-0.8906216,52.59403,705000
|
| 143 |
+
0.17782743,9.623694,-119.54394,-226.35674,-269.97275,0.6669158,-0.9700729,40.610146,710000
|
| 144 |
+
0.21849903,9.032274,-94.788605,-223.28287,-272.10043,0.39621896,-0.5434016,35.2443,715000
|
| 145 |
+
0.22061402,10.74,-125.670105,-224.19914,-286.19934,0.7126702,-0.5493498,57.07851,720000
|
| 146 |
+
0.16724047,7.6794963,-117.717514,-221.40904,-272.02383,0.44447643,-0.624906,35.096092,725000
|
| 147 |
+
0.2329676,8.556323,-89.72178,-223.83353,-267.69135,0.4370642,-0.8740181,43.01361,730000
|
| 148 |
+
0.19615787,10.887412,-138.5165,-227.40706,-278.80524,0.3255184,-0.7220768,44.253407,735000
|
| 149 |
+
0.1888012,11.453775,-40.08868,-222.57893,-274.00748,0.41549462,-0.39268717,41.404343,740000
|
| 150 |
+
0.19319555,9.885478,-119.27017,-230.6816,-276.14713,0.40669364,-0.41367015,30.747868,745000
|
| 151 |
+
0.17311779,8.696192,-59.505486,-223.03447,-286.34433,0.9038705,-0.9141234,35.8812,750000
|
| 152 |
+
0.19813532,7.7336564,-126.69419,-226.48018,-266.5561,0.37660274,-0.33071607,29.113705,755000
|
| 153 |
+
0.23468421,9.071628,-75.496376,-224.53772,-277.80255,0.5997172,-1.0037875,42.583954,760000
|
| 154 |
+
0.19767386,7.799709,-125.228035,-227.65894,-273.99063,0.34937412,-0.67791986,39.6354,765000
|
| 155 |
+
0.19291633,6.5609164,-136.36969,-230.13548,-276.67108,0.48165622,-1.1698291,50.957043,770000
|
| 156 |
+
0.17809331,7.702523,-139.4167,-229.1733,-268.60025,0.32733342,-0.42149115,30.844212,775000
|
| 157 |
+
0.20752445,10.405594,-121.7719,-226.35918,-290.90198,0.524115,-0.49220085,39.9299,780000
|
| 158 |
+
0.17501177,10.904696,-92.36949,-221.79741,-278.30716,0.30374885,-0.26569128,30.941772,785000
|
| 159 |
+
0.18744424,14.540384,-74.178085,-221.29814,-271.45984,1.0166034,-0.998841,48.352806,790000
|
| 160 |
+
0.17733587,7.492161,-125.63378,-228.42485,-268.96362,0.5475403,-0.5761718,31.096792,795000
|
| 161 |
+
0.20867383,11.89835,-90.26174,-227.23997,-271.60272,1.9541284,-1.717692,57.3745,800000
|
| 162 |
+
0.18740301,9.990746,-103.39948,-226.13628,-276.8292,0.83518994,-0.5721465,33.858685,805000
|
| 163 |
+
0.20947386,10.58474,-107.79226,-226.44678,-274.09552,0.3712277,-0.57068497,32.363914,810000
|
| 164 |
+
0.17096171,9.402325,-141.21037,-226.49107,-273.6703,0.52919656,-0.7695571,37.884056,815000
|
| 165 |
+
0.16540036,10.411382,-131.3544,-227.39441,-279.26462,0.43669182,-0.33087146,29.826534,820000
|
| 166 |
+
0.18904775,9.323943,-121.3605,-223.96382,-264.2425,0.7009486,-0.40640298,35.110474,825000
|
| 167 |
+
0.19714399,8.303637,-117.6213,-230.10547,-264.4179,0.86866146,-0.909717,36.391468,830000
|
| 168 |
+
0.21160164,8.253382,-108.30426,-227.62862,-271.84088,0.3931369,-0.36556408,29.622353,835000
|
| 169 |
+
0.1775654,9.1042,-102.2103,-227.38045,-271.8151,0.8948517,-0.3747908,44.346153,840000
|
| 170 |
+
0.1984653,13.836043,-100.38373,-226.76277,-274.94827,0.3876205,-0.87551725,57.770683,845000
|
| 171 |
+
0.18653502,8.243118,-116.4825,-229.10889,-276.9422,0.7142146,-0.5731575,40.47457,850000
|
| 172 |
+
0.19414899,12.737536,-134.00104,-226.51924,-276.81375,0.52956045,-0.47431448,44.138683,855000
|
| 173 |
+
0.18461457,10.184387,-116.39657,-225.54007,-274.71326,0.53022516,-0.5773188,30.598864,860000
|
| 174 |
+
0.18096104,9.764244,-66.956696,-226.59029,-277.1239,0.45172244,-1.4214164,32.083786,865000
|
| 175 |
+
0.17140329,8.712367,-92.12612,-227.66064,-267.28778,0.65265757,-0.8693854,38.052025,870000
|
| 176 |
+
0.19066578,8.114482,-136.19803,-224.90538,-276.69974,0.4512553,-0.35681626,30.061255,875000
|
| 177 |
+
0.17642874,7.3640227,-133.99574,-229.2733,-277.98892,0.34712577,-0.16333126,25.730167,880000
|
| 178 |
+
0.19968808,6.939809,-139.45076,-231.62617,-274.29993,0.78227377,-1.2403927,31.485561,885000
|
| 179 |
+
0.18233234,10.240705,-102.908554,-227.29419,-280.2525,0.74982935,-0.37430263,44.20501,890000
|
| 180 |
+
0.1698552,8.976834,-145.3998,-227.27676,-275.47656,0.54306155,-0.34778413,31.62155,895000
|
| 181 |
+
0.18611985,14.863828,-106.19202,-226.6276,-272.3756,0.5158535,-0.4109513,43.03401,900000
|
| 182 |
+
0.17940767,6.49167,-83.77408,-224.72684,-284.3204,0.31172213,-0.7483107,34.46302,905000
|
| 183 |
+
0.21478757,7.214084,-97.34151,-224.51228,-284.65002,0.47880208,-0.7023082,36.079475,910000
|
| 184 |
+
0.16630587,9.289879,-124.01,-227.47911,-278.69073,0.5291576,-0.47269848,36.55186,915000
|
| 185 |
+
0.21877095,9.032126,-92.150566,-226.95845,-278.83582,1.964602,-2.0883484,74.76618,920000
|
| 186 |
+
0.18201931,11.159148,-96.628395,-225.06754,-274.6884,0.9538006,-1.0065885,48.929047,925000
|
| 187 |
+
0.20856276,8.49721,-124.22844,-230.65889,-284.6981,0.46762717,-0.22974196,33.3072,930000
|
| 188 |
+
0.18941043,9.903111,-141.82817,-226.90196,-272.55447,0.2686409,-0.42914706,27.175652,935000
|
| 189 |
+
0.19411522,8.551196,-115.33685,-227.05396,-274.92462,0.37043363,-0.3679828,28.197903,940000
|
| 190 |
+
0.17884019,9.010976,-90.1071,-227.89537,-284.54013,0.4973458,-0.52582884,35.956287,945000
|
| 191 |
+
0.20958069,7.2079425,-23.206318,-225.75723,-278.4291,0.35829136,-0.6266109,35.03846,950000
|
| 192 |
+
0.15972322,9.332461,-93.534004,-224.3455,-276.80975,0.40133744,-0.9229709,49.751152,955000
|
| 193 |
+
0.2080281,7.2531877,-113.95447,-225.70413,-276.0446,0.42135027,-0.73497504,39.88163,960000
|
| 194 |
+
0.21611968,8.862021,-116.481926,-224.07693,-267.1555,0.2857663,-0.38976467,28.616877,965000
|
| 195 |
+
0.16629836,7.0802855,-92.645546,-226.16711,-270.36166,0.68181574,-0.6968141,30.512634,970000
|
| 196 |
+
0.18609503,11.284785,-86.95836,-225.87833,-274.2793,1.2041609,-0.6461122,63.00088,975000
|
| 197 |
+
0.1989667,7.5919456,-91.64723,-227.54564,-286.07416,0.24423553,-0.23214877,24.710339,980000
|
| 198 |
+
0.17626268,11.76385,-108.25279,-224.41722,-270.7033,0.60627455,-0.5671794,36.159607,985000
|
| 199 |
+
0.17281452,7.1844707,-125.36101,-225.73933,-277.8669,0.36925632,-0.8750354,34.798615,990000
|
| 200 |
+
0.19433829,9.297838,-131.26054,-224.91133,-271.51587,0.7169211,-0.61874425,42.987427,995000
|
| 201 |
+
0.16345108,6.7871184,-145.84499,-226.61491,-281.87613,0.53663653,-0.56871134,30.229021,1000000
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.17641154,7.5946145,-120.17801,-224.99117,-268.54712,0.30012405,-0.70543826,32.469547,1005000
|
| 3 |
+
0.17108263,8.83628,0.11031416,-220.66075,-277.856,0.8510328,-0.8318027,47.785477,1010000
|
| 4 |
+
0.18847165,8.13786,-127.04139,-221.15984,-272.62463,0.50258434,-0.36886135,32.647186,1015000
|
| 5 |
+
0.1957767,11.318285,-86.35525,-218.60403,-266.688,0.4320312,-0.24759024,33.183205,1020000
|
| 6 |
+
0.2102532,7.2009544,-94.087944,-216.37285,-269.6049,0.27647257,-0.28100747,26.307169,1025000
|
| 7 |
+
0.17449436,9.83466,-79.63301,-208.93675,-275.55444,0.30738175,-0.48564398,31.598202,1030000
|
| 8 |
+
0.21002516,9.15256,-70.50587,-204.92766,-249.76045,0.83596516,-1.4369217,55.91915,1035000
|
| 9 |
+
0.15492174,9.087466,-75.72712,-205.04146,-269.11404,1.2374535,-0.9577376,71.05425,1040000
|
| 10 |
+
0.18939975,8.8498125,-28.952885,-205.66275,-264.94977,0.32368138,-0.7101069,41.31945,1045000
|
| 11 |
+
0.20001069,8.460469,-43.152042,-207.57596,-283.13434,0.40557435,-0.34153372,31.205643,1050000
|
| 12 |
+
0.18758318,8.805694,-64.20377,-202.43117,-255.93912,0.358871,-0.4162927,33.506004,1055000
|
| 13 |
+
0.1875247,12.926089,-119.06779,-201.50343,-254.38017,0.5455763,-0.5145859,35.221214,1060000
|
| 14 |
+
0.175014,8.222324,-67.2098,-201.38445,-266.56305,0.4879016,-1.1014341,50.593704,1065000
|
| 15 |
+
0.22117217,12.373928,-47.039364,-196.63187,-249.86473,0.65799904,-0.7607829,38.166817,1070000
|
| 16 |
+
0.198827,9.311478,-2.4566565,-197.80074,-257.23376,0.7842286,-0.736411,41.14575,1075000
|
| 17 |
+
0.21126404,9.076419,-55.761906,-196.28954,-255.1947,0.67360795,-0.2917546,34.890846,1080000
|
| 18 |
+
0.20780993,9.470188,-55.41355,-199.63522,-254.56822,0.4614075,-0.9674337,54.073914,1085000
|
| 19 |
+
0.18400851,12.8532915,-28.385773,-195.31339,-257.03195,0.5856026,-0.62440145,41.07467,1090000
|
| 20 |
+
0.18981025,9.324071,-52.07001,-196.59297,-245.57768,0.48122513,-0.93652666,52.202583,1095000
|
| 21 |
+
0.19418497,10.609046,-14.546445,-193.59108,-268.92163,0.5899004,-0.6470428,39.423386,1100000
|
| 22 |
+
0.22064626,10.001825,-31.46203,-194.62721,-255.48322,0.611187,-0.39074084,42.154675,1105000
|
| 23 |
+
0.17903528,10.737134,-25.511202,-194.8306,-256.31696,0.2978437,-0.5578294,34.77639,1110000
|
| 24 |
+
0.16135529,9.41653,-30.485613,-191.6872,-254.27911,0.51256216,-1.0854795,54.232437,1115000
|
| 25 |
+
0.20130756,10.866289,-39.10101,-188.7473,-255.73132,0.5261324,-0.6277548,45.557396,1120000
|
| 26 |
+
0.21888795,9.440025,-35.98727,-193.14334,-247.40454,0.570758,-0.58871454,31.156645,1125000
|
| 27 |
+
0.17022747,11.870994,-18.349812,-188.91946,-251.92065,0.41685647,-0.4074378,34.068485,1130000
|
| 28 |
+
0.22636583,8.940159,-35.923897,-193.88263,-264.76114,0.43632862,-0.48640552,35.01294,1135000
|
| 29 |
+
0.21342528,11.917285,-25.475704,-191.79655,-262.77542,0.5207551,-0.54779935,37.650543,1140000
|
| 30 |
+
0.21806338,12.160661,-28.906977,-189.9186,-278.23264,0.7270169,-0.72712445,49.1168,1145000
|
| 31 |
+
0.20447865,9.711627,-8.43451,-191.73404,-262.5492,0.27547452,-0.8169315,41.774956,1150000
|
| 32 |
+
0.22425078,13.620877,-33.88995,-190.20024,-271.82373,0.6672642,-0.45850623,41.625027,1155000
|
| 33 |
+
0.21443594,10.84769,-32.52242,-190.11012,-270.1509,0.77667373,-0.6693764,51.334732,1160000
|
| 34 |
+
0.23266104,11.0556555,-13.191838,-191.94041,-262.42926,0.7430417,-0.7136203,50.17201,1165000
|
| 35 |
+
0.19001515,13.573981,-28.939217,-192.16978,-262.73297,1.4216542,-1.5236458,58.040962,1170000
|
| 36 |
+
0.19601071,12.985232,-26.877115,-194.65552,-248.05025,0.8140967,-0.8868111,50.90271,1175000
|
| 37 |
+
0.22865888,11.468795,-25.034744,-192.64268,-259.01874,0.66583353,-0.5347033,40.09521,1180000
|
| 38 |
+
0.20230716,9.905368,-32.55633,-188.62708,-268.7074,0.49698597,-0.41100845,37.231014,1185000
|
| 39 |
+
0.20344199,13.350388,-23.88294,-188.31577,-265.5221,0.81112194,-0.57844484,55.824814,1190000
|
| 40 |
+
0.22816303,16.842457,-1.508288,-187.50085,-278.26562,1.1538868,-0.9834292,64.39255,1195000
|
| 41 |
+
0.22342986,13.10337,-11.563877,-184.27646,-267.80557,1.1621342,-0.61377424,52.374855,1200000
|
| 42 |
+
0.1931102,9.365575,-1.9293207,-192.65717,-281.02048,1.1825345,-0.89505297,41.844425,1205000
|
| 43 |
+
0.21620516,13.311258,-20.057066,-192.17918,-266.46063,1.4323814,-1.4629303,65.31708,1210000
|
| 44 |
+
0.26101896,11.742354,-18.685802,-195.10493,-266.99948,0.46913493,-0.3399288,37.475414,1215000
|
| 45 |
+
0.24964583,13.817766,-7.936205,-188.25452,-263.93085,0.7108058,-0.82284975,55.978294,1220000
|
| 46 |
+
0.23917542,12.314979,-17.8727,-193.52933,-258.8411,1.5183613,-1.6424334,82.47531,1225000
|
| 47 |
+
0.24317336,13.249534,-7.001824,-190.62083,-263.94223,1.1444368,-0.46522248,50.735657,1230000
|
| 48 |
+
0.24087578,14.810424,-8.034131,-196.20758,-284.49603,0.44637445,-0.7724868,48.344894,1235000
|
| 49 |
+
0.22935359,13.753139,-11.331305,-189.85292,-258.24835,0.6628854,-0.44189286,43.360943,1240000
|
| 50 |
+
0.2415805,10.200251,-3.8133092,-191.26387,-270.61804,0.74807096,-0.42800158,42.0495,1245000
|
| 51 |
+
0.21636876,11.602031,-26.725826,-196.7162,-271.1928,0.47861218,-0.47100085,36.236908,1250000
|
| 52 |
+
0.24244833,10.8655815,-8.399908,-193.03642,-259.04892,0.46816522,-1.039156,56.850163,1255000
|
| 53 |
+
0.21883783,10.75859,-23.610579,-198.90648,-270.63455,0.65935117,-1.3045833,59.0967,1260000
|
| 54 |
+
0.23647386,9.339427,-5.3744016,-193.25826,-274.33127,0.61248136,-0.86059093,37.57721,1265000
|
| 55 |
+
0.19826818,10.22262,-8.22785,-196.57051,-280.9164,0.65237266,-0.6111182,37.05746,1270000
|
| 56 |
+
0.28606963,9.598359,-15.935074,-194.13133,-277.9396,0.5546897,-0.25341564,35.74229,1275000
|
| 57 |
+
0.24983099,16.265524,-20.493973,-192.8078,-272.92612,0.8674211,-0.787508,57.484375,1280000
|
| 58 |
+
0.23695835,14.4374695,-13.883066,-195.53316,-274.46326,0.83648574,-0.80108976,48.34636,1285000
|
| 59 |
+
0.25238422,11.584067,-9.386669,-186.45598,-268.24982,0.93853664,-0.5129729,55.392517,1290000
|
| 60 |
+
0.25422657,10.808853,-7.108749,-190.37816,-268.98218,0.4971617,-0.42789742,36.371094,1295000
|
| 61 |
+
0.23352645,11.9139385,-16.97376,-192.64867,-265.7339,0.4802457,-0.6073313,45.250618,1300000
|
| 62 |
+
0.21767865,10.766815,-19.525555,-195.91898,-270.7354,0.39355648,-0.88897574,45.31778,1305000
|
| 63 |
+
0.24379069,11.936496,3.2267804,-190.29088,-265.94034,0.6116303,-0.6759949,42.45672,1310000
|
| 64 |
+
0.22777797,10.106383,-7.610672,-192.68497,-274.9888,0.7029643,-0.7749473,40.177727,1315000
|
| 65 |
+
0.26027665,8.180751,-14.385991,-195.60228,-280.96545,0.3907336,-0.75666845,36.846935,1320000
|
| 66 |
+
0.24436891,9.12056,-14.616453,-192.4605,-268.15488,1.2227967,-0.5683894,60.577698,1325000
|
| 67 |
+
0.25942415,8.516022,-12.632338,-199.93776,-272.96725,0.29435167,-0.38971493,30.15058,1330000
|
| 68 |
+
0.2671892,8.819183,-20.569115,-194.2994,-271.65555,0.4771307,-0.51707625,36.52675,1335000
|
| 69 |
+
0.23213795,10.335324,-11.491398,-192.17102,-273.50195,0.55781925,-1.1595256,69.90867,1340000
|
| 70 |
+
0.22192922,7.957231,-16.182964,-192.27118,-272.5012,0.32652953,-0.39671358,28.706429,1345000
|
| 71 |
+
0.22146574,11.004407,-21.130636,-199.97762,-262.1732,0.58884954,-0.4070018,36.750725,1350000
|
| 72 |
+
0.27328414,9.00992,-17.472116,-188.96947,-269.7279,0.35434392,-1.0338393,45.462807,1355000
|
| 73 |
+
0.24437794,10.478436,-10.695715,-185.0194,-266.00253,0.63557124,-0.5129966,39.60142,1360000
|
| 74 |
+
0.23845777,14.548264,-13.638675,-191.5136,-265.23517,1.1813959,-0.8218653,57.724705,1365000
|
| 75 |
+
0.25262588,9.764149,-13.616791,-188.89812,-262.9058,0.39417148,-0.42047247,31.86992,1370000
|
| 76 |
+
0.21184714,8.7479925,-28.073446,-191.81522,-266.60583,0.4306971,-0.74088013,45.32441,1375000
|
| 77 |
+
0.20919302,9.683517,-0.8559153,-186.1176,-255.40099,1.172804,-0.573103,45.141975,1380000
|
| 78 |
+
0.24435288,11.543363,-6.544501,-189.6722,-273.8431,0.6330962,-0.6020069,48.777515,1385000
|
| 79 |
+
0.19706942,8.9499655,-20.371147,-194.52164,-263.01498,1.1790451,-0.90334255,44.092247,1390000
|
| 80 |
+
0.23266658,10.627294,-16.690926,-187.94745,-278.14777,0.5992506,-0.72963905,44.76537,1395000
|
| 81 |
+
0.22419405,12.343512,-17.242397,-197.47012,-271.13956,0.48083997,-0.56642026,51.228653,1400000
|
| 82 |
+
0.24331047,11.661219,-12.13847,-191.99763,-264.88058,0.4241003,-0.5663066,35.080017,1405000
|
| 83 |
+
0.2512192,11.311072,-13.84771,-190.45712,-265.22156,0.93917817,-0.92257833,54.143845,1410000
|
| 84 |
+
0.25362408,8.963172,-4.72669,-193.48494,-266.90656,0.38383228,-0.62287474,36.969166,1415000
|
| 85 |
+
0.21700998,8.662157,1.0714853,-191.4438,-274.9121,0.47928438,-0.630871,33.38144,1420000
|
| 86 |
+
0.2758389,9.656287,-3.3898377,-188.90327,-255.45891,0.6619823,-0.3302242,42.54621,1425000
|
| 87 |
+
0.2428992,16.157738,-21.28596,-189.80566,-269.20493,0.9094971,-0.579096,56.767017,1430000
|
| 88 |
+
0.21942887,11.01208,-4.203007,-193.79825,-270.3181,0.7828794,-0.7979217,34.064922,1435000
|
| 89 |
+
0.24587595,11.213252,-11.430162,-192.60176,-264.63513,0.38771802,-0.64762616,43.15004,1440000
|
| 90 |
+
0.27423912,12.136374,-8.115661,-191.47589,-271.1193,0.54229206,-0.9866584,38.076633,1445000
|
| 91 |
+
0.23958582,9.553462,-18.47598,-192.99103,-271.12048,0.3430923,-0.79385877,32.05759,1450000
|
| 92 |
+
0.22990696,10.528193,-13.284005,-188.87198,-264.77682,0.5003336,-0.5318047,36.71735,1455000
|
| 93 |
+
0.22440268,10.825653,-3.9139593,-189.94035,-265.93942,0.551428,-0.6923291,41.733757,1460000
|
| 94 |
+
0.27402014,10.472144,-24.2836,-195.51634,-267.72,0.53314793,-0.33852136,36.063633,1465000
|
| 95 |
+
0.24322242,11.620148,-12.898092,-182.5301,-264.27307,0.88472927,-0.79860866,44.366905,1470000
|
| 96 |
+
0.2847603,13.691688,1.277263,-181.9376,-268.359,0.61894923,-0.59227276,43.186176,1475000
|
| 97 |
+
0.2511816,8.396324,-4.6050377,-190.503,-266.12732,0.7040199,-0.70167863,30.982805,1480000
|
| 98 |
+
0.2197691,13.815337,-8.22799,-188.94908,-275.9793,0.78842527,-0.8773894,52.688507,1485000
|
| 99 |
+
0.24080755,11.369249,-14.714853,-187.8853,-270.099,0.64440435,-0.59096867,46.194267,1490000
|
| 100 |
+
0.21790037,9.554146,-10.001682,-198.4161,-261.9535,0.39746523,-0.41802445,36.64697,1495000
|
| 101 |
+
0.27053493,7.5656357,-11.520069,-191.42996,-275.3674,0.26627624,-0.2947516,28.66011,1500000
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
0.17641154,7.5946145,-120.17801,-224.99117,-268.54712,0.30012405,-0.70543826,32.469547,1005000
|
| 3 |
+
0.17108263,8.83628,0.11031416,-220.66075,-277.856,0.8510328,-0.8318027,47.785477,1010000
|
| 4 |
+
0.18847165,8.13786,-127.04139,-221.15984,-272.62463,0.50258434,-0.36886135,32.647186,1015000
|
| 5 |
+
0.1957767,11.318285,-86.35525,-218.60403,-266.688,0.4320312,-0.24759024,33.183205,1020000
|
| 6 |
+
0.2102532,7.2009544,-94.087944,-216.37285,-269.6049,0.27647257,-0.28100747,26.307169,1025000
|
| 7 |
+
0.17449436,9.83466,-79.63301,-208.93675,-275.55444,0.30738175,-0.48564398,31.598202,1030000
|
| 8 |
+
0.21002516,9.15256,-70.50587,-204.92766,-249.76045,0.83596516,-1.4369217,55.91915,1035000
|
| 9 |
+
0.15492174,9.087466,-75.72712,-205.04146,-269.11404,1.2374535,-0.9577376,71.05425,1040000
|
| 10 |
+
0.18939975,8.8498125,-28.952885,-205.66275,-264.94977,0.32368138,-0.7101069,41.31945,1045000
|
| 11 |
+
0.20001069,8.460469,-43.152042,-207.57596,-283.13434,0.40557435,-0.34153372,31.205643,1050000
|
| 12 |
+
0.18758318,8.805694,-64.20377,-202.43117,-255.93912,0.358871,-0.4162927,33.506004,1055000
|
| 13 |
+
0.1875247,12.926089,-119.06779,-201.50343,-254.38017,0.5455763,-0.5145859,35.221214,1060000
|
| 14 |
+
0.175014,8.222324,-67.2098,-201.38445,-266.56305,0.4879016,-1.1014341,50.593704,1065000
|
| 15 |
+
0.22117217,12.373928,-47.039364,-196.63187,-249.86473,0.65799904,-0.7607829,38.166817,1070000
|
| 16 |
+
0.198827,9.311478,-2.4566565,-197.80074,-257.23376,0.7842286,-0.736411,41.14575,1075000
|
| 17 |
+
0.21126404,9.076419,-55.761906,-196.28954,-255.1947,0.67360795,-0.2917546,34.890846,1080000
|
| 18 |
+
0.20780993,9.470188,-55.41355,-199.63522,-254.56822,0.4614075,-0.9674337,54.073914,1085000
|
| 19 |
+
0.18400851,12.8532915,-28.385773,-195.31339,-257.03195,0.5856026,-0.62440145,41.07467,1090000
|
| 20 |
+
0.18981025,9.324071,-52.07001,-196.59297,-245.57768,0.48122513,-0.93652666,52.202583,1095000
|
| 21 |
+
0.19418497,10.609046,-14.546445,-193.59108,-268.92163,0.5899004,-0.6470428,39.423386,1100000
|
| 22 |
+
0.22064626,10.001825,-31.46203,-194.62721,-255.48322,0.611187,-0.39074084,42.154675,1105000
|
| 23 |
+
0.17903528,10.737134,-25.511202,-194.8306,-256.31696,0.2978437,-0.5578294,34.77639,1110000
|
| 24 |
+
0.16135529,9.41653,-30.485613,-191.6872,-254.27911,0.51256216,-1.0854795,54.232437,1115000
|
| 25 |
+
0.20130756,10.866289,-39.10101,-188.7473,-255.73132,0.5261324,-0.6277548,45.557396,1120000
|
| 26 |
+
0.21888795,9.440025,-35.98727,-193.14334,-247.40454,0.570758,-0.58871454,31.156645,1125000
|
| 27 |
+
0.17022747,11.870994,-18.349812,-188.91946,-251.92065,0.41685647,-0.4074378,34.068485,1130000
|
| 28 |
+
0.22636583,8.940159,-35.923897,-193.88263,-264.76114,0.43632862,-0.48640552,35.01294,1135000
|
| 29 |
+
0.21342528,11.917285,-25.475704,-191.79655,-262.77542,0.5207551,-0.54779935,37.650543,1140000
|
| 30 |
+
0.21806338,12.160661,-28.906977,-189.9186,-278.23264,0.7270169,-0.72712445,49.1168,1145000
|
| 31 |
+
0.20447865,9.711627,-8.43451,-191.73404,-262.5492,0.27547452,-0.8169315,41.774956,1150000
|
| 32 |
+
0.22425078,13.620877,-33.88995,-190.20024,-271.82373,0.6672642,-0.45850623,41.625027,1155000
|
| 33 |
+
0.21443594,10.84769,-32.52242,-190.11012,-270.1509,0.77667373,-0.6693764,51.334732,1160000
|
| 34 |
+
0.23266104,11.0556555,-13.191838,-191.94041,-262.42926,0.7430417,-0.7136203,50.17201,1165000
|
| 35 |
+
0.19001515,13.573981,-28.939217,-192.16978,-262.73297,1.4216542,-1.5236458,58.040962,1170000
|
| 36 |
+
0.19601071,12.985232,-26.877115,-194.65552,-248.05025,0.8140967,-0.8868111,50.90271,1175000
|
| 37 |
+
0.22865888,11.468795,-25.034744,-192.64268,-259.01874,0.66583353,-0.5347033,40.09521,1180000
|
| 38 |
+
0.20230716,9.905368,-32.55633,-188.62708,-268.7074,0.49698597,-0.41100845,37.231014,1185000
|
| 39 |
+
0.20344199,13.350388,-23.88294,-188.31577,-265.5221,0.81112194,-0.57844484,55.824814,1190000
|
| 40 |
+
0.22816303,16.842457,-1.508288,-187.50085,-278.26562,1.1538868,-0.9834292,64.39255,1195000
|
| 41 |
+
0.22342986,13.10337,-11.563877,-184.27646,-267.80557,1.1621342,-0.61377424,52.374855,1200000
|
| 42 |
+
0.1931102,9.365575,-1.9293207,-192.65717,-281.02048,1.1825345,-0.89505297,41.844425,1205000
|
| 43 |
+
0.21620516,13.311258,-20.057066,-192.17918,-266.46063,1.4323814,-1.4629303,65.31708,1210000
|
| 44 |
+
0.26101896,11.742354,-18.685802,-195.10493,-266.99948,0.46913493,-0.3399288,37.475414,1215000
|
| 45 |
+
0.24964583,13.817766,-7.936205,-188.25452,-263.93085,0.7108058,-0.82284975,55.978294,1220000
|
| 46 |
+
0.23917542,12.314979,-17.8727,-193.52933,-258.8411,1.5183613,-1.6424334,82.47531,1225000
|
| 47 |
+
0.24317336,13.249534,-7.001824,-190.62083,-263.94223,1.1444368,-0.46522248,50.735657,1230000
|
| 48 |
+
0.24087578,14.810424,-8.034131,-196.20758,-284.49603,0.44637445,-0.7724868,48.344894,1235000
|
| 49 |
+
0.22935359,13.753139,-11.331305,-189.85292,-258.24835,0.6628854,-0.44189286,43.360943,1240000
|
| 50 |
+
0.2415805,10.200251,-3.8133092,-191.26387,-270.61804,0.74807096,-0.42800158,42.0495,1245000
|
| 51 |
+
0.21636876,11.602031,-26.725826,-196.7162,-271.1928,0.47861218,-0.47100085,36.236908,1250000
|
| 52 |
+
0.24244833,10.8655815,-8.399908,-193.03642,-259.04892,0.46816522,-1.039156,56.850163,1255000
|
| 53 |
+
0.21883783,10.75859,-23.610579,-198.90648,-270.63455,0.65935117,-1.3045833,59.0967,1260000
|
| 54 |
+
0.23647386,9.339427,-5.3744016,-193.25826,-274.33127,0.61248136,-0.86059093,37.57721,1265000
|
| 55 |
+
0.19826818,10.22262,-8.22785,-196.57051,-280.9164,0.65237266,-0.6111182,37.05746,1270000
|
| 56 |
+
0.28606963,9.598359,-15.935074,-194.13133,-277.9396,0.5546897,-0.25341564,35.74229,1275000
|
| 57 |
+
0.24983099,16.265524,-20.493973,-192.8078,-272.92612,0.8674211,-0.787508,57.484375,1280000
|
| 58 |
+
0.23695835,14.4374695,-13.883066,-195.53316,-274.46326,0.83648574,-0.80108976,48.34636,1285000
|
| 59 |
+
0.25238422,11.584067,-9.386669,-186.45598,-268.24982,0.93853664,-0.5129729,55.392517,1290000
|
| 60 |
+
0.25422657,10.808853,-7.108749,-190.37816,-268.98218,0.4971617,-0.42789742,36.371094,1295000
|
| 61 |
+
0.23352645,11.9139385,-16.97376,-192.64867,-265.7339,0.4802457,-0.6073313,45.250618,1300000
|
| 62 |
+
0.21767865,10.766815,-19.525555,-195.91898,-270.7354,0.39355648,-0.88897574,45.31778,1305000
|
| 63 |
+
0.24379069,11.936496,3.2267804,-190.29088,-265.94034,0.6116303,-0.6759949,42.45672,1310000
|
| 64 |
+
0.22777797,10.106383,-7.610672,-192.68497,-274.9888,0.7029643,-0.7749473,40.177727,1315000
|
| 65 |
+
0.26027665,8.180751,-14.385991,-195.60228,-280.96545,0.3907336,-0.75666845,36.846935,1320000
|
| 66 |
+
0.24436891,9.12056,-14.616453,-192.4605,-268.15488,1.2227967,-0.5683894,60.577698,1325000
|
| 67 |
+
0.25942415,8.516022,-12.632338,-199.93776,-272.96725,0.29435167,-0.38971493,30.15058,1330000
|
| 68 |
+
0.2671892,8.819183,-20.569115,-194.2994,-271.65555,0.4771307,-0.51707625,36.52675,1335000
|
| 69 |
+
0.23213795,10.335324,-11.491398,-192.17102,-273.50195,0.55781925,-1.1595256,69.90867,1340000
|
| 70 |
+
0.22192922,7.957231,-16.182964,-192.27118,-272.5012,0.32652953,-0.39671358,28.706429,1345000
|
| 71 |
+
0.22146574,11.004407,-21.130636,-199.97762,-262.1732,0.58884954,-0.4070018,36.750725,1350000
|
| 72 |
+
0.27328414,9.00992,-17.472116,-188.96947,-269.7279,0.35434392,-1.0338393,45.462807,1355000
|
| 73 |
+
0.24437794,10.478436,-10.695715,-185.0194,-266.00253,0.63557124,-0.5129966,39.60142,1360000
|
| 74 |
+
0.23845777,14.548264,-13.638675,-191.5136,-265.23517,1.1813959,-0.8218653,57.724705,1365000
|
| 75 |
+
0.25262588,9.764149,-13.616791,-188.89812,-262.9058,0.39417148,-0.42047247,31.86992,1370000
|
| 76 |
+
0.21184714,8.7479925,-28.073446,-191.81522,-266.60583,0.4306971,-0.74088013,45.32441,1375000
|
| 77 |
+
0.20919302,9.683517,-0.8559153,-186.1176,-255.40099,1.172804,-0.573103,45.141975,1380000
|
| 78 |
+
0.24435288,11.543363,-6.544501,-189.6722,-273.8431,0.6330962,-0.6020069,48.777515,1385000
|
| 79 |
+
0.19706942,8.9499655,-20.371147,-194.52164,-263.01498,1.1790451,-0.90334255,44.092247,1390000
|
| 80 |
+
0.23266658,10.627294,-16.690926,-187.94745,-278.14777,0.5992506,-0.72963905,44.76537,1395000
|
| 81 |
+
0.22419405,12.343512,-17.242397,-197.47012,-271.13956,0.48083997,-0.56642026,51.228653,1400000
|
| 82 |
+
0.24331047,11.661219,-12.13847,-191.99763,-264.88058,0.4241003,-0.5663066,35.080017,1405000
|
| 83 |
+
0.2512192,11.311072,-13.84771,-190.45712,-265.22156,0.93917817,-0.92257833,54.143845,1410000
|
| 84 |
+
0.25362408,8.963172,-4.72669,-193.48494,-266.90656,0.38383228,-0.62287474,36.969166,1415000
|
| 85 |
+
0.21700998,8.662157,1.0714853,-191.4438,-274.9121,0.47928438,-0.630871,33.38144,1420000
|
| 86 |
+
0.2758389,9.656287,-3.3898377,-188.90327,-255.45891,0.6619823,-0.3302242,42.54621,1425000
|
| 87 |
+
0.2428992,16.157738,-21.28596,-189.80566,-269.20493,0.9094971,-0.579096,56.767017,1430000
|
| 88 |
+
0.21942887,11.01208,-4.203007,-193.79825,-270.3181,0.7828794,-0.7979217,34.064922,1435000
|
| 89 |
+
0.24587595,11.213252,-11.430162,-192.60176,-264.63513,0.38771802,-0.64762616,43.15004,1440000
|
| 90 |
+
0.27423912,12.136374,-8.115661,-191.47589,-271.1193,0.54229206,-0.9866584,38.076633,1445000
|
| 91 |
+
0.23958582,9.553462,-18.47598,-192.99103,-271.12048,0.3430923,-0.79385877,32.05759,1450000
|
| 92 |
+
0.22990696,10.528193,-13.284005,-188.87198,-264.77682,0.5003336,-0.5318047,36.71735,1455000
|
| 93 |
+
0.22440268,10.825653,-3.9139593,-189.94035,-265.93942,0.551428,-0.6923291,41.733757,1460000
|
| 94 |
+
0.27402014,10.472144,-24.2836,-195.51634,-267.72,0.53314793,-0.33852136,36.063633,1465000
|
| 95 |
+
0.24322242,11.620148,-12.898092,-182.5301,-264.27307,0.88472927,-0.79860866,44.366905,1470000
|
| 96 |
+
0.2847603,13.691688,1.277263,-181.9376,-268.359,0.61894923,-0.59227276,43.186176,1475000
|
| 97 |
+
0.2511816,8.396324,-4.6050377,-190.503,-266.12732,0.7040199,-0.70167863,30.982805,1480000
|
| 98 |
+
0.2197691,13.815337,-8.22799,-188.94908,-275.9793,0.78842527,-0.8773894,52.688507,1485000
|
| 99 |
+
0.24080755,11.369249,-14.714853,-187.8853,-270.099,0.64440435,-0.59096867,46.194267,1490000
|
| 100 |
+
0.21790037,9.554146,-10.001682,-198.4161,-261.9535,0.39746523,-0.41802445,36.64697,1495000
|
| 101 |
+
0.27053493,7.5656357,-11.520069,-191.42996,-275.3674,0.26627624,-0.2947516,28.66011,1500000
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d296bd9afc88a03ea17ece147ef8cdb6ad9ea26a0136e6c128d23e58cb844da2
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9852b6e5e587474d8c29532379778ae51dd39e00c26429893a215f85bc30c167
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0a968d7d780efee8f341aadbab582dbbe13bc0403a5dcef45660d8cec95e8d0
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ef3a4f000815517a36cb550e3d6a0b047cd99707a9512ad986983ddcb130935
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c1de6015df5f3853bbd99f500c35547732631accb13f3b3878638a32e6f88a6
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd147ffb179b1f379948e6c463e13620bded0fe7ab7c5d2c0a6c69e9f52036fd
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:24e64288fc28d6e69610a96fc224a58ce4f6b2d3163db63945b8560d17869f35
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3932688e0b053633443e7dcfdd4200942589a8b739f2180e7f097fb97694cc20
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:57eb9846cf2019918873471998ef0262ed8583559d0bcc62800355147a37cfe6
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80c7b517c93ef0dcd3a14f9e76216b29815c1cca13f471a08d477f894c819e9a
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33294d901bcaf4f97d9021bcf62f6089cc4094c645d7dd2cf6d521f25c36904a
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_150000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:733ce2b43b88d7a4c64faa4e715afae21bc1552e87c5f91532cc16150710b0d0
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_1500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c1c0012f3b136e08195eb97ae53a9cba2d1ae09ba2696056701d33ce40e1f6f
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_200000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f49e3f06101cabcbc4d592493b01dce7cfbb68fe59296bfd0fcbad38849ff0e
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f28ba68f53dbf88497e0521240e8687a34e995b8bdd7dfefd9f16bb58cc8469
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7efa535e3168639385922917b667b72f656c88a582ce8b4b9b122366aab37f3e
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91e9cc01060a5128cd51148cabee9117e85551625465b1d4081a6b436f081ae5
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:050f5c9ed1f91cb23e1a239511e1d5ca35154f03b6b4bcd537ad98cc49fe1c3c
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8e66105c55fddca1054b7b112eafb45b28f5b0452e7c65852295fb377d0ab8b
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_50000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14c7f05d3437776d62f3653fd931648af002bbe6b0a13432a481b16f66bbea64
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06d26c6f448c5349ee1c4e45c560ec343bd862c3992b869fbe90ef605f2e539c
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92b235f3046816dd7a4896038509dd35db45da1259f9b26a26b4d21b8a1863ec
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c65596d2271321cd28f09b629e48de07683e8e95b40e3d4e29d172bb0da7db15
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ea6a113fa52a703866661329289b8c300a1dcdfd08909d7b7640e750feffd16
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b071140f1d367f996a4b74104800707ae336cc03d976ed20b24a498821ea45c
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5d7fc5a237695f3f53b571bef59fe0cd150a4bce847989efd003a7f5989dc03
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a142526698a60a5e49eeca0692ac02593de111f15e61f775cc5557f9652ea4c
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:750346d513475d5875a5b74b944df905d0b211f89ea4b08cb6cd40d050553d4e
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7512f5b3a7a7c6faa441d65ccff5836a527cdeb070c01878b05fdc52a4c940c
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1fd8c1508ed5395f6dd30a02ae63dae456aad9bbe2fbddd31821f5cd6c750f7
|
| 3 |
+
size 219314815
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
pretrained_models/cube-triple-play-singletask-task1-v0/cgql/20260320_222926/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-reproduce/runs/wb01sou4
|