| { |
| "name": "root", |
| "gauges": { |
| "SoccerTwos.Policy.Entropy.mean": { |
| "value": 1.4606472253799438, |
| "min": 1.2818001508712769, |
| "max": 3.295718193054199, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.Entropy.sum": { |
| "value": 30287.98046875, |
| "min": 16307.234375, |
| "max": 109189.453125, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.mean": { |
| "value": 91.50943396226415, |
| "min": 40.30833333333333, |
| "max": 999.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.sum": { |
| "value": 19400.0, |
| "min": 13036.0, |
| "max": 28132.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Self-play.ELO.mean": { |
| "value": 1638.1093737463184, |
| "min": 1198.4322416455373, |
| "max": 1715.266684285121, |
| "count": 4978 |
| }, |
| "SoccerTwos.Self-play.ELO.sum": { |
| "value": 173639.59361710976, |
| "min": 2397.567130297888, |
| "max": 397417.51250759757, |
| "count": 4978 |
| }, |
| "SoccerTwos.Step.mean": { |
| "value": 49999972.0, |
| "min": 9086.0, |
| "max": 49999972.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Step.sum": { |
| "value": 49999972.0, |
| "min": 9086.0, |
| "max": 49999972.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
| "value": -0.035314299166202545, |
| "min": -0.1513925939798355, |
| "max": 0.261381059885025, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
| "value": -3.778630018234253, |
| "min": -33.76054763793945, |
| "max": 35.04165267944336, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
| "value": -0.03379722312092781, |
| "min": -0.15381675958633423, |
| "max": 0.26418569684028625, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
| "value": -3.616302728652954, |
| "min": -34.3011360168457, |
| "max": 35.56377410888672, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.mean": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.sum": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { |
| "value": 0.1563420557530127, |
| "min": -0.5447555556893349, |
| "max": 0.6125354814913965, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { |
| "value": 16.728599965572357, |
| "min": -87.84300005435944, |
| "max": 76.05240023136139, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { |
| "value": 0.1563420557530127, |
| "min": -0.5447555556893349, |
| "max": 0.6125354814913965, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { |
| "value": 16.728599965572357, |
| "min": -87.84300005435944, |
| "max": 76.05240023136139, |
| "count": 5000 |
| }, |
| "SoccerTwos.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.mean": { |
| "value": 0.020271552559764434, |
| "min": 0.009705064026638866, |
| "max": 0.02512652772832856, |
| "count": 2424 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.sum": { |
| "value": 0.020271552559764434, |
| "min": 0.009705064026638866, |
| "max": 0.02512652772832856, |
| "count": 2424 |
| }, |
| "SoccerTwos.Losses.ValueLoss.mean": { |
| "value": 0.08147014304995537, |
| "min": 0.00011633944911106179, |
| "max": 0.12695539717872936, |
| "count": 2424 |
| }, |
| "SoccerTwos.Losses.ValueLoss.sum": { |
| "value": 0.08147014304995537, |
| "min": 0.00011633944911106179, |
| "max": 0.12695539717872936, |
| "count": 2424 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.mean": { |
| "value": 0.0821972573796908, |
| "min": 0.00010153193531247477, |
| "max": 0.12931535094976426, |
| "count": 2424 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.sum": { |
| "value": 0.0821972573796908, |
| "min": 0.00010153193531247477, |
| "max": 0.12931535094976426, |
| "count": 2424 |
| }, |
| "SoccerTwos.Policy.LearningRate.mean": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 2424 |
| }, |
| "SoccerTwos.Policy.LearningRate.sum": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 2424 |
| }, |
| "SoccerTwos.Policy.Epsilon.mean": { |
| "value": 0.20000000000000007, |
| "min": 0.20000000000000007, |
| "max": 0.20000000000000007, |
| "count": 2424 |
| }, |
| "SoccerTwos.Policy.Epsilon.sum": { |
| "value": 0.20000000000000007, |
| "min": 0.20000000000000007, |
| "max": 0.20000000000000007, |
| "count": 2424 |
| }, |
| "SoccerTwos.Policy.Beta.mean": { |
| "value": 0.005000000000000001, |
| "min": 0.005000000000000001, |
| "max": 0.005000000000000001, |
| "count": 2424 |
| }, |
| "SoccerTwos.Policy.Beta.sum": { |
| "value": 0.005000000000000001, |
| "min": 0.005000000000000001, |
| "max": 0.005000000000000001, |
| "count": 2424 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1678720696", |
| "python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]", |
| "command_line_arguments": "/home/ivan/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --force", |
| "mlagents_version": "0.31.0.dev0", |
| "mlagents_envs_version": "0.31.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "1.11.0+cu102", |
| "numpy_version": "1.21.2", |
| "end_time_seconds": "1678864766" |
| }, |
| "total": 144070.11821003904, |
| "count": 1, |
| "self": 0.2191282089916058, |
| "children": { |
| "run_training.setup": { |
| "total": 0.008097673009615391, |
| "count": 1, |
| "self": 0.008097673009615391 |
| }, |
| "TrainerController.start_learning": { |
| "total": 144069.89098415704, |
| "count": 1, |
| "self": 69.02466520911548, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 4.632106091885362, |
| "count": 250, |
| "self": 4.632106091885362 |
| }, |
| "TrainerController.advance": { |
| "total": 143996.0793338091, |
| "count": 3442990, |
| "self": 66.45647222403204, |
| "children": { |
| "env_step": { |
| "total": 46244.63626892376, |
| "count": 3442990, |
| "self": 37887.79250735021, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 8317.804537528718, |
| "count": 3442990, |
| "self": 336.71693324833177, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 7981.087604280387, |
| "count": 6283122, |
| "self": 7981.087604280387 |
| } |
| } |
| }, |
| "workers": { |
| "total": 39.03922404482728, |
| "count": 3442990, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 143976.92156786704, |
| "count": 3442990, |
| "is_parallel": true, |
| "self": 113122.60298189969, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.001963631948456168, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.000467139994725585, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0014964919537305832, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0014964919537305832 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.019571140001062304, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0004837249871343374, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0003792460192926228, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003792460192926228 |
| }, |
| "communicator.exchange": { |
| "total": 0.017254301987122744, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.017254301987122744 |
| }, |
| "steps_from_proto": { |
| "total": 0.0014538670075125992, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.0003151089767925441, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.001138758030720055, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.001138758030720055 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 30853.926119588723, |
| "count": 3442989, |
| "is_parallel": true, |
| "self": 1769.8957734311116, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 1270.0130755080027, |
| "count": 3442989, |
| "is_parallel": true, |
| "self": 1270.0130755080027 |
| }, |
| "communicator.exchange": { |
| "total": 22603.56078915886, |
| "count": 3442989, |
| "is_parallel": true, |
| "self": 22603.56078915886 |
| }, |
| "steps_from_proto": { |
| "total": 5210.45648149075, |
| "count": 6885978, |
| "is_parallel": true, |
| "self": 1112.2107851236942, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 4098.245696367056, |
| "count": 27543912, |
| "is_parallel": true, |
| "self": 4098.245696367056 |
| } |
| } |
| } |
| } |
| }, |
| "steps_from_proto": { |
| "total": 0.39246637863107026, |
| "count": 498, |
| "is_parallel": true, |
| "self": 0.08386936254100874, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.3085970160900615, |
| "count": 1992, |
| "is_parallel": true, |
| "self": 0.3085970160900615 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 97684.9865926613, |
| "count": 3442990, |
| "self": 435.5247600186849, |
| "children": { |
| "process_trajectory": { |
| "total": 8790.586209100147, |
| "count": 3442990, |
| "self": 8773.4900656924, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 17.09614340774715, |
| "count": 100, |
| "self": 17.09614340774715 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 88458.87562354247, |
| "count": 2424, |
| "self": 6828.4682076094905, |
| "children": { |
| "TorchPOCAOptimizer.update": { |
| "total": 81630.40741593298, |
| "count": 72720, |
| "self": 81630.40741593298 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 7.189810276031494e-07, |
| "count": 1, |
| "self": 7.189810276031494e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.15487832797225565, |
| "count": 1, |
| "self": 0.0010931319557130337, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.1537851960165426, |
| "count": 1, |
| "self": 0.1537851960165426 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |