| { | |
| "name": "root", | |
| "gauges": { | |
| "SoccerTwos.Policy.Entropy.mean": { | |
| "value": 1.902220368385315, | |
| "min": 1.8798245191574097, | |
| "max": 3.2957026958465576, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Policy.Entropy.sum": { | |
| "value": 38896.6015625, | |
| "min": 23470.833984375, | |
| "max": 108659.1328125, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Environment.EpisodeLength.mean": { | |
| "value": 55.61797752808989, | |
| "min": 49.714285714285715, | |
| "max": 999.0, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Environment.EpisodeLength.sum": { | |
| "value": 19800.0, | |
| "min": 12324.0, | |
| "max": 28844.0, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Self-play.ELO.mean": { | |
| "value": 1501.7467793182816, | |
| "min": 1199.5057223791089, | |
| "max": 1540.44027129552, | |
| "count": 492 | |
| }, | |
| "SoccerTwos.Self-play.ELO.sum": { | |
| "value": 267310.9267186541, | |
| "min": 2401.634377486819, | |
| "max": 299121.75718526833, | |
| "count": 492 | |
| }, | |
| "SoccerTwos.Step.mean": { | |
| "value": 4999978.0, | |
| "min": 9440.0, | |
| "max": 4999978.0, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Step.sum": { | |
| "value": 4999978.0, | |
| "min": 9440.0, | |
| "max": 4999978.0, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { | |
| "value": 0.019829465076327324, | |
| "min": -0.09591928124427795, | |
| "max": 0.21020308136940002, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { | |
| "value": 3.509815216064453, | |
| "min": -14.855474472045898, | |
| "max": 23.866817474365234, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.01356409676373005, | |
| "min": -0.09563414007425308, | |
| "max": 0.21305915713310242, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 2.4008450508117676, | |
| "min": -15.107744216918945, | |
| "max": 23.645427703857422, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Environment.CumulativeReward.mean": { | |
| "value": 0.0, | |
| "min": 0.0, | |
| "max": 0.0, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Environment.CumulativeReward.sum": { | |
| "value": 0.0, | |
| "min": 0.0, | |
| "max": 0.0, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { | |
| "value": 0.08759774057205114, | |
| "min": -0.6153846153846154, | |
| "max": 0.4061299994587898, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { | |
| "value": 15.504800081253052, | |
| "min": -59.5175998210907, | |
| "max": 49.892799854278564, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { | |
| "value": 0.08759774057205114, | |
| "min": -0.6153846153846154, | |
| "max": 0.4061299994587898, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { | |
| "value": 15.504800081253052, | |
| "min": -59.5175998210907, | |
| "max": 49.892799854278564, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 500 | |
| }, | |
| "SoccerTwos.Losses.PolicyLoss.mean": { | |
| "value": 0.010770902594473834, | |
| "min": 0.010770902594473834, | |
| "max": 0.024406571467019, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Losses.PolicyLoss.sum": { | |
| "value": 0.010770902594473834, | |
| "min": 0.010770902594473834, | |
| "max": 0.024406571467019, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Losses.ValueLoss.mean": { | |
| "value": 0.10224802096684774, | |
| "min": 6.370583942043595e-05, | |
| "max": 0.10771091034015019, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Losses.ValueLoss.sum": { | |
| "value": 0.10224802096684774, | |
| "min": 6.370583942043595e-05, | |
| "max": 0.10771091034015019, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Losses.BaselineLoss.mean": { | |
| "value": 0.1042000745733579, | |
| "min": 6.349220360183002e-05, | |
| "max": 0.10975950236121813, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Losses.BaselineLoss.sum": { | |
| "value": 0.1042000745733579, | |
| "min": 6.349220360183002e-05, | |
| "max": 0.10975950236121813, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Policy.LearningRate.mean": { | |
| "value": 0.0003, | |
| "min": 0.0003, | |
| "max": 0.0003, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Policy.LearningRate.sum": { | |
| "value": 0.0003, | |
| "min": 0.0003, | |
| "max": 0.0003, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Policy.Epsilon.mean": { | |
| "value": 0.20000000000000007, | |
| "min": 0.2, | |
| "max": 0.20000000000000007, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Policy.Epsilon.sum": { | |
| "value": 0.20000000000000007, | |
| "min": 0.2, | |
| "max": 0.20000000000000007, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Policy.Beta.mean": { | |
| "value": 0.005000000000000001, | |
| "min": 0.005, | |
| "max": 0.005000000000000001, | |
| "count": 241 | |
| }, | |
| "SoccerTwos.Policy.Beta.sum": { | |
| "value": 0.005000000000000001, | |
| "min": 0.005, | |
| "max": 0.005000000000000001, | |
| "count": 241 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1676356153", | |
| "python_version": "3.9.0 (default, Nov 15 2020, 14:28:56) \n[GCC 7.3.0]", | |
| "command_line_arguments": "/home/olav/dev/anaconda3/envs/rl/bin/mlagents-learn baseline_config.yaml --env=./ml-agents/training-envs-executables/SoccerTwos.x86_64 --run-id=baseline --no-graphics --results-dir=./ml-agents/results --force", | |
| "mlagents_version": "0.31.0.dev0", | |
| "mlagents_envs_version": "0.31.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "1.11.0", | |
| "numpy_version": "1.21.2", | |
| "end_time_seconds": "1676360710" | |
| }, | |
| "total": 4556.409521426001, | |
| "count": 1, | |
| "self": 0.21829356800299138, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.007075053999869851, | |
| "count": 1, | |
| "self": 0.007075053999869851 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 4556.184152803999, | |
| "count": 1, | |
| "self": 3.7660274021764053, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.7079156409854477, | |
| "count": 25, | |
| "self": 2.7079156409854477 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 4549.590081618844, | |
| "count": 339195, | |
| "self": 3.8062295802701556, | |
| "children": { | |
| "env_step": { | |
| "total": 3325.751270890276, | |
| "count": 339195, | |
| "self": 2444.2383848079116, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 879.2354413706198, | |
| "count": 339195, | |
| "self": 24.615664796565397, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 854.6197765740544, | |
| "count": 630046, | |
| "self": 854.6197765740544 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 2.277444711744465, | |
| "count": 339195, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 4550.621719077015, | |
| "count": 339195, | |
| "is_parallel": true, | |
| "self": 2565.3810402612326, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0018831889974535443, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.00047415399967576377, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0014090349977777805, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0014090349977777805 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.014492382997559616, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00042730500354082324, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0003527939988998696, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003527939988998696 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.012379479998344323, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.012379479998344323 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0013328039967746008, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.00026445299954502843, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0010683509972295724, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0010683509972295724 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1985.2043392907872, | |
| "count": 339194, | |
| "is_parallel": true, | |
| "self": 135.7385649650896, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 91.14345474129004, | |
| "count": 339194, | |
| "is_parallel": true, | |
| "self": 91.14345474129004 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1352.4512743431078, | |
| "count": 339194, | |
| "is_parallel": true, | |
| "self": 1352.4512743431078 | |
| }, | |
| "steps_from_proto": { | |
| "total": 405.8710452412997, | |
| "count": 678388, | |
| "is_parallel": true, | |
| "self": 76.04295478028507, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 329.82809046101465, | |
| "count": 2713552, | |
| "is_parallel": true, | |
| "self": 329.82809046101465 | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.03633952499512816, | |
| "count": 48, | |
| "is_parallel": true, | |
| "self": 0.006832120940089226, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.029507404055038933, | |
| "count": 192, | |
| "is_parallel": true, | |
| "self": 0.029507404055038933 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 1220.032581148298, | |
| "count": 339195, | |
| "self": 31.443536122798832, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 454.6751856874653, | |
| "count": 339195, | |
| "self": 453.46062648547013, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 1.2145592019951437, | |
| "count": 10, | |
| "self": 1.2145592019951437 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 733.913859338034, | |
| "count": 241, | |
| "self": 519.5579340195, | |
| "children": { | |
| "TorchPOCAOptimizer.update": { | |
| "total": 214.355925318534, | |
| "count": 7233, | |
| "self": 214.355925318534 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 6.899936124682426e-07, | |
| "count": 1, | |
| "self": 6.899936124682426e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.12012745199899655, | |
| "count": 1, | |
| "self": 0.0008023029949981719, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.11932514900399838, | |
| "count": 1, | |
| "self": 0.11932514900399838 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |