| { | |
| "name": "root", | |
| "gauges": { | |
| "SoccerTwos.Policy.Entropy.mean": { | |
| "value": 3.149009943008423, | |
| "min": 3.0920655727386475, | |
| "max": 3.295755386352539, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Policy.Entropy.sum": { | |
| "value": 57639.4765625, | |
| "min": 17742.544921875, | |
| "max": 123030.3515625, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Environment.EpisodeLength.mean": { | |
| "value": 999.0, | |
| "min": 419.9230769230769, | |
| "max": 999.0, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Environment.EpisodeLength.sum": { | |
| "value": 19980.0, | |
| "min": 11988.0, | |
| "max": 28196.0, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Self-play.ELO.mean": { | |
| "value": 1197.1405668605373, | |
| "min": 1194.6627015140439, | |
| "max": 1204.034278640044, | |
| "count": 73 | |
| }, | |
| "SoccerTwos.Self-play.ELO.sum": { | |
| "value": 2394.2811337210746, | |
| "min": 2392.647101577426, | |
| "max": 16821.98242286591, | |
| "count": 73 | |
| }, | |
| "SoccerTwos.Step.mean": { | |
| "value": 999986.0, | |
| "min": 9116.0, | |
| "max": 999986.0, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Step.sum": { | |
| "value": 999986.0, | |
| "min": 9116.0, | |
| "max": 999986.0, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { | |
| "value": 0.002587884897366166, | |
| "min": -0.03601016849279404, | |
| "max": 0.005797781050205231, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { | |
| "value": 0.025878848508000374, | |
| "min": -0.5041423439979553, | |
| "max": 0.07835473120212555, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.0025931489653885365, | |
| "min": -0.039575692266225815, | |
| "max": 0.005782643333077431, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 0.02593148872256279, | |
| "min": -0.5540596842765808, | |
| "max": 0.07517436146736145, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Environment.CumulativeReward.mean": { | |
| "value": 0.0, | |
| "min": 0.0, | |
| "max": 0.0, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Environment.CumulativeReward.sum": { | |
| "value": 0.0, | |
| "min": 0.0, | |
| "max": 0.0, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { | |
| "value": 0.0, | |
| "min": -0.5625, | |
| "max": 0.3017142776932035, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { | |
| "value": 0.0, | |
| "min": -9.0, | |
| "max": 4.223999887704849, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { | |
| "value": 0.0, | |
| "min": -0.5625, | |
| "max": 0.3017142776932035, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { | |
| "value": 0.0, | |
| "min": -9.0, | |
| "max": 4.223999887704849, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| }, | |
| "SoccerTwos.Losses.PolicyLoss.mean": { | |
| "value": 0.0168987456165875, | |
| "min": 0.012042445930031438, | |
| "max": 0.02239705673904003, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Losses.PolicyLoss.sum": { | |
| "value": 0.0168987456165875, | |
| "min": 0.012042445930031438, | |
| "max": 0.02239705673904003, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Losses.ValueLoss.mean": { | |
| "value": 0.000625235964738143, | |
| "min": 4.422941644103654e-06, | |
| "max": 0.007038854543740551, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Losses.ValueLoss.sum": { | |
| "value": 0.000625235964738143, | |
| "min": 4.422941644103654e-06, | |
| "max": 0.007038854543740551, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Losses.BaselineLoss.mean": { | |
| "value": 0.0006257908535189927, | |
| "min": 4.599396841816391e-06, | |
| "max": 0.0070884921588003635, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Losses.BaselineLoss.sum": { | |
| "value": 0.0006257908535189927, | |
| "min": 4.599396841816391e-06, | |
| "max": 0.0070884921588003635, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Policy.LearningRate.mean": { | |
| "value": 0.0003, | |
| "min": 0.0003, | |
| "max": 0.0003, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Policy.LearningRate.sum": { | |
| "value": 0.0003, | |
| "min": 0.0003, | |
| "max": 0.0003, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Policy.Epsilon.mean": { | |
| "value": 0.20000000000000007, | |
| "min": 0.2, | |
| "max": 0.20000000000000007, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Policy.Epsilon.sum": { | |
| "value": 0.20000000000000007, | |
| "min": 0.2, | |
| "max": 0.20000000000000007, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Policy.Beta.mean": { | |
| "value": 0.005000000000000001, | |
| "min": 0.005, | |
| "max": 0.005000000000000001, | |
| "count": 46 | |
| }, | |
| "SoccerTwos.Policy.Beta.sum": { | |
| "value": 0.005000000000000001, | |
| "min": 0.005, | |
| "max": 0.005000000000000001, | |
| "count": 46 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1699443423", | |
| "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn /content/ml-agents/config/poca/SoccerTwos.yaml --env=/content/ml-agents/training-envs-executables/linux/SoccerTwos --run-id=SoccerTwos --no-graphics --force", | |
| "mlagents_version": "1.1.0.dev0", | |
| "mlagents_envs_version": "1.1.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.1.0+cu118", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1699445605" | |
| }, | |
| "total": 2181.160465174, | |
| "count": 1, | |
| "self": 0.42680890199972055, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0681738690000202, | |
| "count": 1, | |
| "self": 0.0681738690000202 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2180.665482403, | |
| "count": 1, | |
| "self": 1.482598219130523, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 4.778055871999641, | |
| "count": 5, | |
| "self": 4.778055871999641 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2174.1929239598703, | |
| "count": 64922, | |
| "self": 1.6057936520119256, | |
| "children": { | |
| "env_step": { | |
| "total": 1780.3524618128895, | |
| "count": 64922, | |
| "self": 1369.766810939087, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 409.6754709328279, | |
| "count": 64922, | |
| "self": 10.97205778098487, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 398.70341315184305, | |
| "count": 129046, | |
| "self": 398.70341315184305 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.9101799409745581, | |
| "count": 64922, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2176.474749460971, | |
| "count": 64922, | |
| "is_parallel": true, | |
| "self": 1019.283098851889, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.004532323999228538, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.0010208789999524015, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0035114449992761365, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0035114449992761365 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.03913147999992361, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.001174363998870831, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.000787323000622564, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.000787323000622564 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.03343747400049324, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.03343747400049324 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.003732318999936979, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.0007477830013158382, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0029845359986211406, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0029845359986211406 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1157.181611549082, | |
| "count": 64921, | |
| "is_parallel": true, | |
| "self": 75.01715701136709, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 48.206555096093325, | |
| "count": 64921, | |
| "is_parallel": true, | |
| "self": 48.206555096093325 | |
| }, | |
| "communicator.exchange": { | |
| "total": 806.254951789816, | |
| "count": 64921, | |
| "is_parallel": true, | |
| "self": 806.254951789816 | |
| }, | |
| "steps_from_proto": { | |
| "total": 227.70294765180552, | |
| "count": 129842, | |
| "is_parallel": true, | |
| "self": 36.63705008140914, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 191.06589757039637, | |
| "count": 519368, | |
| "is_parallel": true, | |
| "self": 191.06589757039637 | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.010039060000053723, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0018889550001404132, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.00815010499991331, | |
| "count": 32, | |
| "is_parallel": true, | |
| "self": 0.00815010499991331 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 392.2346684949689, | |
| "count": 64922, | |
| "self": 14.265407442085234, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 105.45076121288639, | |
| "count": 64922, | |
| "self": 104.89955790788736, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.551203304999035, | |
| "count": 2, | |
| "self": 0.551203304999035 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 272.5184998399973, | |
| "count": 46, | |
| "self": 164.45873168098115, | |
| "children": { | |
| "TorchPOCAOptimizer.update": { | |
| "total": 108.05976815901613, | |
| "count": 1383, | |
| "self": 108.05976815901613 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.99999429041054e-07, | |
| "count": 1, | |
| "self": 9.99999429041054e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.2119033520002631, | |
| "count": 1, | |
| "self": 0.0022559970002475893, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.20964735500001552, | |
| "count": 1, | |
| "self": 0.20964735500001552 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |