| { |
| "name": "root", |
| "gauges": { |
| "SoccerTwos.Policy.Entropy.mean": { |
| "value": 1.9089889526367188, |
| "min": 1.8442237377166748, |
| "max": 3.213865041732788, |
| "count": 472 |
| }, |
| "SoccerTwos.Policy.Entropy.sum": { |
| "value": 35919.53515625, |
| "min": 29317.10546875, |
| "max": 120344.625, |
| "count": 472 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.mean": { |
| "value": 62.17948717948718, |
| "min": 42.51304347826087, |
| "max": 999.0, |
| "count": 472 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.sum": { |
| "value": 19400.0, |
| "min": 11112.0, |
| "max": 28436.0, |
| "count": 472 |
| }, |
| "SoccerTwos.Self-play.ELO.mean": { |
| "value": 1556.9494059513054, |
| "min": 1184.4253004330594, |
| "max": 1576.660508881427, |
| "count": 471 |
| }, |
| "SoccerTwos.Self-play.ELO.sum": { |
| "value": 242884.10732840362, |
| "min": 2370.6947943219175, |
| "max": 334525.03998778446, |
| "count": 471 |
| }, |
| "SoccerTwos.Step.mean": { |
| "value": 5039949.0, |
| "min": 329805.0, |
| "max": 5039949.0, |
| "count": 472 |
| }, |
| "SoccerTwos.Step.sum": { |
| "value": 5039949.0, |
| "min": 329805.0, |
| "max": 5039949.0, |
| "count": 472 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
| "value": -0.010436630807816982, |
| "min": -0.09697045385837555, |
| "max": 0.1714733988046646, |
| "count": 472 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
| "value": -1.6385509967803955, |
| "min": -16.600444793701172, |
| "max": 23.41659164428711, |
| "count": 472 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
| "value": -0.01028787437826395, |
| "min": -0.09972328692674637, |
| "max": 0.17430460453033447, |
| "count": 472 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
| "value": -1.6151962280273438, |
| "min": -17.1435546875, |
| "max": 23.17365837097168, |
| "count": 472 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.mean": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 472 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.sum": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 472 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { |
| "value": 0.10489171933216654, |
| "min": -0.5669750012457371, |
| "max": 0.44391110796987276, |
| "count": 472 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { |
| "value": 16.467999935150146, |
| "min": -50.66320013999939, |
| "max": 46.512000262737274, |
| "count": 472 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { |
| "value": 0.10489171933216654, |
| "min": -0.5669750012457371, |
| "max": 0.44391110796987276, |
| "count": 472 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { |
| "value": 16.467999935150146, |
| "min": -50.66320013999939, |
| "max": 46.512000262737274, |
| "count": 472 |
| }, |
| "SoccerTwos.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 472 |
| }, |
| "SoccerTwos.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 472 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.mean": { |
| "value": 0.016275092681947476, |
| "min": 0.010151559529488926, |
| "max": 0.024196836646297015, |
| "count": 227 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.sum": { |
| "value": 0.016275092681947476, |
| "min": 0.010151559529488926, |
| "max": 0.024196836646297015, |
| "count": 227 |
| }, |
| "SoccerTwos.Losses.ValueLoss.mean": { |
| "value": 0.09684030537803968, |
| "min": 0.0013416305688830714, |
| "max": 0.11689281612634658, |
| "count": 227 |
| }, |
| "SoccerTwos.Losses.ValueLoss.sum": { |
| "value": 0.09684030537803968, |
| "min": 0.0013416305688830714, |
| "max": 0.11689281612634658, |
| "count": 227 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.mean": { |
| "value": 0.09833643784125647, |
| "min": 0.0013579658038603763, |
| "max": 0.11826808328429858, |
| "count": 227 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.sum": { |
| "value": 0.09833643784125647, |
| "min": 0.0013579658038603763, |
| "max": 0.11826808328429858, |
| "count": 227 |
| }, |
| "SoccerTwos.Policy.LearningRate.mean": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 227 |
| }, |
| "SoccerTwos.Policy.LearningRate.sum": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 227 |
| }, |
| "SoccerTwos.Policy.Epsilon.mean": { |
| "value": 0.20000000000000007, |
| "min": 0.20000000000000007, |
| "max": 0.20000000000000007, |
| "count": 227 |
| }, |
| "SoccerTwos.Policy.Epsilon.sum": { |
| "value": 0.20000000000000007, |
| "min": 0.20000000000000007, |
| "max": 0.20000000000000007, |
| "count": 227 |
| }, |
| "SoccerTwos.Policy.Beta.mean": { |
| "value": 0.005000000000000001, |
| "min": 0.005000000000000001, |
| "max": 0.005000000000000001, |
| "count": 227 |
| }, |
| "SoccerTwos.Policy.Beta.sum": { |
| "value": 0.005000000000000001, |
| "min": 0.005000000000000001, |
| "max": 0.005000000000000001, |
| "count": 227 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1688468546", |
| "python_version": "3.10.10 (main, Mar 21 2023, 18:45:11) [GCC 11.2.0]", |
| "command_line_arguments": "/opt/conda/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume", |
| "mlagents_version": "0.31.0.dev0", |
| "mlagents_envs_version": "0.31.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "1.11.0+cu102", |
| "numpy_version": "1.21.2", |
| "end_time_seconds": "1688485154" |
| }, |
| "total": 16607.525235416368, |
| "count": 1, |
| "self": 0.013366627972573042, |
| "children": { |
| "run_training.setup": { |
| "total": 0.015603977721184492, |
| "count": 1, |
| "self": 0.015603977721184492 |
| }, |
| "TrainerController.start_learning": { |
| "total": 16607.496264810674, |
| "count": 1, |
| "self": 8.919515123125166, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 1.5175714301876724, |
| "count": 25, |
| "self": 1.5175714301876724 |
| }, |
| "TrainerController.advance": { |
| "total": 16596.756896799896, |
| "count": 322264, |
| "self": 7.916705624666065, |
| "children": { |
| "env_step": { |
| "total": 5911.727526604664, |
| "count": 322264, |
| "self": 4514.543463871349, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 1392.023328505922, |
| "count": 322264, |
| "self": 49.78212635125965, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 1342.2412021546625, |
| "count": 595496, |
| "self": 1342.2412021546625 |
| } |
| } |
| }, |
| "workers": { |
| "total": 5.1607342273928225, |
| "count": 322264, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 16555.016848264262, |
| "count": 322264, |
| "is_parallel": true, |
| "self": 12923.445410506334, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.00312175415456295, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.0008582943119108677, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0022634598426520824, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0022634598426520824 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.026854357682168484, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006880271248519421, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0005317311733961105, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005317311733961105 |
| }, |
| "communicator.exchange": { |
| "total": 0.023468355182558298, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.023468355182558298 |
| }, |
| "steps_from_proto": { |
| "total": 0.002166244201362133, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.000483611598610878, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.001682632602751255, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.001682632602751255 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "steps_from_proto": { |
| "total": 0.053547489922493696, |
| "count": 48, |
| "is_parallel": true, |
| "self": 0.010899828281253576, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.04264766164124012, |
| "count": 192, |
| "is_parallel": true, |
| "self": 0.04264766164124012 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 3631.5178902680054, |
| "count": 322263, |
| "is_parallel": true, |
| "self": 189.9846967374906, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 131.83427887735888, |
| "count": 322263, |
| "is_parallel": true, |
| "self": 131.83427887735888 |
| }, |
| "communicator.exchange": { |
| "total": 2676.0341983493418, |
| "count": 322263, |
| "is_parallel": true, |
| "self": 2676.0341983493418 |
| }, |
| "steps_from_proto": { |
| "total": 633.6647163038142, |
| "count": 644526, |
| "is_parallel": true, |
| "self": 126.69072948535904, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 506.97398681845516, |
| "count": 2578104, |
| "is_parallel": true, |
| "self": 506.97398681845516 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 10677.112664570566, |
| "count": 322264, |
| "self": 69.58496827818453, |
| "children": { |
| "process_trajectory": { |
| "total": 1633.3974608271383, |
| "count": 322264, |
| "self": 1630.1399948387407, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 3.2574659883975983, |
| "count": 10, |
| "self": 3.2574659883975983 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 8974.130235465243, |
| "count": 228, |
| "self": 946.202926828526, |
| "children": { |
| "TorchPOCAOptimizer.update": { |
| "total": 8027.9273086367175, |
| "count": 6840, |
| "self": 8027.9273086367175 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 2.514570951461792e-06, |
| "count": 1, |
| "self": 2.514570951461792e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.30227894289419055, |
| "count": 1, |
| "self": 0.005925939884036779, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.29635300301015377, |
| "count": 1, |
| "self": 0.29635300301015377 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |