| { |
| "name": "root", |
| "gauges": { |
| "SoccerTwos.Policy.Entropy.mean": { |
| "value": 3.2812230587005615, |
| "min": 3.2812230587005615, |
| "max": 3.295708656311035, |
| "count": 5 |
| }, |
| "SoccerTwos.Policy.Entropy.sum": { |
| "value": 70559.421875, |
| "min": 15777.21875, |
| "max": 105462.6796875, |
| "count": 5 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.mean": { |
| "value": 717.4285714285714, |
| "min": 623.5714285714286, |
| "max": 995.0, |
| "count": 5 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.sum": { |
| "value": 20088.0, |
| "min": 14204.0, |
| "max": 28652.0, |
| "count": 5 |
| }, |
| "SoccerTwos.Self-play.ELO.mean": { |
| "value": 1200.105955145682, |
| "min": 1198.9373468557678, |
| "max": 1200.9769858473817, |
| "count": 5 |
| }, |
| "SoccerTwos.Self-play.ELO.sum": { |
| "value": 7200.635730874092, |
| "min": 2400.056872686747, |
| "max": 12009.769858473817, |
| "count": 5 |
| }, |
| "SoccerTwos.Step.mean": { |
| "value": 49822.0, |
| "min": 9342.0, |
| "max": 49822.0, |
| "count": 5 |
| }, |
| "SoccerTwos.Step.sum": { |
| "value": 49822.0, |
| "min": 9342.0, |
| "max": 49822.0, |
| "count": 5 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
| "value": -0.07366155833005905, |
| "min": -0.1015477403998375, |
| "max": -0.07366155833005905, |
| "count": 5 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
| "value": -0.9576002955436707, |
| "min": -1.3201180696487427, |
| "max": -0.8542187809944153, |
| "count": 5 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
| "value": -0.07048321515321732, |
| "min": -0.10155700147151947, |
| "max": -0.07048321515321732, |
| "count": 5 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
| "value": -0.9162818193435669, |
| "min": -1.3202409744262695, |
| "max": -0.8557853102684021, |
| "count": 5 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.mean": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 5 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.sum": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 5 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { |
| "value": -0.05258461145254282, |
| "min": -0.3301090896129608, |
| "max": -0.05258461145254282, |
| "count": 5 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { |
| "value": -0.6835999488830566, |
| "min": -3.631199985742569, |
| "max": -0.6835999488830566, |
| "count": 5 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { |
| "value": -0.05258461145254282, |
| "min": -0.3301090896129608, |
| "max": -0.05258461145254282, |
| "count": 5 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { |
| "value": -0.6835999488830566, |
| "min": -3.631199985742569, |
| "max": -0.6835999488830566, |
| "count": 5 |
| }, |
| "SoccerTwos.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 5 |
| }, |
| "SoccerTwos.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 5 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.mean": { |
| "value": 0.01506708687520586, |
| "min": 0.01506708687520586, |
| "max": 0.01566864464257378, |
| "count": 2 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.sum": { |
| "value": 0.01506708687520586, |
| "min": 0.01506708687520586, |
| "max": 0.01566864464257378, |
| "count": 2 |
| }, |
| "SoccerTwos.Losses.ValueLoss.mean": { |
| "value": 0.0036884615282443437, |
| "min": 0.003062593149176488, |
| "max": 0.0036884615282443437, |
| "count": 2 |
| }, |
| "SoccerTwos.Losses.ValueLoss.sum": { |
| "value": 0.0036884615282443437, |
| "min": 0.003062593149176488, |
| "max": 0.0036884615282443437, |
| "count": 2 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.mean": { |
| "value": 0.003729660508476875, |
| "min": 0.0026367754287396866, |
| "max": 0.003729660508476875, |
| "count": 2 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.sum": { |
| "value": 0.003729660508476875, |
| "min": 0.0026367754287396866, |
| "max": 0.003729660508476875, |
| "count": 2 |
| }, |
| "SoccerTwos.Policy.LearningRate.mean": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 2 |
| }, |
| "SoccerTwos.Policy.LearningRate.sum": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 2 |
| }, |
| "SoccerTwos.Policy.Epsilon.mean": { |
| "value": 0.2, |
| "min": 0.2, |
| "max": 0.20000000000000007, |
| "count": 2 |
| }, |
| "SoccerTwos.Policy.Epsilon.sum": { |
| "value": 0.2, |
| "min": 0.2, |
| "max": 0.20000000000000007, |
| "count": 2 |
| }, |
| "SoccerTwos.Policy.Beta.mean": { |
| "value": 0.005, |
| "min": 0.005, |
| "max": 0.005000000000000001, |
| "count": 2 |
| }, |
| "SoccerTwos.Policy.Beta.sum": { |
| "value": 0.005, |
| "min": 0.005, |
| "max": 0.005000000000000001, |
| "count": 2 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1699862602", |
| "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --resume --env=./training-envs-executables/linux/SoccerTwos/SoccerTwos/SoccerTwos --run-id=SoccerTwos2 --no-graphics", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.1.0+cu118", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1699862869" |
| }, |
| "total": 266.84529422700007, |
| "count": 1, |
| "self": 0.47672217900026226, |
| "children": { |
| "run_training.setup": { |
| "total": 0.05492019099983736, |
| "count": 1, |
| "self": 0.05492019099983736 |
| }, |
| "TrainerController.start_learning": { |
| "total": 266.31365185699997, |
| "count": 1, |
| "self": 0.13312792999431622, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 1.3484470980001788, |
| "count": 1, |
| "self": 1.3484470980001788 |
| }, |
| "TrainerController.advance": { |
| "total": 264.6316215560055, |
| "count": 3670, |
| "self": 0.16579634501886176, |
| "children": { |
| "env_step": { |
| "total": 123.00177471899633, |
| "count": 3670, |
| "self": 100.1245651079953, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 22.792715752999584, |
| "count": 3670, |
| "self": 0.8397715250212059, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 21.952944227978378, |
| "count": 7304, |
| "self": 21.952944227978378 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.08449385800145137, |
| "count": 3670, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 265.61760057600327, |
| "count": 3670, |
| "is_parallel": true, |
| "self": 182.17596656100454, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.003117426999779127, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.0008162530002664425, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0023011739995126845, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0023011739995126845 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.04634818399995311, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0013344429996777762, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0009126159998231742, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0009126159998231742 |
| }, |
| "communicator.exchange": { |
| "total": 0.04008600200018009, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.04008600200018009 |
| }, |
| "steps_from_proto": { |
| "total": 0.0040151230002720695, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.0007105310005499632, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0033045919997221063, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0033045919997221063 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 83.44163401499873, |
| "count": 3669, |
| "is_parallel": true, |
| "self": 5.154427128979933, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 3.0319108860080632, |
| "count": 3669, |
| "is_parallel": true, |
| "self": 3.0319108860080632 |
| }, |
| "communicator.exchange": { |
| "total": 59.40444901599835, |
| "count": 3669, |
| "is_parallel": true, |
| "self": 59.40444901599835 |
| }, |
| "steps_from_proto": { |
| "total": 15.850846984012378, |
| "count": 7338, |
| "is_parallel": true, |
| "self": 2.7187540600293687, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 13.13209292398301, |
| "count": 29352, |
| "is_parallel": true, |
| "self": 13.13209292398301 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 141.4640504919903, |
| "count": 3670, |
| "self": 1.07506253899669, |
| "children": { |
| "process_trajectory": { |
| "total": 20.72282923399348, |
| "count": 3670, |
| "self": 20.72282923399348 |
| }, |
| "_update_policy": { |
| "total": 119.66615871900012, |
| "count": 2, |
| "self": 9.33598303000008, |
| "children": { |
| "TorchPOCAOptimizer.update": { |
| "total": 110.33017568900004, |
| "count": 63, |
| "self": 110.33017568900004 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.0399999155197293e-06, |
| "count": 1, |
| "self": 1.0399999155197293e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.20045423300007315, |
| "count": 1, |
| "self": 0.0028815390001000196, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.19757269399997313, |
| "count": 1, |
| "self": 0.19757269399997313 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |