| { |
| "name": "root", |
| "gauges": { |
| "SoccerTwos.Policy.Entropy.mean": { |
| "value": 1.5435189008712769, |
| "min": 1.4646319150924683, |
| "max": 1.6610451936721802, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.Entropy.sum": { |
| "value": 31759.4453125, |
| "min": 25814.9765625, |
| "max": 36021.5078125, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.mean": { |
| "value": 58.79761904761905, |
| "min": 42.716814159292035, |
| "max": 82.63333333333334, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.sum": { |
| "value": 19756.0, |
| "min": 18480.0, |
| "max": 20628.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Self-play.ELO.mean": { |
| "value": 1641.0530434980756, |
| "min": 1581.3414240873562, |
| "max": 1645.42222380018, |
| "count": 500 |
| }, |
| "SoccerTwos.Self-play.ELO.sum": { |
| "value": 275696.9113076767, |
| "min": 194048.29977610603, |
| "max": 373368.55337094323, |
| "count": 500 |
| }, |
| "SoccerTwos.Step.mean": { |
| "value": 14999981.0, |
| "min": 10009960.0, |
| "max": 14999981.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Step.sum": { |
| "value": 14999981.0, |
| "min": 10009960.0, |
| "max": 14999981.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
| "value": -0.0025916770100593567, |
| "min": -0.11438218504190445, |
| "max": 0.07807338982820511, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
| "value": -0.4379934072494507, |
| "min": -23.128673553466797, |
| "max": 14.677797317504883, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.0026981872506439686, |
| "min": -0.11424611508846283, |
| "max": 0.07508175075054169, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 0.45599365234375, |
| "min": -23.13912582397461, |
| "max": 14.11536979675293, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.mean": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.sum": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { |
| "value": -0.02577988283168635, |
| "min": -0.3560073624359318, |
| "max": 0.2735396422578033, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { |
| "value": -4.356800198554993, |
| "min": -58.029200077056885, |
| "max": 46.228199541568756, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { |
| "value": -0.02577988283168635, |
| "min": -0.3560073624359318, |
| "max": 0.2735396422578033, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { |
| "value": -4.356800198554993, |
| "min": -58.029200077056885, |
| "max": 46.228199541568756, |
| "count": 500 |
| }, |
| "SoccerTwos.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 500 |
| }, |
| "SoccerTwos.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.mean": { |
| "value": 0.012675322993891314, |
| "min": 0.008311386445226769, |
| "max": 0.016500145032963095, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.sum": { |
| "value": 0.012675322993891314, |
| "min": 0.008311386445226769, |
| "max": 0.016500145032963095, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.ValueLoss.mean": { |
| "value": 0.12124239106973013, |
| "min": 0.10481940135359764, |
| "max": 0.1345561275879542, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.ValueLoss.sum": { |
| "value": 0.12124239106973013, |
| "min": 0.10481940135359764, |
| "max": 0.1345561275879542, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.mean": { |
| "value": 0.12398228074113528, |
| "min": 0.10591413453221321, |
| "max": 0.1369128222266833, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.sum": { |
| "value": 0.12398228074113528, |
| "min": 0.10591413453221321, |
| "max": 0.1369128222266833, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.LearningRate.mean": { |
| "value": 0.00019999999999999996, |
| "min": 0.00019999999999999996, |
| "max": 0.00019999999999999996, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.LearningRate.sum": { |
| "value": 0.00019999999999999996, |
| "min": 0.00019999999999999996, |
| "max": 0.00019999999999999996, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.Epsilon.mean": { |
| "value": 0.20000000000000007, |
| "min": 0.20000000000000007, |
| "max": 0.20000000000000007, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.Epsilon.sum": { |
| "value": 0.20000000000000007, |
| "min": 0.20000000000000007, |
| "max": 0.20000000000000007, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.Beta.mean": { |
| "value": 0.005000000000000001, |
| "min": 0.005000000000000001, |
| "max": 0.005000000000000001, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.Beta.sum": { |
| "value": 0.005000000000000001, |
| "min": 0.005000000000000001, |
| "max": 0.005000000000000001, |
| "count": 121 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1761011053", |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
| "command_line_arguments": "/home/ada/work/ai/venv3.10/bin/mlagents-learn ./config/poca/SoccerTwosGo.yaml --resume --env=./training-envs-executables/linux/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.9.0+cu128", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1761019758" |
| }, |
| "total": 8704.57901644602, |
| "count": 1, |
| "self": 0.9726788210100494, |
| "children": { |
| "run_training.setup": { |
| "total": 0.024575264018494636, |
| "count": 1, |
| "self": 0.024575264018494636 |
| }, |
| "TrainerController.start_learning": { |
| "total": 8703.581762360991, |
| "count": 1, |
| "self": 7.502892200194765, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 2.129385295906104, |
| "count": 26, |
| "self": 2.129385295906104 |
| }, |
| "TrainerController.advance": { |
| "total": 8691.612080165913, |
| "count": 347303, |
| "self": 6.230914909858257, |
| "children": { |
| "env_step": { |
| "total": 6704.959744712687, |
| "count": 347303, |
| "self": 5021.182745416998, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 1678.7599376246217, |
| "count": 347303, |
| "self": 39.04678861272987, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 1639.7131490118918, |
| "count": 627670, |
| "self": 1639.7131490118918 |
| } |
| } |
| }, |
| "workers": { |
| "total": 5.017061671067495, |
| "count": 347303, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 8685.496602965024, |
| "count": 347303, |
| "is_parallel": true, |
| "self": 4470.667818740127, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.002683888975298032, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.000585997971938923, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.002097891003359109, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.002097891003359109 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.021987969987094402, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0004761809832416475, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.00046435699914582074, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00046435699914582074 |
| }, |
| "communicator.exchange": { |
| "total": 0.01973794001969509, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.01973794001969509 |
| }, |
| "steps_from_proto": { |
| "total": 0.0013094919850118458, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.00024246098473668098, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0010670310002751648, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0010670310002751648 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "steps_from_proto": { |
| "total": 0.05173607706092298, |
| "count": 50, |
| "is_parallel": true, |
| "self": 0.008709836401976645, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.043026240658946335, |
| "count": 200, |
| "is_parallel": true, |
| "self": 0.043026240658946335 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 4214.7770481478365, |
| "count": 347302, |
| "is_parallel": true, |
| "self": 237.83366664528148, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 162.09566081810044, |
| "count": 347302, |
| "is_parallel": true, |
| "self": 162.09566081810044 |
| }, |
| "communicator.exchange": { |
| "total": 3184.5067745028355, |
| "count": 347302, |
| "is_parallel": true, |
| "self": 3184.5067745028355 |
| }, |
| "steps_from_proto": { |
| "total": 630.3409461816191, |
| "count": 694604, |
| "is_parallel": true, |
| "self": 106.73629873536993, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 523.6046474462491, |
| "count": 2778416, |
| "is_parallel": true, |
| "self": 523.6046474462491 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 1980.4214205433673, |
| "count": 347303, |
| "self": 60.59123472208739, |
| "children": { |
| "process_trajectory": { |
| "total": 951.9022839034442, |
| "count": 347303, |
| "self": 928.9015034834156, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 23.000780420028605, |
| "count": 10, |
| "self": 23.000780420028605 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 967.9279019178357, |
| "count": 121, |
| "self": 540.7814483185066, |
| "children": { |
| "TorchPOCAOptimizer.update": { |
| "total": 427.1464535993291, |
| "count": 3630, |
| "self": 427.1464535993291 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 5.709880497306585e-07, |
| "count": 1, |
| "self": 5.709880497306585e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 2.33740412798943, |
| "count": 1, |
| "self": 0.15179298998555169, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 2.1856111380038783, |
| "count": 1, |
| "self": 2.1856111380038783 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |