| { |
| "name": "root", |
| "gauges": { |
| "SoccerTwos.Policy.Entropy.mean": { |
| "value": 2.043433427810669, |
| "min": 2.002654790878296, |
| "max": 3.2957193851470947, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.Entropy.sum": { |
| "value": 42307.24609375, |
| "min": 37271.40234375, |
| "max": 105462.953125, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.mean": { |
| "value": 50.69072164948454, |
| "min": 43.16814159292036, |
| "max": 999.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.sum": { |
| "value": 19668.0, |
| "min": 5044.0, |
| "max": 33112.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Self-play.ELO.mean": { |
| "value": 1569.8012609836373, |
| "min": 1194.942531212991, |
| "max": 1579.9635787113561, |
| "count": 475 |
| }, |
| "SoccerTwos.Self-play.ELO.sum": { |
| "value": 304541.44463082566, |
| "min": 2390.8722929202386, |
| "max": 354365.63427159167, |
| "count": 475 |
| }, |
| "SoccerTwos.Step.mean": { |
| "value": 4999972.0, |
| "min": 9838.0, |
| "max": 4999972.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Step.sum": { |
| "value": 4999972.0, |
| "min": 9838.0, |
| "max": 4999972.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
| "value": 0.015788059681653976, |
| "min": -0.0971170961856842, |
| "max": 0.24398364126682281, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
| "value": 3.047095537185669, |
| "min": -16.00063133239746, |
| "max": 33.913726806640625, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.016314547508955002, |
| "min": -0.10192587971687317, |
| "max": 0.24265357851982117, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 3.148707628250122, |
| "min": -17.021621704101562, |
| "max": 33.72884750366211, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.mean": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.sum": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { |
| "value": -0.05183419785968998, |
| "min": -0.5222799986600876, |
| "max": 0.6643522355093885, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { |
| "value": -10.004000186920166, |
| "min": -44.24160009622574, |
| "max": 63.76680028438568, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { |
| "value": -0.05183419785968998, |
| "min": -0.5222799986600876, |
| "max": 0.6643522355093885, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { |
| "value": -10.004000186920166, |
| "min": -44.24160009622574, |
| "max": 63.76680028438568, |
| "count": 500 |
| }, |
| "SoccerTwos.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 500 |
| }, |
| "SoccerTwos.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.mean": { |
| "value": 0.01610611495610404, |
| "min": 0.01364388675752366, |
| "max": 0.02153439579803186, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.sum": { |
| "value": 0.01610611495610404, |
| "min": 0.01364388675752366, |
| "max": 0.02153439579803186, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.ValueLoss.mean": { |
| "value": 0.11749531750877698, |
| "min": 0.00015545396484715942, |
| "max": 0.11749531750877698, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.ValueLoss.sum": { |
| "value": 0.11749531750877698, |
| "min": 0.00015545396484715942, |
| "max": 0.11749531750877698, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.mean": { |
| "value": 0.1181148203710715, |
| "min": 0.0001561577077760982, |
| "max": 0.1181419820835193, |
| "count": 121 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.sum": { |
| "value": 0.1181148203710715, |
| "min": 0.0001561577077760982, |
| "max": 0.1181419820835193, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.LearningRate.mean": { |
| "value": 9.381396873199956e-07, |
| "min": 9.381396873199956e-07, |
| "max": 0.0002975029208323599, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.LearningRate.sum": { |
| "value": 9.381396873199956e-07, |
| "min": 9.381396873199956e-07, |
| "max": 0.0002975029208323599, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.Epsilon.mean": { |
| "value": 0.10031268000000002, |
| "min": 0.10031268000000002, |
| "max": 0.19916764000000006, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.Epsilon.sum": { |
| "value": 0.10031268000000002, |
| "min": 0.10031268000000002, |
| "max": 0.19916764000000006, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.Beta.mean": { |
| "value": 1.4658931999999977e-05, |
| "min": 1.4658931999999977e-05, |
| "max": 0.001487597836, |
| "count": 121 |
| }, |
| "SoccerTwos.Policy.Beta.sum": { |
| "value": 1.4658931999999977e-05, |
| "min": 1.4658931999999977e-05, |
| "max": 0.001487597836, |
| "count": 121 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1758430599", |
| "python_version": "3.10.12 | packaged by conda-forge | (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]", |
| "command_line_arguments": "/home/server/miniconda3/envs/ml-agents/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.8.0+cu128", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1758433835" |
| }, |
| "total": 3236.878929101, |
| "count": 1, |
| "self": 0.16656741299993882, |
| "children": { |
| "run_training.setup": { |
| "total": 0.016506588000083866, |
| "count": 1, |
| "self": 0.016506588000083866 |
| }, |
| "TrainerController.start_learning": { |
| "total": 3236.6958551, |
| "count": 1, |
| "self": 3.151246516070387, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 0.9842582800001765, |
| "count": 13, |
| "self": 0.9842582800001765 |
| }, |
| "TrainerController.advance": { |
| "total": 3232.5214720049307, |
| "count": 333051, |
| "self": 2.8924686324667164, |
| "children": { |
| "env_step": { |
| "total": 2459.814977523006, |
| "count": 333051, |
| "self": 1707.511216469176, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 750.4258359408827, |
| "count": 333051, |
| "self": 20.733830670390944, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 729.6920052704918, |
| "count": 627574, |
| "self": 729.6920052704918 |
| } |
| } |
| }, |
| "workers": { |
| "total": 1.8779251129471959, |
| "count": 333051, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 3233.011003091736, |
| "count": 333051, |
| "is_parallel": true, |
| "self": 1864.9287868584966, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.001038255999901594, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.00024867599950084696, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0007895800004007469, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0007895800004007469 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.011452250999809621, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00024826599974403507, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.00020025999992867582, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00020025999992867582 |
| }, |
| "communicator.exchange": { |
| "total": 0.009989683000185323, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.009989683000185323 |
| }, |
| "steps_from_proto": { |
| "total": 0.001014041999951587, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.0004733959999612125, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0005406459999903745, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0005406459999903745 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1368.0741441232403, |
| "count": 333050, |
| "is_parallel": true, |
| "self": 77.30506817775859, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 47.11159190898388, |
| "count": 333050, |
| "is_parallel": true, |
| "self": 47.11159190898388 |
| }, |
| "communicator.exchange": { |
| "total": 1027.9904580477087, |
| "count": 333050, |
| "is_parallel": true, |
| "self": 1027.9904580477087 |
| }, |
| "steps_from_proto": { |
| "total": 215.6670259887892, |
| "count": 666100, |
| "is_parallel": true, |
| "self": 39.65504098181145, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 176.01198500697774, |
| "count": 2664400, |
| "is_parallel": true, |
| "self": 176.01198500697774 |
| } |
| } |
| } |
| } |
| }, |
| "steps_from_proto": { |
| "total": 0.008072109998920496, |
| "count": 24, |
| "is_parallel": true, |
| "self": 0.0015158339992922265, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.006556275999628269, |
| "count": 96, |
| "is_parallel": true, |
| "self": 0.006556275999628269 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 769.8140258494582, |
| "count": 333051, |
| "self": 26.450369783342012, |
| "children": { |
| "process_trajectory": { |
| "total": 354.83690559811293, |
| "count": 333051, |
| "self": 354.40445096511394, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.4324546329989971, |
| "count": 10, |
| "self": 0.4324546329989971 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 388.52675046800323, |
| "count": 121, |
| "self": 252.72680414801926, |
| "children": { |
| "TorchPOCAOptimizer.update": { |
| "total": 135.79994631998397, |
| "count": 7260, |
| "self": 135.79994631998397 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 3.72999238607008e-07, |
| "count": 1, |
| "self": 3.72999238607008e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.03887792599925888, |
| "count": 1, |
| "self": 0.0004916789994240389, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.03838624699983484, |
| "count": 1, |
| "self": 0.03838624699983484 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |