| { |
| "name": "root", |
| "gauges": { |
| "SoccerTwos.Policy.Entropy.mean": { |
| "value": 1.11602783203125, |
| "min": 1.1030526161193848, |
| "max": 1.4285537004470825, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.Entropy.sum": { |
| "value": 22320.556640625, |
| "min": 21029.970703125, |
| "max": 28662.501953125, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.mean": { |
| "value": 45.905660377358494, |
| "min": 35.28, |
| "max": 55.38202247191011, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.sum": { |
| "value": 19464.0, |
| "min": 14112.0, |
| "max": 21312.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Self-play.ELO.mean": { |
| "value": 1672.5986965358836, |
| "min": 1594.9761687604023, |
| "max": 1684.8696129621046, |
| "count": 500 |
| }, |
| "SoccerTwos.Self-play.ELO.sum": { |
| "value": 354590.92366560735, |
| "min": 291606.7260394614, |
| "max": 450906.7595913422, |
| "count": 500 |
| }, |
| "SoccerTwos.Step.mean": { |
| "value": 14999982.0, |
| "min": 10009972.0, |
| "max": 14999982.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Step.sum": { |
| "value": 14999982.0, |
| "min": 10009972.0, |
| "max": 14999982.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
| "value": -0.033846165984869, |
| "min": -0.10714015364646912, |
| "max": 0.09757562726736069, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
| "value": -13.876928329467773, |
| "min": -45.2131462097168, |
| "max": 41.95751953125, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
| "value": -0.03533671796321869, |
| "min": -0.11142526566982269, |
| "max": 0.10013997554779053, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
| "value": -14.488054275512695, |
| "min": -47.021461486816406, |
| "max": 43.06018829345703, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.mean": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.sum": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { |
| "value": -0.07970754661650029, |
| "min": -0.26102524301380786, |
| "max": 0.3510517215934293, |
| "count": 500 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { |
| "value": -16.89799988269806, |
| "min": -55.66319966316223, |
| "max": 81.4439994096756, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { |
| "value": -0.07970754661650029, |
| "min": -0.26102524301380786, |
| "max": 0.3510517215934293, |
| "count": 500 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { |
| "value": -16.89799988269806, |
| "min": -55.66319966316223, |
| "max": 81.4439994096756, |
| "count": 500 |
| }, |
| "SoccerTwos.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 500 |
| }, |
| "SoccerTwos.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 500 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.mean": { |
| "value": 0.012091718217061499, |
| "min": 0.009822013491066173, |
| "max": 0.015032402960059699, |
| "count": 76 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.sum": { |
| "value": 0.012091718217061499, |
| "min": 0.009822013491066173, |
| "max": 0.015032402960059699, |
| "count": 76 |
| }, |
| "SoccerTwos.Losses.ValueLoss.mean": { |
| "value": 0.05806648256257176, |
| "min": 0.05226881531998515, |
| "max": 0.059615218080580235, |
| "count": 76 |
| }, |
| "SoccerTwos.Losses.ValueLoss.sum": { |
| "value": 0.05806648256257176, |
| "min": 0.05226881531998515, |
| "max": 0.059615218080580235, |
| "count": 76 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.mean": { |
| "value": 0.05836009904742241, |
| "min": 0.0542876117862761, |
| "max": 0.06110596880316734, |
| "count": 76 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.sum": { |
| "value": 0.05836009904742241, |
| "min": 0.0542876117862761, |
| "max": 0.06110596880316734, |
| "count": 76 |
| }, |
| "SoccerTwos.Policy.LearningRate.mean": { |
| "value": 4.0553810392494676e-07, |
| "min": 4.0553810392494676e-07, |
| "max": 0.0001428860023203168, |
| "count": 76 |
| }, |
| "SoccerTwos.Policy.LearningRate.sum": { |
| "value": 4.0553810392494676e-07, |
| "min": 4.0553810392494676e-07, |
| "max": 0.0001428860023203168, |
| "count": 76 |
| }, |
| "SoccerTwos.Policy.Epsilon.mean": { |
| "value": 0.10005440800688417, |
| "min": 0.10005440800688417, |
| "max": 0.11917465842958205, |
| "count": 76 |
| }, |
| "SoccerTwos.Policy.Epsilon.sum": { |
| "value": 0.10005440800688417, |
| "min": 0.10005440800688417, |
| "max": 0.11917465842958205, |
| "count": 76 |
| }, |
| "SoccerTwos.Policy.Beta.mean": { |
| "value": 1.0169934717551432e-05, |
| "min": 1.0169934717551432e-05, |
| "max": 6.988898235716646e-05, |
| "count": 76 |
| }, |
| "SoccerTwos.Policy.Beta.sum": { |
| "value": 1.0169934717551432e-05, |
| "min": 1.0169934717551432e-05, |
| "max": 6.988898235716646e-05, |
| "count": 76 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1710358573", |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
| "command_line_arguments": "/home/stephan/.conda/envs/rl/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos-read-deal --width=1280 --height=720 --resume", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.2.1+cu121", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1710372965" |
| }, |
| "total": 14392.268066103992, |
| "count": 1, |
| "self": 0.3203680879960302, |
| "children": { |
| "run_training.setup": { |
| "total": 0.017996288996073417, |
| "count": 1, |
| "self": 0.017996288996073417 |
| }, |
| "TrainerController.start_learning": { |
| "total": 14391.929701727, |
| "count": 1, |
| "self": 7.222826109427842, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 4.3356985290010925, |
| "count": 10, |
| "self": 4.3356985290010925 |
| }, |
| "TrainerController.advance": { |
| "total": 14380.252779454575, |
| "count": 357131, |
| "self": 6.432589866788476, |
| "children": { |
| "env_step": { |
| "total": 6466.631959918537, |
| "count": 357131, |
| "self": 5498.500712261317, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 963.7606686544896, |
| "count": 357131, |
| "self": 29.2971219017345, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 934.4635467527551, |
| "count": 624880, |
| "self": 934.4635467527551 |
| } |
| } |
| }, |
| "workers": { |
| "total": 4.370579002730665, |
| "count": 357131, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 14380.838316511697, |
| "count": 357131, |
| "is_parallel": true, |
| "self": 9673.599672775075, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.06619343400234357, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.0004880309716099873, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.06570540303073358, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.06570540303073358 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.027265490003628656, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006784550059819594, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0004930220020469278, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0004930220020469278 |
| }, |
| "communicator.exchange": { |
| "total": 0.024494213997968473, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.024494213997968473 |
| }, |
| "steps_from_proto": { |
| "total": 0.0015997989976312965, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.00032821799686644226, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0012715810007648543, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0012715810007648543 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "steps_from_proto": { |
| "total": 0.018047201985609718, |
| "count": 18, |
| "is_parallel": true, |
| "self": 0.0030916809337213635, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.014955521051888354, |
| "count": 72, |
| "is_parallel": true, |
| "self": 0.014955521051888354 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 4707.220596534637, |
| "count": 357130, |
| "is_parallel": true, |
| "self": 257.41373912687413, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 162.74674167780904, |
| "count": 357130, |
| "is_parallel": true, |
| "self": 162.74674167780904 |
| }, |
| "communicator.exchange": { |
| "total": 3645.2510425291694, |
| "count": 357130, |
| "is_parallel": true, |
| "self": 3645.2510425291694 |
| }, |
| "steps_from_proto": { |
| "total": 641.809073200784, |
| "count": 714260, |
| "is_parallel": true, |
| "self": 114.93468356617086, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 526.8743896346132, |
| "count": 2857040, |
| "is_parallel": true, |
| "self": 526.8743896346132 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 7907.188229669249, |
| "count": 357131, |
| "self": 41.56422363645106, |
| "children": { |
| "process_trajectory": { |
| "total": 1667.4114032577781, |
| "count": 357131, |
| "self": 1666.2047581057705, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 1.2066451520076953, |
| "count": 10, |
| "self": 1.2066451520076953 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 6198.21260277502, |
| "count": 76, |
| "self": 967.3907746167824, |
| "children": { |
| "TorchPOCAOptimizer.update": { |
| "total": 5230.821828158238, |
| "count": 6080, |
| "self": 5230.821828158238 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 7.199996616691351e-07, |
| "count": 1, |
| "self": 7.199996616691351e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.11839691399654839, |
| "count": 1, |
| "self": 0.0024417589884251356, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.11595515500812326, |
| "count": 1, |
| "self": 0.11595515500812326 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |