| { |
| "name": "root", |
| "gauges": { |
| "SoccerTwos.Policy.Entropy.mean": { |
| "value": 1.7185440063476562, |
| "min": 1.712857723236084, |
| "max": 3.295708656311035, |
| "count": 800 |
| }, |
| "SoccerTwos.Policy.Entropy.sum": { |
| "value": 36790.58984375, |
| "min": 18034.27734375, |
| "max": 105462.6796875, |
| "count": 800 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.mean": { |
| "value": 61.38461538461539, |
| "min": 42.839285714285715, |
| "max": 999.0, |
| "count": 800 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.sum": { |
| "value": 19152.0, |
| "min": 3996.0, |
| "max": 29320.0, |
| "count": 800 |
| }, |
| "SoccerTwos.Self-play.ELO.mean": { |
| "value": 1720.4272013985615, |
| "min": 1195.1268524246282, |
| "max": 1747.530858757312, |
| "count": 782 |
| }, |
| "SoccerTwos.Self-play.ELO.sum": { |
| "value": 268386.6434181756, |
| "min": 2390.253704849257, |
| "max": 386028.50408218155, |
| "count": 782 |
| }, |
| "SoccerTwos.Step.mean": { |
| "value": 7999944.0, |
| "min": 9388.0, |
| "max": 7999944.0, |
| "count": 800 |
| }, |
| "SoccerTwos.Step.sum": { |
| "value": 7999944.0, |
| "min": 9388.0, |
| "max": 7999944.0, |
| "count": 800 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
| "value": -0.04483793303370476, |
| "min": -0.11136051267385483, |
| "max": 0.32275745272636414, |
| "count": 800 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
| "value": -7.039555549621582, |
| "min": -24.94475555419922, |
| "max": 42.92183303833008, |
| "count": 800 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
| "value": -0.04256414249539375, |
| "min": -0.11507757753133774, |
| "max": 0.32423368096351624, |
| "count": 800 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
| "value": -6.682570457458496, |
| "min": -25.77737808227539, |
| "max": 43.09465789794922, |
| "count": 800 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.mean": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 800 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.sum": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 800 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { |
| "value": -0.1414394894982599, |
| "min": -0.46153846153846156, |
| "max": 0.8060407765860697, |
| "count": 800 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { |
| "value": -22.205999851226807, |
| "min": -59.10460019111633, |
| "max": 83.02219998836517, |
| "count": 800 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { |
| "value": -0.1414394894982599, |
| "min": -0.46153846153846156, |
| "max": 0.8060407765860697, |
| "count": 800 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { |
| "value": -22.205999851226807, |
| "min": -59.10460019111633, |
| "max": 83.02219998836517, |
| "count": 800 |
| }, |
| "SoccerTwos.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 800 |
| }, |
| "SoccerTwos.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 800 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.mean": { |
| "value": 0.016280188617793102, |
| "min": 0.011284240738799174, |
| "max": 0.025832497673885277, |
| "count": 385 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.sum": { |
| "value": 0.016280188617793102, |
| "min": 0.011284240738799174, |
| "max": 0.025832497673885277, |
| "count": 385 |
| }, |
| "SoccerTwos.Losses.ValueLoss.mean": { |
| "value": 0.10526493216554324, |
| "min": 1.2015580068691634e-05, |
| "max": 0.12397578631838163, |
| "count": 385 |
| }, |
| "SoccerTwos.Losses.ValueLoss.sum": { |
| "value": 0.10526493216554324, |
| "min": 1.2015580068691634e-05, |
| "max": 0.12397578631838163, |
| "count": 385 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.mean": { |
| "value": 0.10657266477743785, |
| "min": 1.1846101369883399e-05, |
| "max": 0.12565159474809964, |
| "count": 385 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.sum": { |
| "value": 0.10657266477743785, |
| "min": 1.1846101369883399e-05, |
| "max": 0.12565159474809964, |
| "count": 385 |
| }, |
| "SoccerTwos.Policy.LearningRate.mean": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 385 |
| }, |
| "SoccerTwos.Policy.LearningRate.sum": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 385 |
| }, |
| "SoccerTwos.Policy.Epsilon.mean": { |
| "value": 0.20000000000000007, |
| "min": 0.19999999999999996, |
| "max": 0.20000000000000007, |
| "count": 385 |
| }, |
| "SoccerTwos.Policy.Epsilon.sum": { |
| "value": 0.20000000000000007, |
| "min": 0.19999999999999996, |
| "max": 0.20000000000000007, |
| "count": 385 |
| }, |
| "SoccerTwos.Policy.Beta.mean": { |
| "value": 0.005000000000000001, |
| "min": 0.005, |
| "max": 0.005000000000000001, |
| "count": 385 |
| }, |
| "SoccerTwos.Policy.Beta.sum": { |
| "value": 0.005000000000000001, |
| "min": 0.005, |
| "max": 0.005000000000000001, |
| "count": 385 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1675969539", |
| "python_version": "3.9.16 (main, Jan 11 2023, 16:05:54) \n[GCC 11.2.0]", |
| "command_line_arguments": "/home/lsaulier/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos_2 --no-graphics", |
| "mlagents_version": "0.31.0.dev0", |
| "mlagents_envs_version": "0.31.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "1.11.0+cu102", |
| "numpy_version": "1.21.2", |
| "end_time_seconds": "1675991702" |
| }, |
| "total": 22163.11969683, |
| "count": 1, |
| "self": 0.21965920000366168, |
| "children": { |
| "run_training.setup": { |
| "total": 0.007608962994709145, |
| "count": 1, |
| "self": 0.007608962994709145 |
| }, |
| "TrainerController.start_learning": { |
| "total": 22162.892428667, |
| "count": 1, |
| "self": 11.635546017918386, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 0.852964419987984, |
| "count": 20, |
| "self": 0.852964419987984 |
| }, |
| "TrainerController.advance": { |
| "total": 22150.273212965105, |
| "count": 546024, |
| "self": 10.067874203523388, |
| "children": { |
| "env_step": { |
| "total": 6366.853094141094, |
| "count": 546024, |
| "self": 5136.617505596732, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 1223.4178501296628, |
| "count": 546024, |
| "self": 50.36454255526769, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 1173.0533075743951, |
| "count": 1003434, |
| "self": 1173.0533075743951 |
| } |
| } |
| }, |
| "workers": { |
| "total": 6.817738414698397, |
| "count": 546024, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 22150.67067910044, |
| "count": 546024, |
| "is_parallel": true, |
| "self": 18097.142765594042, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.001882700998976361, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.0005679990063072182, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0013147019926691428, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0013147019926691428 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.017189674996188842, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00042573100654408336, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.00039789799484424293, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00039789799484424293 |
| }, |
| "communicator.exchange": { |
| "total": 0.0151750759978313, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0151750759978313 |
| }, |
| "steps_from_proto": { |
| "total": 0.0011909699969692156, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.00025141499645542353, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.000939555000513792, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.000939555000513792 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 4053.5034054913704, |
| "count": 546023, |
| "is_parallel": true, |
| "self": 245.24890382892045, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 189.3249936548309, |
| "count": 546023, |
| "is_parallel": true, |
| "self": 189.3249936548309 |
| }, |
| "communicator.exchange": { |
| "total": 2939.566085178936, |
| "count": 546023, |
| "is_parallel": true, |
| "self": 2939.566085178936 |
| }, |
| "steps_from_proto": { |
| "total": 679.3634228286828, |
| "count": 1092046, |
| "is_parallel": true, |
| "self": 132.3677148117349, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 546.9957080169479, |
| "count": 4368184, |
| "is_parallel": true, |
| "self": 546.9957080169479 |
| } |
| } |
| } |
| } |
| }, |
| "steps_from_proto": { |
| "total": 0.024508015027095098, |
| "count": 38, |
| "is_parallel": true, |
| "self": 0.004874444020970259, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.01963357100612484, |
| "count": 152, |
| "is_parallel": true, |
| "self": 0.01963357100612484 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 15773.352244620488, |
| "count": 546024, |
| "self": 90.01150891112047, |
| "children": { |
| "process_trajectory": { |
| "total": 1849.1886234544581, |
| "count": 546024, |
| "self": 1847.0379783684475, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 2.150645086010627, |
| "count": 16, |
| "self": 2.150645086010627 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 13834.15211225491, |
| "count": 385, |
| "self": 893.2984637601694, |
| "children": { |
| "TorchPOCAOptimizer.update": { |
| "total": 12940.85364849474, |
| "count": 11568, |
| "self": 12940.85364849474 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 6.809932528994977e-07, |
| "count": 1, |
| "self": 6.809932528994977e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.13070458299625898, |
| "count": 1, |
| "self": 0.0012228909981786273, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.12948169199808035, |
| "count": 1, |
| "self": 0.12948169199808035 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |