poca-SoccerTwos / run_logs /timers.json
c0ldstudy's picture
First Push
8dfb21e
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 2.8534560203552246,
"min": 0.6876733303070068,
"max": 3.2957088947296143,
"count": 977
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 49399.03125,
"min": 9473.9580078125,
"max": 119219.5546875,
"count": 977
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 999.0,
"min": 383.9230769230769,
"max": 999.0,
"count": 977
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19980.0,
"min": 15568.0,
"max": 24904.0,
"count": 977
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1165.607650045886,
"min": 1163.1255753867908,
"max": 1200.4353352507048,
"count": 151
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 2331.215300091772,
"min": 2326.2511507735817,
"max": 21251.307919762614,
"count": 151
},
"SoccerTwos.Step.mean": {
"value": 9769694.0,
"min": 9070.0,
"max": 9769694.0,
"count": 977
},
"SoccerTwos.Step.sum": {
"value": 9769694.0,
"min": 9070.0,
"max": 9769694.0,
"count": 977
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.0018585395300760865,
"min": -0.02852208912372589,
"max": 0.03621601313352585,
"count": 977
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 0.01858539506793022,
"min": -0.38130223751068115,
"max": 0.5431860685348511,
"count": 977
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.0019360113656148314,
"min": -0.03305850178003311,
"max": 0.03623698651790619,
"count": 977
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 0.019360113888978958,
"min": -0.36394256353378296,
"max": 0.5434552431106567,
"count": 977
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 977
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 977
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.0,
"min": -0.5333333333333333,
"max": 0.32597143203020096,
"count": 977
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 0.0,
"min": -8.831599980592728,
"max": 4.563600048422813,
"count": 977
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.0,
"min": -0.5333333333333333,
"max": 0.32597143203020096,
"count": 977
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 0.0,
"min": -8.831599980592728,
"max": 4.563600048422813,
"count": 977
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 977
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 977
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01617720452947348,
"min": 0.009041061301347023,
"max": 0.023895814525894822,
"count": 447
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01617720452947348,
"min": 0.009041061301347023,
"max": 0.023895814525894822,
"count": 447
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 4.3075555424820775e-07,
"min": 3.796161938037409e-11,
"max": 0.007123635763612886,
"count": 447
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 4.3075555424820775e-07,
"min": 3.796161938037409e-11,
"max": 0.007123635763612886,
"count": 447
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 3.827969493386263e-07,
"min": 5.499825155482381e-11,
"max": 0.006830077370007833,
"count": 447
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 3.827969493386263e-07,
"min": 5.499825155482381e-11,
"max": 0.006830077370007833,
"count": 447
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 447
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 447
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 447
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 447
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 447
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 447
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1682399581",
"python_version": "3.8.12 | packaged by conda-forge | (default, Sep 29 2021, 19:50:30) \n[GCC 9.4.0]",
"command_line_arguments": "/home/jason/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --resume",
"mlagents_version": "0.29.0.dev0",
"mlagents_envs_version": "0.29.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.0",
"numpy_version": "1.23.0",
"end_time_seconds": "1682440720"
},
"total": 41139.5746951662,
"count": 1,
"self": 0.0036629438400268555,
"children": {
"run_training.setup": {
"total": 0.018018901348114014,
"count": 1,
"self": 0.018018901348114014
},
"TrainerController.start_learning": {
"total": 41139.55301332101,
"count": 1,
"self": 10.091750759631395,
"children": {
"TrainerController._reset_env": {
"total": 6.643025405704975,
"count": 49,
"self": 6.643025405704975
},
"TrainerController.advance": {
"total": 41122.42403576523,
"count": 635792,
"self": 10.281007185578346,
"children": {
"env_step": {
"total": 38821.82201176509,
"count": 635792,
"self": 36708.06962808967,
"children": {
"SubprocessEnvManager._take_step": {
"total": 2107.2789623625576,
"count": 635792,
"self": 54.651243790984154,
"children": {
"TorchPolicy.evaluate": {
"total": 2052.6277185715735,
"count": 1263618,
"self": 444.1418619453907,
"children": {
"TorchPolicy.sample_actions": {
"total": 1608.4858566261828,
"count": 1263618,
"self": 1608.4858566261828
}
}
}
}
},
"workers": {
"total": 6.473421312868595,
"count": 635792,
"self": 0.0,
"children": {
"worker_root": {
"total": 41122.94743762538,
"count": 635792,
"is_parallel": true,
"self": 5543.7823835499585,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0022903084754943848,
"count": 2,
"is_parallel": true,
"self": 0.00048452243208885193,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0018057860434055328,
"count": 8,
"is_parallel": true,
"self": 0.0018057860434055328
}
}
},
"UnityEnvironment.step": {
"total": 0.06328035518527031,
"count": 1,
"is_parallel": true,
"self": 0.00015142560005187988,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0015549026429653168,
"count": 1,
"is_parallel": true,
"self": 0.0015549026429653168
},
"communicator.exchange": {
"total": 0.059748053550720215,
"count": 1,
"is_parallel": true,
"self": 0.059748053550720215
},
"steps_from_proto": {
"total": 0.001825973391532898,
"count": 2,
"is_parallel": true,
"self": 0.0003262721002101898,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014997012913227081,
"count": 8,
"is_parallel": true,
"self": 0.0014997012913227081
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 35579.07395424321,
"count": 635791,
"is_parallel": true,
"self": 98.12249110639095,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 805.0765328742564,
"count": 635791,
"is_parallel": true,
"self": 805.0765328742564
},
"communicator.exchange": {
"total": 33494.981812007725,
"count": 635791,
"is_parallel": true,
"self": 33494.981812007725
},
"steps_from_proto": {
"total": 1180.8931182548404,
"count": 1271582,
"is_parallel": true,
"self": 197.63392517343163,
"children": {
"_process_rank_one_or_two_observation": {
"total": 983.2591930814087,
"count": 5086328,
"is_parallel": true,
"self": 983.2591930814087
}
}
}
}
},
"steps_from_proto": {
"total": 0.09109983220696449,
"count": 96,
"is_parallel": true,
"self": 0.015366911888122559,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.07573292031884193,
"count": 384,
"is_parallel": true,
"self": 0.07573292031884193
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2290.3210168145597,
"count": 635792,
"self": 69.18487022817135,
"children": {
"process_trajectory": {
"total": 697.5770987719297,
"count": 635792,
"self": 690.940976947546,
"children": {
"RLTrainer._checkpoint": {
"total": 6.636121824383736,
"count": 19,
"self": 6.636121824383736
}
}
},
"_update_policy": {
"total": 1523.5590478144586,
"count": 448,
"self": 751.0578964203596,
"children": {
"TorchPOCAOptimizer.update": {
"total": 772.501151394099,
"count": 13420,
"self": 772.501151394099
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.350478649139404e-07,
"count": 1,
"self": 9.350478649139404e-07
},
"TrainerController._save_models": {
"total": 0.3942004553973675,
"count": 1,
"self": 0.0013845190405845642,
"children": {
"RLTrainer._checkpoint": {
"total": 0.3928159363567829,
"count": 1,
"self": 0.3928159363567829
}
}
}
}
}
}
}