| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.20883840322494507, | |
| "min": 0.19934269785881042, | |
| "max": 1.4834659099578857, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 6305.2490234375, | |
| "min": 5968.60498046875, | |
| "max": 45002.421875, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 2999875.0, | |
| "min": 29952.0, | |
| "max": 2999875.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 2999875.0, | |
| "min": 29952.0, | |
| "max": 2999875.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.798509418964386, | |
| "min": -0.08498506247997284, | |
| "max": 0.8286927938461304, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 242.7468719482422, | |
| "min": -20.56638526916504, | |
| "max": 249.4365234375, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.00782564003020525, | |
| "min": -0.02389027550816536, | |
| "max": 0.3482888638973236, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 2.3789947032928467, | |
| "min": -6.2114715576171875, | |
| "max": 83.58932495117188, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.0685256353345245, | |
| "min": 0.06373710363663525, | |
| "max": 0.07483905499980742, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9593588946833431, | |
| "min": 0.48028539652994195, | |
| "max": 1.1069516701362434, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.015294011145929936, | |
| "min": 0.000883022911804011, | |
| "max": 0.016372764399125182, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.21411615604301912, | |
| "min": 0.010596274941648132, | |
| "max": 0.233787051406027, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 1.506463783592856e-06, | |
| "min": 1.506463783592856e-06, | |
| "max": 0.00029838354339596195, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 2.1090492970299984e-05, | |
| "min": 2.1090492970299984e-05, | |
| "max": 0.004072358742547132, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10050212142857143, | |
| "min": 0.10050212142857143, | |
| "max": 0.19946118095238097, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4070297, | |
| "min": 1.3897045333333333, | |
| "max": 2.8574528666666668, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 6.016193071428568e-05, | |
| "min": 6.016193071428568e-05, | |
| "max": 0.009946171977142856, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0008422670299999995, | |
| "min": 0.0008422670299999995, | |
| "max": 0.13575954138, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.004812297411262989, | |
| "min": 0.004657533951103687, | |
| "max": 0.5557369589805603, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.067372165620327, | |
| "min": 0.06520547717809677, | |
| "max": 3.8901588916778564, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 249.46031746031747, | |
| "min": 213.3014705882353, | |
| "max": 999.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 31432.0, | |
| "min": 15984.0, | |
| "max": 32312.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.7187904574804835, | |
| "min": -1.0000000521540642, | |
| "max": 1.7798248023664864, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 216.56759764254093, | |
| "min": -32.000001668930054, | |
| "max": 243.83599792420864, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.7187904574804835, | |
| "min": -1.0000000521540642, | |
| "max": 1.7798248023664864, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 216.56759764254093, | |
| "min": -32.000001668930054, | |
| "max": 243.83599792420864, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.012556998638342882, | |
| "min": 0.010937422458509365, | |
| "max": 12.201441258192062, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 1.582181828431203, | |
| "min": 1.426591651084891, | |
| "max": 195.223060131073, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1699953005", | |
| "python_version": "3.10.3 (main, Mar 28 2022, 09:30:03) [GCC 7.5.0]", | |
| "command_line_arguments": "/home/yzeng/anaconda3/envs/deeprl_course_unit5/bin/mlagents-learn ../config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --force", | |
| "mlagents_version": "1.1.0.dev0", | |
| "mlagents_envs_version": "1.1.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.1.0+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1699956693" | |
| }, | |
| "total": 3688.2422509463504, | |
| "count": 1, | |
| "self": 0.3199370610527694, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.01085307402536273, | |
| "count": 1, | |
| "self": 0.01085307402536273 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 3687.9114608112723, | |
| "count": 1, | |
| "self": 3.372778186108917, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 0.8616877705790102, | |
| "count": 1, | |
| "self": 0.8616877705790102 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 3683.61380162742, | |
| "count": 194507, | |
| "self": 3.364317771513015, | |
| "children": { | |
| "env_step": { | |
| "total": 2322.2837941045873, | |
| "count": 194507, | |
| "self": 2124.274842475541, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 195.91820556716993, | |
| "count": 194507, | |
| "self": 9.23077730787918, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 186.68742825929075, | |
| "count": 187562, | |
| "self": 186.68742825929075 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 2.090746061876416, | |
| "count": 194507, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 3683.273943124339, | |
| "count": 194507, | |
| "is_parallel": true, | |
| "self": 1784.8197832303122, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0012163030914962292, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003676139749586582, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.000848689116537571, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.000848689116537571 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.023782378993928432, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00025271298363804817, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.00029502203688025475, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00029502203688025475 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.02243240363895893, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.02243240363895893 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0008022403344511986, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0001949523575603962, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0006072879768908024, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0006072879768908024 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1898.4541598940268, | |
| "count": 194506, | |
| "is_parallel": true, | |
| "self": 53.04335350031033, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 39.29772320250049, | |
| "count": 194506, | |
| "is_parallel": true, | |
| "self": 39.29772320250049 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1648.587595764082, | |
| "count": 194506, | |
| "is_parallel": true, | |
| "self": 1648.587595764082 | |
| }, | |
| "steps_from_proto": { | |
| "total": 157.52548742713407, | |
| "count": 194506, | |
| "is_parallel": true, | |
| "self": 36.79078872175887, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 120.7346987053752, | |
| "count": 1556048, | |
| "is_parallel": true, | |
| "self": 120.7346987053752 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 1357.9656897513196, | |
| "count": 194507, | |
| "self": 6.280239996500313, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 229.36559143615887, | |
| "count": 194507, | |
| "self": 228.95419924287125, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.411392193287611, | |
| "count": 6, | |
| "self": 0.411392193287611 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 1122.3198583186604, | |
| "count": 1396, | |
| "self": 592.612791213207, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 529.7070671054535, | |
| "count": 68406, | |
| "self": 529.7070671054535 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.122304618358612e-07, | |
| "count": 1, | |
| "self": 9.122304618358612e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.06319231493398547, | |
| "count": 1, | |
| "self": 0.0008483538404107094, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.06234396109357476, | |
| "count": 1, | |
| "self": 0.06234396109357476 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |