| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.216837540268898, |
| "min": 0.216837540268898, |
| "max": 1.1439133882522583, |
| "count": 47 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 6591.861328125, |
| "min": 1884.1458740234375, |
| "max": 34317.40234375, |
| "count": 47 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 47 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 47 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 1499974.0, |
| "min": 149892.0, |
| "max": 1499974.0, |
| "count": 46 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 1499974.0, |
| "min": 149892.0, |
| "max": 1499974.0, |
| "count": 46 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.5635429620742798, |
| "min": -0.1073768362402916, |
| "max": 0.623300313949585, |
| "count": 46 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 160.6097412109375, |
| "min": -25.98519515991211, |
| "max": 177.64059448242188, |
| "count": 46 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": -0.0032277165446430445, |
| "min": -0.05295085161924362, |
| "max": 0.07620299607515335, |
| "count": 46 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": -0.9198992252349854, |
| "min": -14.08492660522461, |
| "max": 18.060110092163086, |
| "count": 46 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06717732886456708, |
| "min": 0.06439270613191184, |
| "max": 0.0735065735864949, |
| "count": 46 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.940482604103939, |
| "min": 0.583830917285167, |
| "max": 1.067276163356534, |
| "count": 46 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.01711601288081424, |
| "min": 0.0011009482281105403, |
| "max": 0.018873407717587217, |
| "count": 46 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.23962418033139937, |
| "min": 0.015413275193547564, |
| "max": 0.28310111576380825, |
| "count": 46 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 2.8645276166190494e-06, |
| "min": 2.8645276166190494e-06, |
| "max": 0.000272566884144375, |
| "count": 46 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 4.010338663266669e-05, |
| "min": 4.010338663266669e-05, |
| "max": 0.003569852210049334, |
| "count": 46 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10095480952380953, |
| "min": 0.10095480952380953, |
| "max": 0.19085562500000003, |
| "count": 46 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4133673333333334, |
| "min": 1.4133673333333334, |
| "max": 2.5899506666666667, |
| "count": 46 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.00010538547142857148, |
| "min": 0.00010538547142857148, |
| "max": 0.009086476937499999, |
| "count": 46 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.0014753966000000008, |
| "min": 0.0014753966000000008, |
| "max": 0.1190160716, |
| "count": 46 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.007281546946614981, |
| "min": 0.006628350354731083, |
| "max": 0.061615318059921265, |
| "count": 46 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.10194166004657745, |
| "min": 0.0965542420744896, |
| "max": 0.6112106442451477, |
| "count": 46 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 322.6326530612245, |
| "min": 288.4271844660194, |
| "max": 987.3333333333334, |
| "count": 46 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 31618.0, |
| "min": 16326.0, |
| "max": 33523.0, |
| "count": 46 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.5957163070537606, |
| "min": -0.854693383226792, |
| "max": 1.6708420864061306, |
| "count": 46 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 156.38019809126854, |
| "min": -27.840401589870453, |
| "max": 170.28999785333872, |
| "count": 46 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.5957163070537606, |
| "min": -0.854693383226792, |
| "max": 1.6708420864061306, |
| "count": 46 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 156.38019809126854, |
| "min": -27.840401589870453, |
| "max": 170.28999785333872, |
| "count": 46 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.023973165170158312, |
| "min": 0.022124219301162828, |
| "max": 0.6562520817798727, |
| "count": 46 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 2.3493701866755146, |
| "min": 1.954352687112987, |
| "max": 18.973405182361603, |
| "count": 46 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1687291235", |
| "python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", |
| "mlagents_version": "0.31.0.dev0", |
| "mlagents_envs_version": "0.31.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "1.11.0+cu102", |
| "numpy_version": "1.21.2", |
| "end_time_seconds": "1687294292" |
| }, |
| "total": 3056.8792389049995, |
| "count": 1, |
| "self": 0.7496070949996465, |
| "children": { |
| "run_training.setup": { |
| "total": 0.03848574799985727, |
| "count": 1, |
| "self": 0.03848574799985727 |
| }, |
| "TrainerController.start_learning": { |
| "total": 3056.091146062, |
| "count": 1, |
| "self": 1.6334947169725638, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 3.9540592440000637, |
| "count": 1, |
| "self": 3.9540592440000637 |
| }, |
| "TrainerController.advance": { |
| "total": 3050.414175517027, |
| "count": 88556, |
| "self": 1.6999190719966464, |
| "children": { |
| "env_step": { |
| "total": 2206.4400515949983, |
| "count": 88556, |
| "self": 2065.3934808430704, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 140.0602751009783, |
| "count": 88556, |
| "self": 6.13563863390732, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 133.92463646707097, |
| "count": 86323, |
| "self": 133.92463646707097 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.9862956509496144, |
| "count": 88556, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 3049.710723735973, |
| "count": 88556, |
| "is_parallel": true, |
| "self": 1130.1138591509684, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0027872109999407257, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0008003440002539719, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.001986866999686754, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.001986866999686754 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.04545206300008431, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005375059997732023, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.000490628000079596, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.000490628000079596 |
| }, |
| "communicator.exchange": { |
| "total": 0.04279957100015963, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.04279957100015963 |
| }, |
| "steps_from_proto": { |
| "total": 0.0016243580000718794, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.000359045000095648, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0012653129999762314, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0012653129999762314 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1919.5968645850044, |
| "count": 88555, |
| "is_parallel": true, |
| "self": 43.92660406803998, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 29.931304289943682, |
| "count": 88555, |
| "is_parallel": true, |
| "self": 29.931304289943682 |
| }, |
| "communicator.exchange": { |
| "total": 1712.2299676670234, |
| "count": 88555, |
| "is_parallel": true, |
| "self": 1712.2299676670234 |
| }, |
| "steps_from_proto": { |
| "total": 133.5089885599973, |
| "count": 88555, |
| "is_parallel": true, |
| "self": 25.7646578750755, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 107.7443306849218, |
| "count": 708440, |
| "is_parallel": true, |
| "self": 107.7443306849218 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 842.2742048500322, |
| "count": 88556, |
| "self": 3.339937450038633, |
| "children": { |
| "process_trajectory": { |
| "total": 143.5362954599873, |
| "count": 88556, |
| "self": 143.24071930098762, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.2955761589996655, |
| "count": 3, |
| "self": 0.2955761589996655 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 695.3979719400063, |
| "count": 640, |
| "self": 443.9013471990788, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 251.49662474092747, |
| "count": 31458, |
| "self": 251.49662474092747 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.145000169344712e-06, |
| "count": 1, |
| "self": 1.145000169344712e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.08941543899982207, |
| "count": 1, |
| "self": 0.0016526210001757136, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.08776281799964636, |
| "count": 1, |
| "self": 0.08776281799964636 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |