| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.5890570878982544, | |
| "min": 0.5806085467338562, | |
| "max": 1.4019008874893188, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 17558.61328125, | |
| "min": 17511.154296875, | |
| "max": 42528.06640625, | |
| "count": 30 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 899917.0, | |
| "min": 29930.0, | |
| "max": 899917.0, | |
| "count": 30 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 899917.0, | |
| "min": 29930.0, | |
| "max": 899917.0, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.3437330424785614, | |
| "min": -0.1108439713716507, | |
| "max": 0.35709699988365173, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 89.02685546875, | |
| "min": -26.270021438598633, | |
| "max": 94.27360534667969, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.015149506740272045, | |
| "min": 0.015149506740272045, | |
| "max": 0.38376158475875854, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 3.923722267150879, | |
| "min": 3.7801356315612793, | |
| "max": 92.48654174804688, | |
| "count": 30 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06951294143477248, | |
| "min": 0.06556993023151954, | |
| "max": 0.07337778122950193, | |
| "count": 30 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 1.0426941215215872, | |
| "min": 0.5095945363242083, | |
| "max": 1.0585052202804945, | |
| "count": 30 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.011598017428993258, | |
| "min": 0.00011223956655982646, | |
| "max": 0.01402242299586416, | |
| "count": 30 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.17397026143489888, | |
| "min": 0.0014591143652777439, | |
| "max": 0.19631392194209824, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 0.00021150075616642447, | |
| "min": 0.00021150075616642447, | |
| "max": 0.00029838354339596195, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.003172511342496367, | |
| "min": 0.0020886848037717336, | |
| "max": 0.0039690189769937, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.17050024222222224, | |
| "min": 0.17050024222222224, | |
| "max": 0.19946118095238097, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 2.5575036333333334, | |
| "min": 1.3962282666666668, | |
| "max": 2.7824799333333328, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.007052974197999998, | |
| "min": 0.007052974197999998, | |
| "max": 0.009946171977142856, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.10579461296999998, | |
| "min": 0.06962320384, | |
| "max": 0.13230832936999998, | |
| "count": 30 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.01331007108092308, | |
| "min": 0.01331007108092308, | |
| "max": 0.7081205248832703, | |
| "count": 30 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.1996510624885559, | |
| "min": 0.1949319839477539, | |
| "max": 4.956843852996826, | |
| "count": 30 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 499.2105263157895, | |
| "min": 481.1875, | |
| "max": 999.0, | |
| "count": 30 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 28455.0, | |
| "min": 16857.0, | |
| "max": 32992.0, | |
| "count": 30 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.29020698682258, | |
| "min": -0.9999125520698726, | |
| "max": 1.3625155973713845, | |
| "count": 30 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 73.54179824888706, | |
| "min": -31.997201666235924, | |
| "max": 87.20099823176861, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.29020698682258, | |
| "min": -0.9999125520698726, | |
| "max": 1.3625155973713845, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 73.54179824888706, | |
| "min": -31.997201666235924, | |
| "max": 87.20099823176861, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.06815119140185089, | |
| "min": 0.06815119140185089, | |
| "max": 13.717725730994168, | |
| "count": 30 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 3.8846179099055007, | |
| "min": 3.8846179099055007, | |
| "max": 233.20133742690086, | |
| "count": 30 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 30 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 30 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1712527565", | |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.1.0.dev0", | |
| "mlagents_envs_version": "1.1.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.2.1+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1712529491" | |
| }, | |
| "total": 1926.3899368959997, | |
| "count": 1, | |
| "self": 0.38069954899947334, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.08702658400034124, | |
| "count": 1, | |
| "self": 0.08702658400034124 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 1925.9222107629998, | |
| "count": 1, | |
| "self": 1.2907312730385456, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.3211664730001758, | |
| "count": 1, | |
| "self": 2.3211664730001758 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 1922.1589925839608, | |
| "count": 57373, | |
| "self": 1.3277347779026059, | |
| "children": { | |
| "env_step": { | |
| "total": 1351.3449430410437, | |
| "count": 57373, | |
| "self": 1229.0939210409515, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 121.45048265507648, | |
| "count": 57373, | |
| "self": 4.293766252113983, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 117.1567164029625, | |
| "count": 56583, | |
| "self": 117.1567164029625 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.8005393450157499, | |
| "count": 57372, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 1921.4094024200226, | |
| "count": 57372, | |
| "is_parallel": true, | |
| "self": 805.1252596150844, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.002207309999903373, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006673160005448153, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0015399939993585576, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0015399939993585576 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.04839418100027615, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006944440006009245, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004506309996941127, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004506309996941127 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.04533611699980611, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.04533611699980611 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0019129890001750027, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003753570003937057, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.001537631999781297, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.001537631999781297 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1116.2841428049383, | |
| "count": 57371, | |
| "is_parallel": true, | |
| "self": 32.07215328902976, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 21.545949239936363, | |
| "count": 57371, | |
| "is_parallel": true, | |
| "self": 21.545949239936363 | |
| }, | |
| "communicator.exchange": { | |
| "total": 970.6019852459776, | |
| "count": 57371, | |
| "is_parallel": true, | |
| "self": 970.6019852459776 | |
| }, | |
| "steps_from_proto": { | |
| "total": 92.0640550299945, | |
| "count": 57371, | |
| "is_parallel": true, | |
| "self": 18.693467616030375, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 73.37058741396413, | |
| "count": 458968, | |
| "is_parallel": true, | |
| "self": 73.37058741396413 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 569.4863147650144, | |
| "count": 57372, | |
| "self": 2.4730959570388222, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 111.68641964897415, | |
| "count": 57372, | |
| "self": 111.57511701097383, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.1113026380003248, | |
| "count": 1, | |
| "self": 0.1113026380003248 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 455.32679915900144, | |
| "count": 402, | |
| "self": 266.89855077501215, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 188.42824838398928, | |
| "count": 20688, | |
| "self": 188.42824838398928 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.3879998732591048e-06, | |
| "count": 1, | |
| "self": 1.3879998732591048e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.15131904500049131, | |
| "count": 1, | |
| "self": 0.002407309000773239, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.14891173599971808, | |
| "count": 1, | |
| "self": 0.14891173599971808 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |