| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.43269777297973633, | |
| "min": 0.43269777297973633, | |
| "max": 1.371383786201477, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 13181.705078125, | |
| "min": 13181.705078125, | |
| "max": 41602.296875, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989964.0, | |
| "min": 29952.0, | |
| "max": 989964.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989964.0, | |
| "min": 29952.0, | |
| "max": 989964.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.5644271969795227, | |
| "min": -0.08764486759901047, | |
| "max": 0.5962366461753845, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 156.9107666015625, | |
| "min": -21.210058212280273, | |
| "max": 167.54249572753906, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.024280712008476257, | |
| "min": -0.025254247710108757, | |
| "max": 0.7589455246925354, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 6.750038146972656, | |
| "min": -6.919663906097412, | |
| "max": 179.87008666992188, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.07187978142645167, | |
| "min": 0.06446054169208044, | |
| "max": 0.07276190655461871, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 1.0063169399703233, | |
| "min": 0.509333345882331, | |
| "max": 1.0538843020028663, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.017543129561610322, | |
| "min": 0.00027802690595879037, | |
| "max": 0.01829602527695464, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.24560381386254448, | |
| "min": 0.0038923766834230654, | |
| "max": 0.25614435387736495, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.632654598671428e-06, | |
| "min": 7.632654598671428e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.0001068571643814, | |
| "min": 0.0001068571643814, | |
| "max": 0.0034928023357326003, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10254418571428571, | |
| "min": 0.10254418571428571, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4356186, | |
| "min": 1.3886848, | |
| "max": 2.527412000000001, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00026416415285714285, | |
| "min": 0.00026416415285714285, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.00369829814, | |
| "min": 0.00369829814, | |
| "max": 0.11644031326000001, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.014289124868810177, | |
| "min": 0.014289124868810177, | |
| "max": 0.696894109249115, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.20004774630069733, | |
| "min": 0.20004774630069733, | |
| "max": 4.87825870513916, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 334.3804347826087, | |
| "min": 303.8019801980198, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 30763.0, | |
| "min": 15984.0, | |
| "max": 32757.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.6438782430537369, | |
| "min": -1.0000000521540642, | |
| "max": 1.6538845163952445, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 151.2367983609438, | |
| "min": -30.77900169789791, | |
| "max": 165.31419833749533, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.6438782430537369, | |
| "min": -1.0000000521540642, | |
| "max": 1.6538845163952445, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 151.2367983609438, | |
| "min": -30.77900169789791, | |
| "max": 165.31419833749533, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.04913479718253138, | |
| "min": 0.04577270215473224, | |
| "max": 14.993331799283624, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 4.520401340792887, | |
| "min": 4.379859752638367, | |
| "max": 239.89330878853798, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1703984879", | |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.1.0.dev0", | |
| "mlagents_envs_version": "1.1.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.1.2+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1703987082" | |
| }, | |
| "total": 2203.7050966410006, | |
| "count": 1, | |
| "self": 0.9287682379999751, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.07198636900011479, | |
| "count": 1, | |
| "self": 0.07198636900011479 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2202.7043420340005, | |
| "count": 1, | |
| "self": 1.28955770093944, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.2628496709999126, | |
| "count": 1, | |
| "self": 2.2628496709999126 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2199.0324727370603, | |
| "count": 63795, | |
| "self": 1.3718093688648878, | |
| "children": { | |
| "env_step": { | |
| "total": 1565.677520177051, | |
| "count": 63795, | |
| "self": 1438.9510552421903, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 125.93731404285018, | |
| "count": 63795, | |
| "self": 4.561828710750888, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 121.37548533209929, | |
| "count": 62564, | |
| "self": 121.37548533209929 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.7891508920106389, | |
| "count": 63795, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2197.7586115720565, | |
| "count": 63795, | |
| "is_parallel": true, | |
| "self": 875.5834830330823, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0017043299999386363, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005121619997225935, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0011921680002160429, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0011921680002160429 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.05379153800004133, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006080959997234459, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005412160003288591, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005412160003288591 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.05098719900024662, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.05098719900024662 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0016550269997424039, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003480849991319701, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013069420006104338, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013069420006104338 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1322.1751285389741, | |
| "count": 63794, | |
| "is_parallel": true, | |
| "self": 34.914668810930834, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 24.189073132123667, | |
| "count": 63794, | |
| "is_parallel": true, | |
| "self": 24.189073132123667 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1165.3040251779203, | |
| "count": 63794, | |
| "is_parallel": true, | |
| "self": 1165.3040251779203 | |
| }, | |
| "steps_from_proto": { | |
| "total": 97.76736141799938, | |
| "count": 63794, | |
| "is_parallel": true, | |
| "self": 19.252387028197973, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 78.51497438980141, | |
| "count": 510352, | |
| "is_parallel": true, | |
| "self": 78.51497438980141 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 631.9831431911443, | |
| "count": 63795, | |
| "self": 2.470314573151427, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 125.1846878289939, | |
| "count": 63795, | |
| "self": 124.96146760299371, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.2232202260001941, | |
| "count": 2, | |
| "self": 0.2232202260001941 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 504.328140788999, | |
| "count": 452, | |
| "self": 299.1198332430454, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 205.20830754595363, | |
| "count": 22842, | |
| "self": 205.20830754595363 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.184000211651437e-06, | |
| "count": 1, | |
| "self": 1.184000211651437e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.11946074100069382, | |
| "count": 1, | |
| "self": 0.002035024001088459, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.11742571699960536, | |
| "count": 1, | |
| "self": 0.11742571699960536 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |