| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.5159269571304321, | |
| "min": 0.5129492878913879, | |
| "max": 1.448936939239502, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 15477.80859375, | |
| "min": 15232.5419921875, | |
| "max": 43954.94921875, | |
| "count": 23 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 689998.0, | |
| "min": 29996.0, | |
| "max": 689998.0, | |
| "count": 23 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 689998.0, | |
| "min": 29996.0, | |
| "max": 689998.0, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.44156432151794434, | |
| "min": -0.0628989040851593, | |
| "max": 0.47608819603919983, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 117.89767456054688, | |
| "min": -15.158636093139648, | |
| "max": 129.0198974609375, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": -0.03201933205127716, | |
| "min": -0.0577508769929409, | |
| "max": 0.3878459632396698, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": -8.549161911010742, | |
| "min": -15.592737197875977, | |
| "max": 92.30734252929688, | |
| "count": 23 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06585418448126543, | |
| "min": 0.06469609509942875, | |
| "max": 0.07125436491927928, | |
| "count": 23 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9219585827377159, | |
| "min": 0.49878055443495495, | |
| "max": 1.0394744463578807, | |
| "count": 23 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.01466034116899772, | |
| "min": 0.0010189180087605602, | |
| "max": 0.016069453655550854, | |
| "count": 23 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.20524477636596808, | |
| "min": 0.013245934113887282, | |
| "max": 0.22497235117771197, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 1.0952851451122447e-05, | |
| "min": 1.0952851451122447e-05, | |
| "max": 0.0002931950226764897, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00015333992031571427, | |
| "min": 0.00015333992031571427, | |
| "max": 0.003484989138337, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10365091836734694, | |
| "min": 0.10365091836734694, | |
| "max": 0.19773167346938775, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.451112857142857, | |
| "min": 1.3841217142857143, | |
| "max": 2.5318924285714286, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00037472674489795916, | |
| "min": 0.00037472674489795916, | |
| "max": 0.009773394179591836, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0052461744285714285, | |
| "min": 0.0052461744285714285, | |
| "max": 0.11618013370000001, | |
| "count": 23 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.01385729480534792, | |
| "min": 0.01385729480534792, | |
| "max": 0.46793070435523987, | |
| "count": 23 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.19400212168693542, | |
| "min": 0.19400212168693542, | |
| "max": 3.275514841079712, | |
| "count": 23 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 418.07042253521126, | |
| "min": 388.71794871794873, | |
| "max": 980.4117647058823, | |
| "count": 23 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29683.0, | |
| "min": 16667.0, | |
| "max": 34018.0, | |
| "count": 23 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.3565182829616775, | |
| "min": -0.8637059322174858, | |
| "max": 1.5475211074234734, | |
| "count": 23 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 96.3127980902791, | |
| "min": -28.119801722466946, | |
| "max": 117.67699871957302, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.3565182829616775, | |
| "min": -0.8637059322174858, | |
| "max": 1.5475211074234734, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 96.3127980902791, | |
| "min": -28.119801722466946, | |
| "max": 117.67699871957302, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.060279124154271495, | |
| "min": 0.05957469614825218, | |
| "max": 9.228095879449564, | |
| "count": 23 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 4.279817814953276, | |
| "min": 4.229803426525905, | |
| "max": 156.87762995064259, | |
| "count": 23 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 23 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 23 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1719674461", | |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training1 --no-graphics", | |
| "mlagents_version": "1.1.0.dev0", | |
| "mlagents_envs_version": "1.1.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.3.0+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1719676062" | |
| }, | |
| "total": 1600.8617605089999, | |
| "count": 1, | |
| "self": 0.4436223229997722, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.08845487799999319, | |
| "count": 1, | |
| "self": 0.08845487799999319 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 1600.329683308, | |
| "count": 1, | |
| "self": 1.1158604610075145, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 3.7024018749998504, | |
| "count": 1, | |
| "self": 3.7024018749998504 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 1595.4237527419932, | |
| "count": 44597, | |
| "self": 1.1494493289567345, | |
| "children": { | |
| "env_step": { | |
| "total": 1138.7097346640203, | |
| "count": 44597, | |
| "self": 1035.230790629002, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 102.78661415901774, | |
| "count": 44597, | |
| "self": 3.440552423020563, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 99.34606173599718, | |
| "count": 43803, | |
| "self": 99.34606173599718 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.6923298760004855, | |
| "count": 44597, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 1596.4229978130404, | |
| "count": 44597, | |
| "is_parallel": true, | |
| "self": 654.8639752220511, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.015612085000157094, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.004930926000042746, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.010681159000114349, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.010681159000114349 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.046516110000084154, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006918040000982728, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004822470000362955, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004822470000362955 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.043688985000017055, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.043688985000017055 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0016530739999325306, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.000369832999922437, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012832410000100936, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012832410000100936 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 941.5590225909893, | |
| "count": 44596, | |
| "is_parallel": true, | |
| "self": 25.116252618046474, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 16.57159033200537, | |
| "count": 44596, | |
| "is_parallel": true, | |
| "self": 16.57159033200537 | |
| }, | |
| "communicator.exchange": { | |
| "total": 829.7306253509655, | |
| "count": 44596, | |
| "is_parallel": true, | |
| "self": 829.7306253509655 | |
| }, | |
| "steps_from_proto": { | |
| "total": 70.14055428997199, | |
| "count": 44596, | |
| "is_parallel": true, | |
| "self": 14.835980148910494, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 55.304574141061494, | |
| "count": 356768, | |
| "is_parallel": true, | |
| "self": 55.304574141061494 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 455.5645687490162, | |
| "count": 44597, | |
| "self": 2.199988050052525, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 90.09018176896029, | |
| "count": 44597, | |
| "self": 89.90162720396052, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.18855456499977663, | |
| "count": 1, | |
| "self": 0.18855456499977663 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 363.2743989300034, | |
| "count": 318, | |
| "self": 216.69494764799947, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 146.5794512820039, | |
| "count": 15948, | |
| "self": 146.5794512820039 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.7599968285067e-07, | |
| "count": 1, | |
| "self": 9.7599968285067e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.08766725399982533, | |
| "count": 1, | |
| "self": 0.001347486999748071, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.08631976700007726, | |
| "count": 1, | |
| "self": 0.08631976700007726 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |