| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.3530730605125427, | |
| "min": 0.3530730605125427, | |
| "max": 0.46950677037239075, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 10659.9814453125, | |
| "min": 4740.1953125, | |
| "max": 14084.595703125, | |
| "count": 9 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989946.0, | |
| "min": 749959.0, | |
| "max": 989946.0, | |
| "count": 9 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989946.0, | |
| "min": 749959.0, | |
| "max": 989946.0, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.5460996031761169, | |
| "min": 0.40090814232826233, | |
| "max": 0.5610513687133789, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 149.63128662109375, | |
| "min": 33.67628479003906, | |
| "max": 156.5333251953125, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.045362599194049835, | |
| "min": 0.012379592284560204, | |
| "max": 0.07051504403352737, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 12.429351806640625, | |
| "min": 1.9520580768585205, | |
| "max": 19.109577178955078, | |
| "count": 9 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 345.45348837209303, | |
| "min": 307.25, | |
| "max": 409.0945945945946, | |
| "count": 9 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29709.0, | |
| "min": 4916.0, | |
| "max": 31830.0, | |
| "count": 9 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.5875310096247444, | |
| "min": 1.4286972741420205, | |
| "max": 1.6927499761804938, | |
| "count": 9 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 138.11519783735275, | |
| "min": 27.0839996188879, | |
| "max": 138.11519783735275, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.5875310096247444, | |
| "min": 1.4286972741420205, | |
| "max": 1.6927499761804938, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 138.11519783735275, | |
| "min": 27.0839996188879, | |
| "max": 138.11519783735275, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.14356546166176298, | |
| "min": 0.13462204318784643, | |
| "max": 0.18721644777393429, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 12.490195164573379, | |
| "min": 2.153952691005543, | |
| "max": 14.602882926366874, | |
| "count": 9 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.07097199595903482, | |
| "min": 0.06525425311701837, | |
| "max": 0.0711059946500297, | |
| "count": 9 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 1.0645799393855222, | |
| "min": 0.2808688572840765, | |
| "max": 1.0645799393855222, | |
| "count": 9 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.015733428199389752, | |
| "min": 0.01045725111180218, | |
| "max": 0.01587640412894654, | |
| "count": 9 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.23600142299084625, | |
| "min": 0.04182900444720872, | |
| "max": 0.23600142299084625, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.504177498640001e-06, | |
| "min": 7.504177498640001e-06, | |
| "max": 7.635472454845e-05, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00011256266247960001, | |
| "min": 0.00011256266247960001, | |
| "max": 0.0009891802702735996, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10250136000000001, | |
| "min": 0.10250136000000001, | |
| "max": 0.12545155, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.5375204000000002, | |
| "min": 0.5018062, | |
| "max": 1.8071838, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.000259885864, | |
| "min": 0.000259885864, | |
| "max": 0.0025526098450000005, | |
| "count": 9 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0038982879600000008, | |
| "min": 0.0038982879600000008, | |
| "max": 0.033079667359999995, | |
| "count": 9 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.04081549867987633, | |
| "min": 0.037990253418684006, | |
| "max": 0.04739264398813248, | |
| "count": 9 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.612232506275177, | |
| "min": 0.1895705759525299, | |
| "max": 0.6411277651786804, | |
| "count": 9 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 9 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 9 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1710504483", | |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", | |
| "mlagents_version": "1.1.0.dev0", | |
| "mlagents_envs_version": "1.1.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.2.1+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1710505447" | |
| }, | |
| "total": 964.5452561530001, | |
| "count": 1, | |
| "self": 0.635988392001309, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.06488856899886741, | |
| "count": 1, | |
| "self": 0.06488856899886741 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 963.8443791919999, | |
| "count": 1, | |
| "self": 0.6310442308713391, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.531344381000963, | |
| "count": 1, | |
| "self": 2.531344381000963 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 960.5842301901284, | |
| "count": 16864, | |
| "self": 0.7213993190562178, | |
| "children": { | |
| "env_step": { | |
| "total": 677.6088358761117, | |
| "count": 16864, | |
| "self": 634.639690495027, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 42.58553765205943, | |
| "count": 16864, | |
| "self": 1.8989050834279624, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 40.68663256863147, | |
| "count": 16296, | |
| "self": 40.68663256863147 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.3836077290252433, | |
| "count": 16864, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 961.8012726820816, | |
| "count": 16864, | |
| "is_parallel": true, | |
| "self": 377.5782632592345, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.002364474999922095, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0007095239961927291, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0016549510037293658, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0016549510037293658 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.06431216400233097, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0008240879978984594, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005248840025160462, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005248840025160462 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.06087844099965878, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.06087844099965878 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.00208475100225769, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005133920058142394, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0015713589964434505, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0015713589964434505 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 584.2230094228471, | |
| "count": 16863, | |
| "is_parallel": true, | |
| "self": 14.070101552333654, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 7.60006464601247, | |
| "count": 16863, | |
| "is_parallel": true, | |
| "self": 7.60006464601247 | |
| }, | |
| "communicator.exchange": { | |
| "total": 526.3479403123783, | |
| "count": 16863, | |
| "is_parallel": true, | |
| "self": 526.3479403123783 | |
| }, | |
| "steps_from_proto": { | |
| "total": 36.204902912122634, | |
| "count": 16863, | |
| "is_parallel": true, | |
| "self": 7.864703232127795, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 28.34019967999484, | |
| "count": 134904, | |
| "is_parallel": true, | |
| "self": 28.34019967999484 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 282.2539949949605, | |
| "count": 16864, | |
| "self": 1.3100764917071501, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 44.93210952625668, | |
| "count": 16864, | |
| "self": 44.81748620525468, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.11462332100200001, | |
| "count": 1, | |
| "self": 0.11462332100200001 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 236.0118089769967, | |
| "count": 122, | |
| "self": 95.06718214407738, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 140.9446268329193, | |
| "count": 5871, | |
| "self": 140.9446268329193 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.469986252952367e-07, | |
| "count": 1, | |
| "self": 9.469986252952367e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.09775944300054107, | |
| "count": 1, | |
| "self": 0.002824500999849988, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.09493494200069108, | |
| "count": 1, | |
| "self": 0.09493494200069108 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |