| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.39161038398742676, | |
| "min": 0.3892679512500763, | |
| "max": 1.4873254299163818, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 9837.2529296875, | |
| "min": 9660.0732421875, | |
| "max": 39027.41796875, | |
| "count": 40 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 999947.0, | |
| "min": 24960.0, | |
| "max": 999947.0, | |
| "count": 40 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 999947.0, | |
| "min": 24960.0, | |
| "max": 999947.0, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.5577706098556519, | |
| "min": -0.10050802677869797, | |
| "max": 0.6519138216972351, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 128.28724670410156, | |
| "min": -20.302621841430664, | |
| "max": 154.50357055664062, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.012868339195847511, | |
| "min": 0.005618416238576174, | |
| "max": 0.4353194832801819, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 2.9597179889678955, | |
| "min": 1.18548583984375, | |
| "max": 86.1932601928711, | |
| "count": 40 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.07048654987496168, | |
| "min": 0.06373778805896614, | |
| "max": 0.07526202773604179, | |
| "count": 40 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.8458385984995402, | |
| "min": 0.3981097612286458, | |
| "max": 0.9031443328325015, | |
| "count": 40 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.015799540449532086, | |
| "min": 0.0018626144759534152, | |
| "max": 0.015799540449532086, | |
| "count": 40 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.18959448539438503, | |
| "min": 0.013386984317590738, | |
| "max": 0.18959448539438503, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 3.6753987749000005e-06, | |
| "min": 3.6753987749000005e-06, | |
| "max": 0.0002957568014144, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 4.4104785298800004e-05, | |
| "min": 4.4104785298800004e-05, | |
| "max": 0.0029269388243538, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.1012251, | |
| "min": 0.1012251, | |
| "max": 0.1985856, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.2147012, | |
| "min": 1.1771136000000002, | |
| "max": 2.1756462, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00013238749, | |
| "min": 0.00013238749, | |
| "max": 0.00985870144, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.00158864988, | |
| "min": 0.00158864988, | |
| "max": 0.09758705538, | |
| "count": 40 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.008755751885473728, | |
| "min": 0.008497790433466434, | |
| "max": 0.5597033500671387, | |
| "count": 40 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.10506902635097504, | |
| "min": 0.09569065272808075, | |
| "max": 3.358220100402832, | |
| "count": 40 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 328.0133333333333, | |
| "min": 296.6024096385542, | |
| "max": 999.0, | |
| "count": 40 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 24601.0, | |
| "min": 15984.0, | |
| "max": 31968.0, | |
| "count": 40 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.5919653083880743, | |
| "min": -1.0000000521540642, | |
| "max": 1.6551903460219681, | |
| "count": 40 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 119.39739812910557, | |
| "min": -32.000001668930054, | |
| "max": 137.38079871982336, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.5919653083880743, | |
| "min": -1.0000000521540642, | |
| "max": 1.6551903460219681, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 119.39739812910557, | |
| "min": -32.000001668930054, | |
| "max": 137.38079871982336, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.029587139872989308, | |
| "min": 0.027370002108606666, | |
| "max": 10.958400049246848, | |
| "count": 40 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 2.219035490474198, | |
| "min": 2.0833714419277385, | |
| "max": 175.33440078794956, | |
| "count": 40 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 40 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 40 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1716730011", | |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids3 --no-graphics", | |
| "mlagents_version": "1.1.0.dev0", | |
| "mlagents_envs_version": "1.1.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.3.0+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1716732293" | |
| }, | |
| "total": 2281.9890105399995, | |
| "count": 1, | |
| "self": 0.48976659899926744, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.05181883299974288, | |
| "count": 1, | |
| "self": 0.05181883299974288 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2281.4474251080005, | |
| "count": 1, | |
| "self": 1.397449222970863, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.4167706079997515, | |
| "count": 1, | |
| "self": 2.4167706079997515 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2277.54545750003, | |
| "count": 63983, | |
| "self": 1.414589613111275, | |
| "children": { | |
| "env_step": { | |
| "total": 1637.3200555290337, | |
| "count": 63983, | |
| "self": 1504.1230797850653, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 132.3463596849656, | |
| "count": 63983, | |
| "self": 4.706007048048832, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 127.64035263691676, | |
| "count": 62552, | |
| "self": 127.64035263691676 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.8506160590027321, | |
| "count": 63983, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2276.1567987270205, | |
| "count": 63983, | |
| "is_parallel": true, | |
| "self": 895.521353034901, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0020543230002658674, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005948570001237385, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.001459466000142129, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.001459466000142129 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.04804656100031934, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006337940008052101, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005115260000820854, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005115260000820854 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.0452873549998003, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0452873549998003 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0016138859996317478, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003391109994481667, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012747750001835811, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012747750001835811 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1380.6354456921194, | |
| "count": 63982, | |
| "is_parallel": true, | |
| "self": 34.525767212177016, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 23.840742276008314, | |
| "count": 63982, | |
| "is_parallel": true, | |
| "self": 23.840742276008314 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1223.704609926931, | |
| "count": 63982, | |
| "is_parallel": true, | |
| "self": 1223.704609926931 | |
| }, | |
| "steps_from_proto": { | |
| "total": 98.56432627700315, | |
| "count": 63982, | |
| "is_parallel": true, | |
| "self": 20.079214052069347, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 78.4851122249338, | |
| "count": 511856, | |
| "is_parallel": true, | |
| "self": 78.4851122249338 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 638.810812357885, | |
| "count": 63983, | |
| "self": 2.6279607609471896, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 129.42429262893575, | |
| "count": 63983, | |
| "self": 129.22864745593552, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.19564517300023, | |
| "count": 2, | |
| "self": 0.19564517300023 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 506.75855896800203, | |
| "count": 454, | |
| "self": 297.20957183900373, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 209.5489871289983, | |
| "count": 22839, | |
| "self": 209.5489871289983 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 8.770002750679851e-07, | |
| "count": 1, | |
| "self": 8.770002750679851e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.08774689999972907, | |
| "count": 1, | |
| "self": 0.0014895069998601684, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.0862573929998689, | |
| "count": 1, | |
| "self": 0.0862573929998689 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |