| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.13997095823287964, | |
| "min": 0.13515740633010864, | |
| "max": 1.5335098505020142, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 4185.69140625, | |
| "min": 4050.397216796875, | |
| "max": 46520.5546875, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 2999951.0, | |
| "min": 29974.0, | |
| "max": 2999951.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 2999951.0, | |
| "min": 29974.0, | |
| "max": 2999951.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.8112826347351074, | |
| "min": -0.10546746850013733, | |
| "max": 0.8812189102172852, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 245.81863403320312, | |
| "min": -25.417659759521484, | |
| "max": 273.1778564453125, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.013699229806661606, | |
| "min": -0.005644344259053469, | |
| "max": 0.1852613240480423, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 4.150866508483887, | |
| "min": -1.66508150100708, | |
| "max": 44.647979736328125, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.07026074094063092, | |
| "min": 0.06211566593746149, | |
| "max": 0.07511671141892497, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.983650373168833, | |
| "min": 0.5947844996523509, | |
| "max": 1.121613116217001, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.015531344338640094, | |
| "min": 0.0005532349624091268, | |
| "max": 0.01795476450795485, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.21743882074096132, | |
| "min": 0.007192054511318649, | |
| "max": 0.2513667031113679, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 1.4412923767452392e-06, | |
| "min": 1.4412923767452392e-06, | |
| "max": 0.00029828397557200837, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 2.017809327443335e-05, | |
| "min": 2.017809327443335e-05, | |
| "max": 0.004010949563016833, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.1004803976190476, | |
| "min": 0.1004803976190476, | |
| "max": 0.19942799166666667, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4067255666666665, | |
| "min": 1.4067255666666665, | |
| "max": 2.7975145666666674, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 5.799172214285719e-05, | |
| "min": 5.799172214285719e-05, | |
| "max": 0.009942856367499999, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0008118841100000007, | |
| "min": 0.0008118841100000007, | |
| "max": 0.13370461835, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.005496342666447163, | |
| "min": 0.005496342666447163, | |
| "max": 0.3608822226524353, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.07694879919290543, | |
| "min": 0.07694879919290543, | |
| "max": 2.8870577812194824, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 231.5859375, | |
| "min": 202.80141843971631, | |
| "max": 995.53125, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29643.0, | |
| "min": 16261.0, | |
| "max": 33373.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.7212968617677689, | |
| "min": -0.9337813011370599, | |
| "max": 1.7942777725143566, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 220.3259983062744, | |
| "min": -29.881001636385918, | |
| "max": 268.265997633338, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.7212968617677689, | |
| "min": -0.9337813011370599, | |
| "max": 1.7942777725143566, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 220.3259983062744, | |
| "min": -29.881001636385918, | |
| "max": 268.265997633338, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.013274244590974149, | |
| "min": 0.012789758633581116, | |
| "max": 7.566931799054146, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 1.699103307644691, | |
| "min": 1.699103307644691, | |
| "max": 128.63784058392048, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1743247210", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.6.0+cu124", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1743254608" | |
| }, | |
| "total": 7398.44707014, | |
| "count": 1, | |
| "self": 0.5312970799986942, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.019611703000009584, | |
| "count": 1, | |
| "self": 0.019611703000009584 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 7397.896161357001, | |
| "count": 1, | |
| "self": 4.140634342924386, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.100141836000148, | |
| "count": 1, | |
| "self": 2.100141836000148 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 7391.564862175074, | |
| "count": 195415, | |
| "self": 4.192528928921092, | |
| "children": { | |
| "env_step": { | |
| "total": 5349.433735135832, | |
| "count": 195415, | |
| "self": 4883.7247261575485, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 463.29011357131367, | |
| "count": 195415, | |
| "self": 13.96375521139953, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 449.32635835991414, | |
| "count": 187555, | |
| "self": 449.32635835991414 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 2.4188954069691135, | |
| "count": 195415, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 7382.397145986948, | |
| "count": 195415, | |
| "is_parallel": true, | |
| "self": 2843.0253636796224, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0021031010001024697, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006904639999447681, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0014126370001577016, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0014126370001577016 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.04908028700037903, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005147440001564973, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004972369997631176, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004972369997631176 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.04638279300024806, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.04638279300024806 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0016855130002113583, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00035757500108957174, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013279379991217866, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013279379991217866 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 4539.371782307326, | |
| "count": 195414, | |
| "is_parallel": true, | |
| "self": 95.84744425767713, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 70.715368155139, | |
| "count": 195414, | |
| "is_parallel": true, | |
| "self": 70.715368155139 | |
| }, | |
| "communicator.exchange": { | |
| "total": 4080.673982500776, | |
| "count": 195414, | |
| "is_parallel": true, | |
| "self": 4080.673982500776 | |
| }, | |
| "steps_from_proto": { | |
| "total": 292.13498739373335, | |
| "count": 195414, | |
| "is_parallel": true, | |
| "self": 59.96355395639603, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 232.17143343733733, | |
| "count": 1563312, | |
| "is_parallel": true, | |
| "self": 232.17143343733733 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 2037.9385981103214, | |
| "count": 195415, | |
| "self": 8.572907293308617, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 395.5845103520005, | |
| "count": 195415, | |
| "self": 394.9405266760009, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.6439836759996069, | |
| "count": 6, | |
| "self": 0.6439836759996069 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 1633.7811804650123, | |
| "count": 1401, | |
| "self": 891.1595728188636, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 742.6216076461487, | |
| "count": 68421, | |
| "self": 742.6216076461487 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 8.750012057134882e-07, | |
| "count": 1, | |
| "self": 8.750012057134882e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.09052212800088455, | |
| "count": 1, | |
| "self": 0.001743404001899762, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.08877872399898479, | |
| "count": 1, | |
| "self": 0.08877872399898479 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |