{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.21720464527606964, "min": 0.20768827199935913, "max": 0.29807475209236145, "count": 17 }, "Pyramids.Policy.Entropy.sum": { "value": 6460.53515625, "min": 6210.7099609375, "max": 8664.7734375, "count": 17 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 279.6574074074074, "min": 260.4086956521739, "max": 345.0444444444444, "count": 17 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 30203.0, "min": 16795.0, "max": 31320.0, "count": 17 }, "Pyramids.Step.mean": { "value": 1499980.0, "min": 1019934.0, "max": 1499980.0, "count": 17 }, "Pyramids.Step.sum": { "value": 1499980.0, "min": 1019934.0, "max": 1499980.0, "count": 17 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.6857998371124268, "min": 0.5569564700126648, "max": 0.6999236941337585, "count": 17 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 197.51034545898438, "min": 106.35494995117188, "max": 207.87733459472656, "count": 17 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.011466632597148418, "min": -0.003921444062143564, "max": 0.08421960473060608, "count": 17 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 3.3023900985717773, "min": -1.0901614427566528, "max": 24.002588272094727, "count": 17 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.7042280218311558, "min": 1.502714267716958, "max": 1.7395912886961646, "count": 17 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 182.35239833593369, "min": 99.20499943196774, "max": 200.05299820005894, "count": 17 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.7042280218311558, "min": 1.502714267716958, "max": 1.7395912886961646, "count": 17 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 182.35239833593369, "min": 99.20499943196774, "max": 200.05299820005894, "count": 17 }, "Pyramids.Policy.RndReward.mean": { "value": 0.024416481507300164, "min": 0.022409672142715532, "max": 0.03160340793149042, "count": 17 }, "Pyramids.Policy.RndReward.sum": { "value": 2.6125635212811176, "min": 1.6711126518785022, "max": 3.0019219083333155, "count": 17 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06975638308323964, "min": 0.06622975742485485, "max": 0.07178942280422364, "count": 17 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.9765893631653549, "min": 0.6101926534708279, "max": 1.01275189212916, "count": 17 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.016813369541307025, "min": 0.01431408897596633, "max": 0.017236776922973582, "count": 17 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.23538717357829836, "min": 0.1338397917764572, "max": 0.24501954557490538, "count": 17 }, "Pyramids.Policy.LearningRate.mean": { "value": 2.9738561516047628e-06, "min": 2.9738561516047628e-06, "max": 9.789306736899999e-05, "count": 17 }, "Pyramids.Policy.LearningRate.sum": { "value": 4.1633986122466676e-05, "min": 4.1633986122466676e-05, "max": 0.0013018851660385998, "count": 17 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.1009912523809524, "min": 0.1009912523809524, "max": 0.13263100000000005, "count": 17 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4138775333333335, "min": 1.1936790000000004, "max": 1.9048246000000002, "count": 17 }, "Pyramids.Policy.Beta.mean": { "value": 0.0001090261128571429, "min": 0.0001090261128571429, "max": 0.0032698369000000002, "count": 17 }, "Pyramids.Policy.Beta.sum": { "value": 0.0015263655800000005, "min": 0.0015263655800000005, "max": 0.04349274386, "count": 17 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.00849104393273592, "min": 0.0080970274284482, "max": 0.009547818452119827, "count": 17 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.11887460947036743, "min": 0.08593036234378815, "max": 0.13323572278022766, "count": 17 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 17 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 17 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1726704575", "python_version": "3.10.14 (main, Apr 17 2024, 00:00:00) [GCC 13.2.1 20240316 (Red Hat 13.2.1-7)]", "command_line_arguments": "/home/michael/Repo/DeepRLCourse/venv/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", "mlagents_version": "1.1.0.dev0", "mlagents_envs_version": "1.1.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.4.0+rocm6.1", "numpy_version": "1.23.5", "end_time_seconds": "1726705048" }, "total": 473.71785410499433, "count": 1, "self": 0.21809501701500267, "children": { "run_training.setup": { "total": 0.01654465199680999, "count": 1, "self": 0.01654465199680999 }, "TrainerController.start_learning": { "total": 473.4832144359825, "count": 1, "self": 0.43410689767915756, "children": { "TrainerController._reset_env": { "total": 1.1233860200154595, "count": 1, "self": 1.1233860200154595 }, "TrainerController.advance": { "total": 471.8779994753131, "count": 32645, "self": 0.3900848307821434, "children": { "env_step": { "total": 285.53448172067874, "count": 32645, "self": 236.0893001385557, "children": { "SubprocessEnvManager._take_step": { "total": 49.193108400155324, "count": 32645, "self": 1.0925407735048793, "children": { "TorchPolicy.evaluate": { "total": 48.100567626650445, "count": 31290, "self": 48.100567626650445 } } }, "workers": { "total": 0.25207318196771666, "count": 32645, "self": 0.0, "children": { "worker_root": { "total": 472.8673126748181, "count": 32645, "is_parallel": true, "self": 262.82770341748255, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0011030320019926876, "count": 1, "is_parallel": true, "self": 0.0003565579536370933, "children": { "_process_rank_one_or_two_observation": { "total": 0.0007464740483555943, "count": 8, "is_parallel": true, "self": 0.0007464740483555943 } } }, "UnityEnvironment.step": { "total": 0.016810662986245006, "count": 1, "is_parallel": true, "self": 0.00019693400827236474, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0001981329987756908, "count": 1, "is_parallel": true, "self": 0.0001981329987756908 }, "communicator.exchange": { "total": 0.015795077983057126, "count": 1, "is_parallel": true, "self": 0.015795077983057126 }, "steps_from_proto": { "total": 0.0006205179961398244, "count": 1, "is_parallel": true, "self": 0.0001533749746158719, "children": { "_process_rank_one_or_two_observation": { "total": 0.0004671430215239525, "count": 8, "is_parallel": true, "self": 0.0004671430215239525 } } } } } } }, "UnityEnvironment.step": { "total": 210.03960925733554, "count": 32644, "is_parallel": true, "self": 5.756008195952745, "children": { "UnityEnvironment._generate_step_input": { "total": 4.313196824630722, "count": 32644, "is_parallel": true, "self": 4.313196824630722 }, "communicator.exchange": { "total": 182.56862023012945, "count": 32644, "is_parallel": true, "self": 182.56862023012945 }, "steps_from_proto": { "total": 17.40178400662262, "count": 32644, "is_parallel": true, "self": 4.037765364308143, "children": { "_process_rank_one_or_two_observation": { "total": 13.364018642314477, "count": 261152, "is_parallel": true, "self": 13.364018642314477 } } } } } } } } } } }, "trainer_advance": { "total": 185.95343292385223, "count": 32645, "self": 0.8427105708105955, "children": { "process_trajectory": { "total": 36.69104316688026, "count": 32645, "self": 36.632464149879524, "children": { "RLTrainer._checkpoint": { "total": 0.05857901700073853, "count": 1, "self": 0.05857901700073853 } } }, "_update_policy": { "total": 148.41967918616137, "count": 236, "self": 82.20424556016224, "children": { "TorchPPOOptimizer.update": { "total": 66.21543362599914, "count": 11352, "self": 66.21543362599914 } } } } } } }, "trainer_threads": { "total": 5.599868018180132e-07, "count": 1, "self": 5.599868018180132e-07 }, "TrainerController._save_models": { "total": 0.04772148298798129, "count": 1, "self": 0.0014789959823247045, "children": { "RLTrainer._checkpoint": { "total": 0.046242487005656585, "count": 1, "self": 0.046242487005656585 } } } } } } }