| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.13767725229263306, | |
| "min": 0.11736847460269928, | |
| "max": 1.4065113067626953, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 4145.7373046875, | |
| "min": 3506.031005859375, | |
| "max": 42667.92578125, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 2999893.0, | |
| "min": 29952.0, | |
| "max": 2999893.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 2999893.0, | |
| "min": 29952.0, | |
| "max": 2999893.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.8235560655593872, | |
| "min": -0.09233143925666809, | |
| "max": 0.8545447587966919, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 249.53749084472656, | |
| "min": -22.1595458984375, | |
| "max": 259.052001953125, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.060299649834632874, | |
| "min": -0.03345511481165886, | |
| "max": 0.3823799788951874, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 18.270793914794922, | |
| "min": -9.802349090576172, | |
| "max": 92.9183349609375, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06712005015267633, | |
| "min": 0.06505776217037906, | |
| "max": 0.07593477028441173, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9396807021374686, | |
| "min": 0.5315433919908821, | |
| "max": 1.0888115173438564, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.01675657390759337, | |
| "min": 0.0009381663753779158, | |
| "max": 0.017523056156711563, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.23459203470630718, | |
| "min": 0.01313432925529082, | |
| "max": 0.2464741367233835, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 1.4351280930857127e-06, | |
| "min": 1.4351280930857127e-06, | |
| "max": 0.00029838354339596195, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 2.0091793303199977e-05, | |
| "min": 2.0091793303199977e-05, | |
| "max": 0.004010773063075666, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10047834285714287, | |
| "min": 0.10047834285714287, | |
| "max": 0.19946118095238097, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4066968000000002, | |
| "min": 1.3962282666666668, | |
| "max": 2.8275804, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 5.778645142857135e-05, | |
| "min": 5.778645142857135e-05, | |
| "max": 0.009946171977142856, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0008090103199999989, | |
| "min": 0.0008090103199999989, | |
| "max": 0.1336987409, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.013224425725638866, | |
| "min": 0.013007568195462227, | |
| "max": 0.5398194193840027, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.18514196574687958, | |
| "min": 0.18210595846176147, | |
| "max": 3.778736114501953, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 207.41007194244605, | |
| "min": 207.41007194244605, | |
| "max": 999.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 28830.0, | |
| "min": 15984.0, | |
| "max": 32857.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.7649485568915095, | |
| "min": -1.0000000521540642, | |
| "max": 1.7738753476220628, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 247.09279796481133, | |
| "min": -28.120801649987698, | |
| "max": 247.09279796481133, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.7649485568915095, | |
| "min": -1.0000000521540642, | |
| "max": 1.7738753476220628, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 247.09279796481133, | |
| "min": -28.120801649987698, | |
| "max": 247.09279796481133, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.028046778935095062, | |
| "min": 0.028046778935095062, | |
| "max": 9.988997579552233, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 3.9265490509133087, | |
| "min": 3.9265490509133087, | |
| "max": 159.82396127283573, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1742648685", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.6.0+cu124", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1742657080" | |
| }, | |
| "total": 8394.721010406, | |
| "count": 1, | |
| "self": 1.4242156300006172, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.023512602999971932, | |
| "count": 1, | |
| "self": 0.023512602999971932 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 8393.273282172999, | |
| "count": 1, | |
| "self": 4.931491036239095, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 3.5326586170000382, | |
| "count": 1, | |
| "self": 3.5326586170000382 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 8384.665987793762, | |
| "count": 195779, | |
| "self": 5.072668996564971, | |
| "children": { | |
| "env_step": { | |
| "total": 6171.229749677905, | |
| "count": 195779, | |
| "self": 5648.074184336097, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 520.2704272579558, | |
| "count": 195779, | |
| "self": 15.971823155933237, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 504.2986041020226, | |
| "count": 187559, | |
| "self": 504.2986041020226 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 2.8851380838523255, | |
| "count": 195779, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 8375.217938242642, | |
| "count": 195779, | |
| "is_parallel": true, | |
| "self": 3120.3453993627563, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.005836607999981425, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.004307386999926166, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0015292210000552586, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0015292210000552586 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.05865269499997794, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005673469999578629, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005633929999930842, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005633929999930842 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.052018168000017795, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.052018168000017795 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.005503787000009197, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.004223927000055028, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012798599999541693, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012798599999541693 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 5254.872538879886, | |
| "count": 195778, | |
| "is_parallel": true, | |
| "self": 105.91264481711005, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 78.69610648391279, | |
| "count": 195778, | |
| "is_parallel": true, | |
| "self": 78.69610648391279 | |
| }, | |
| "communicator.exchange": { | |
| "total": 4738.607032636858, | |
| "count": 195778, | |
| "is_parallel": true, | |
| "self": 4738.607032636858 | |
| }, | |
| "steps_from_proto": { | |
| "total": 331.6567549420054, | |
| "count": 195778, | |
| "is_parallel": true, | |
| "self": 69.50220483661946, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 262.15455010538597, | |
| "count": 1566224, | |
| "is_parallel": true, | |
| "self": 262.15455010538597 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 2208.3635691192926, | |
| "count": 195779, | |
| "self": 9.606010087308277, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 436.6751568659881, | |
| "count": 195779, | |
| "self": 435.9109330989888, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.7642237669992937, | |
| "count": 6, | |
| "self": 0.7642237669992937 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 1762.0824021659964, | |
| "count": 1406, | |
| "self": 968.5204899701068, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 793.5619121958896, | |
| "count": 68364, | |
| "self": 793.5619121958896 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.4139986888039857e-06, | |
| "count": 1, | |
| "self": 1.4139986888039857e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.14314331199966546, | |
| "count": 1, | |
| "self": 0.0025536149987601675, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.1405896970009053, | |
| "count": 1, | |
| "self": 0.1405896970009053 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |