| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.5280116200447083, | |
| "min": 0.5280116200447083, | |
| "max": 1.3660978078842163, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 15907.93359375, | |
| "min": 15907.93359375, | |
| "max": 41441.94140625, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989970.0, | |
| "min": 29952.0, | |
| "max": 989970.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989970.0, | |
| "min": 29952.0, | |
| "max": 989970.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.053314488381147385, | |
| "min": -0.11195410788059235, | |
| "max": 0.18728280067443848, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 13.115364074707031, | |
| "min": -27.092893600463867, | |
| "max": 44.386024475097656, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.013439892791211605, | |
| "min": 0.011330770328640938, | |
| "max": 0.49259132146835327, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 3.306213617324829, | |
| "min": 2.810030937194824, | |
| "max": 116.744140625, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06902576163933162, | |
| "min": 0.06497942256949045, | |
| "max": 0.07245671332323288, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9663606629506426, | |
| "min": 0.5071969932626301, | |
| "max": 1.035204475665666, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.008374417846084123, | |
| "min": 8.181983830072212e-05, | |
| "max": 0.012613309092369586, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.11724184984517773, | |
| "min": 0.0011454777362101096, | |
| "max": 0.14626419761075607, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.361240403428575e-06, | |
| "min": 7.361240403428575e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00010305736564800005, | |
| "min": 0.00010305736564800005, | |
| "max": 0.0033817808727397993, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10245371428571429, | |
| "min": 0.10245371428571429, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.434352, | |
| "min": 1.3886848, | |
| "max": 2.5272602000000006, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00025512605714285734, | |
| "min": 0.00025512605714285734, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0035717648000000027, | |
| "min": 0.0035717648000000027, | |
| "max": 0.11275329398, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.01734367571771145, | |
| "min": 0.017181305214762688, | |
| "max": 0.7163676619529724, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.24281147122383118, | |
| "min": 0.24053826928138733, | |
| "max": 5.014573574066162, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 811.7222222222222, | |
| "min": 728.6666666666666, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29222.0, | |
| "min": 15984.0, | |
| "max": 32626.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 0.29912773540450466, | |
| "min": -1.0000000521540642, | |
| "max": 0.4276139114138692, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 10.768598474562168, | |
| "min": -31.99920167028904, | |
| "max": 18.387398190796375, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 0.29912773540450466, | |
| "min": -1.0000000521540642, | |
| "max": 0.4276139114138692, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 10.768598474562168, | |
| "min": -31.99920167028904, | |
| "max": 18.387398190796375, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.14433983834492714, | |
| "min": 0.1334694708388862, | |
| "max": 14.515450745821, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 5.1962341804173775, | |
| "min": 4.871754383377265, | |
| "max": 232.247211933136, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1691031744", | |
| "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "0.31.0.dev0", | |
| "mlagents_envs_version": "0.31.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "1.11.0+cu102", | |
| "numpy_version": "1.21.2", | |
| "end_time_seconds": "1691034019" | |
| }, | |
| "total": 2275.55502193, | |
| "count": 1, | |
| "self": 0.4915565409996816, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.06689123799998242, | |
| "count": 1, | |
| "self": 0.06689123799998242 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2274.996574151, | |
| "count": 1, | |
| "self": 1.6048196840069977, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 5.762007885000003, | |
| "count": 1, | |
| "self": 5.762007885000003 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2267.533115889993, | |
| "count": 63214, | |
| "self": 1.676050937002401, | |
| "children": { | |
| "env_step": { | |
| "total": 1568.596108532004, | |
| "count": 63214, | |
| "self": 1443.6516747410005, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 123.96927312102986, | |
| "count": 63214, | |
| "self": 5.2763418730484375, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 118.69293124798142, | |
| "count": 62563, | |
| "self": 118.69293124798142 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.9751606699738318, | |
| "count": 63214, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2269.3755010989835, | |
| "count": 63214, | |
| "is_parallel": true, | |
| "self": 954.8299821089788, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.007158458000020573, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.005704014000116331, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0014544439999042424, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0014544439999042424 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.05180290399999876, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005849090000253909, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005819109999833927, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005819109999833927 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.04866447000000562, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.04866447000000562 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0019716139999843563, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003828699999814944, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0015887440000028619, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0015887440000028619 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1314.5455189900047, | |
| "count": 63213, | |
| "is_parallel": true, | |
| "self": 36.25944546500364, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 25.742639747044052, | |
| "count": 63213, | |
| "is_parallel": true, | |
| "self": 25.742639747044052 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1135.5403156469388, | |
| "count": 63213, | |
| "is_parallel": true, | |
| "self": 1135.5403156469388 | |
| }, | |
| "steps_from_proto": { | |
| "total": 117.00311813101817, | |
| "count": 63213, | |
| "is_parallel": true, | |
| "self": 23.14488491912067, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 93.8582332118975, | |
| "count": 505704, | |
| "is_parallel": true, | |
| "self": 93.8582332118975 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 697.2609564209864, | |
| "count": 63214, | |
| "self": 2.866747943014957, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 120.90293706697315, | |
| "count": 63214, | |
| "self": 120.68252031297305, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.22041675400009808, | |
| "count": 2, | |
| "self": 0.22041675400009808 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 573.4912714109983, | |
| "count": 439, | |
| "self": 376.47104737696566, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 197.02022403403257, | |
| "count": 22875, | |
| "self": 197.02022403403257 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.99999883788405e-07, | |
| "count": 1, | |
| "self": 9.99999883788405e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.09662969200007865, | |
| "count": 1, | |
| "self": 0.001425008000296657, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.09520468399978199, | |
| "count": 1, | |
| "self": 0.09520468399978199 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |