| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.5703490972518921, | |
| "min": 0.5494472980499268, | |
| "max": 1.4027103185653687, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 17101.34765625, | |
| "min": 16562.5390625, | |
| "max": 42552.62109375, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989997.0, | |
| "min": 29952.0, | |
| "max": 989997.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989997.0, | |
| "min": 29952.0, | |
| "max": 989997.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.09232138842344284, | |
| "min": -0.12184180319309235, | |
| "max": 0.09232138842344284, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 22.988025665283203, | |
| "min": -28.876506805419922, | |
| "max": 22.988025665283203, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.013315600343048573, | |
| "min": 0.007485616020858288, | |
| "max": 0.4585472345352173, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 3.315584421157837, | |
| "min": 1.8264902830123901, | |
| "max": 108.67569732666016, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06612502732708131, | |
| "min": 0.06429373416306969, | |
| "max": 0.07457556224764238, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9257503825791383, | |
| "min": 0.5012756362031368, | |
| "max": 1.049068538531976, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.006806938070403141, | |
| "min": 0.00013274726171743837, | |
| "max": 0.01624260973897305, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.09529713298564398, | |
| "min": 0.0017257144023266986, | |
| "max": 0.11369826817281137, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.546790341578573e-06, | |
| "min": 7.546790341578573e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00010565506478210003, | |
| "min": 0.00010565506478210003, | |
| "max": 0.0035071946309352, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.1025155642857143, | |
| "min": 0.1025155642857143, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4352179000000003, | |
| "min": 1.3886848, | |
| "max": 2.5690648, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0002613048721428573, | |
| "min": 0.0002613048721428573, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.003658268210000002, | |
| "min": 0.003658268210000002, | |
| "max": 0.11692957352, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.014894582331180573, | |
| "min": 0.014894582331180573, | |
| "max": 0.5332163572311401, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.20852415263652802, | |
| "min": 0.20852415263652802, | |
| "max": 3.7325146198272705, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 737.3255813953489, | |
| "min": 737.3255813953489, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 31705.0, | |
| "min": 15984.0, | |
| "max": 32528.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 0.28570693956558096, | |
| "min": -1.0000000521540642, | |
| "max": 0.28570693956558096, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 12.28539840131998, | |
| "min": -31.994401648640633, | |
| "max": 12.28539840131998, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 0.28570693956558096, | |
| "min": -1.0000000521540642, | |
| "max": 0.28570693956558096, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 12.28539840131998, | |
| "min": -31.994401648640633, | |
| "max": 12.28539840131998, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.1159303622553125, | |
| "min": 0.1159303622553125, | |
| "max": 11.660213833674788, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 4.985005576978438, | |
| "min": 4.483415444614366, | |
| "max": 186.56342133879662, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1759783143", | |
| "python_version": "3.10.12 (main, Aug 15 2025, 14:32:43) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.1.0", | |
| "mlagents_envs_version": "1.1.0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.8.0+cpu", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1759785239" | |
| }, | |
| "total": 2096.077959533999, | |
| "count": 1, | |
| "self": 0.4292326389977461, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.016560984000534518, | |
| "count": 1, | |
| "self": 0.016560984000534518 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2095.632165911001, | |
| "count": 1, | |
| "self": 1.3077462239789384, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 1.6186284680006793, | |
| "count": 1, | |
| "self": 1.6186284680006793 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2092.6537368150202, | |
| "count": 63283, | |
| "self": 1.3465351380928041, | |
| "children": { | |
| "env_step": { | |
| "total": 1369.5665481859487, | |
| "count": 63283, | |
| "self": 1271.5928540321793, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 97.20022819699898, | |
| "count": 63283, | |
| "self": 4.6554433552519185, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 92.54478484174706, | |
| "count": 62552, | |
| "self": 92.54478484174706 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.7734659567704512, | |
| "count": 63283, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2090.506994118112, | |
| "count": 63283, | |
| "is_parallel": true, | |
| "self": 933.0590825298386, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0023786649999237852, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0007521420011471491, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.001626522998776636, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.001626522998776636 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.04664285899980314, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005312780003805528, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004587119992720545, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004587119992720545 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.04399000400007935, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.04399000400007935 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0016628650000711787, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003587480014175526, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.001304116998653626, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.001304116998653626 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1157.4479115882732, | |
| "count": 63282, | |
| "is_parallel": true, | |
| "self": 32.63660534833434, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 23.34338906888661, | |
| "count": 63282, | |
| "is_parallel": true, | |
| "self": 23.34338906888661 | |
| }, | |
| "communicator.exchange": { | |
| "total": 986.3345122918918, | |
| "count": 63282, | |
| "is_parallel": true, | |
| "self": 986.3345122918918 | |
| }, | |
| "steps_from_proto": { | |
| "total": 115.13340487916048, | |
| "count": 63282, | |
| "is_parallel": true, | |
| "self": 25.490181528660287, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 89.6432233505002, | |
| "count": 506256, | |
| "is_parallel": true, | |
| "self": 89.6432233505002 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 721.7406534909787, | |
| "count": 63283, | |
| "self": 2.3948062549025053, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 118.50225092205801, | |
| "count": 63283, | |
| "self": 118.29783259005853, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.20441833199947723, | |
| "count": 2, | |
| "self": 0.20441833199947723 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 600.8435963140182, | |
| "count": 449, | |
| "self": 282.71514406496317, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 318.12845224905504, | |
| "count": 22788, | |
| "self": 318.12845224905504 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.739997040014714e-07, | |
| "count": 1, | |
| "self": 9.739997040014714e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.0520534300012514, | |
| "count": 1, | |
| "self": 0.0010650080021150643, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.050988421999136335, | |
| "count": 1, | |
| "self": 0.050988421999136335 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |