| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.19634008407592773, | |
| "min": 0.18254616856575012, | |
| "max": 0.20913568139076233, | |
| "count": 8 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 6015.8603515625, | |
| "min": 1244.887939453125, | |
| "max": 6404.5712890625, | |
| "count": 8 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 227.02307692307693, | |
| "min": 156.0, | |
| "max": 274.3669724770642, | |
| "count": 8 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29513.0, | |
| "min": 4056.0, | |
| "max": 30708.0, | |
| "count": 8 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 2999867.0, | |
| "min": 2789758.0, | |
| "max": 2999867.0, | |
| "count": 8 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 2999867.0, | |
| "min": 2789758.0, | |
| "max": 2999867.0, | |
| "count": 8 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.6668941378593445, | |
| "min": 0.5666171908378601, | |
| "max": 0.6668941378593445, | |
| "count": 8 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 90.69760131835938, | |
| "min": 14.709369659423828, | |
| "max": 90.69760131835938, | |
| "count": 8 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.007446997333317995, | |
| "min": -0.0014452653704211116, | |
| "max": 0.013798771426081657, | |
| "count": 8 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 1.012791633605957, | |
| "min": -0.17054131627082825, | |
| "max": 1.6834501028060913, | |
| "count": 8 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.773646126802151, | |
| "min": 1.6794156214465266, | |
| "max": 1.847959976196289, | |
| "count": 8 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 230.57399648427963, | |
| "min": 46.19899940490723, | |
| "max": 230.57399648427963, | |
| "count": 8 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.773646126802151, | |
| "min": 1.6794156214465266, | |
| "max": 1.847959976196289, | |
| "count": 8 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 230.57399648427963, | |
| "min": 46.19899940490723, | |
| "max": 230.57399648427963, | |
| "count": 8 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.02162035130895674, | |
| "min": 0.01450827432796359, | |
| "max": 0.026932200510909252, | |
| "count": 8 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 2.8106456701643765, | |
| "min": 0.36270685819908977, | |
| "max": 2.9356098556891084, | |
| "count": 8 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 8 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 8 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.045205598968702056, | |
| "min": 0.04513349834208687, | |
| "max": 0.05072030359828592, | |
| "count": 7 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.31643919278091437, | |
| "min": 0.3159344883946081, | |
| "max": 0.40231775108487433, | |
| "count": 7 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.01756046380614862, | |
| "min": 0.01689078080843213, | |
| "max": 0.018238895967457945, | |
| "count": 7 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.12292324664304033, | |
| "min": 0.11823546565902493, | |
| "max": 0.13659650496636316, | |
| "count": 7 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 4.547376405999977e-07, | |
| "min": 4.547376405999977e-07, | |
| "max": 6.504610162150001e-06, | |
| "count": 7 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 3.183163484199984e-06, | |
| "min": 3.183163484199984e-06, | |
| "max": 5.2036881297200007e-05, | |
| "count": 7 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10045463809523807, | |
| "min": 0.10045463809523807, | |
| "max": 0.10650451666666667, | |
| "count": 7 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 0.7031824666666665, | |
| "min": 0.7031824666666665, | |
| "max": 0.8520361333333334, | |
| "count": 7 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 1.450091714285712e-05, | |
| "min": 1.450091714285712e-05, | |
| "max": 7.4394715e-05, | |
| "count": 7 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.00010150641999999984, | |
| "min": 0.00010150641999999984, | |
| "max": 0.00059515772, | |
| "count": 7 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.009293955750763416, | |
| "min": 0.008975865319371223, | |
| "max": 0.009324299171566963, | |
| "count": 7 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.06505768746137619, | |
| "min": 0.06283105909824371, | |
| "max": 0.07334689050912857, | |
| "count": 7 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1736614884", | |
| "python_version": "3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.5.1+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1736615475" | |
| }, | |
| "total": 591.3225794409991, | |
| "count": 1, | |
| "self": 0.7973925389997021, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.05759276599928853, | |
| "count": 1, | |
| "self": 0.05759276599928853 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 590.4675941360001, | |
| "count": 1, | |
| "self": 0.39906842290110944, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 3.1235094540006685, | |
| "count": 1, | |
| "self": 3.1235094540006685 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 586.819589131097, | |
| "count": 14188, | |
| "self": 0.4218017009425239, | |
| "children": { | |
| "env_step": { | |
| "total": 466.5465965630483, | |
| "count": 14188, | |
| "self": 426.67460349303656, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 39.630197194972425, | |
| "count": 14188, | |
| "self": 1.191651979848757, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 38.43854521512367, | |
| "count": 13536, | |
| "self": 38.43854521512367 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.24179587503931543, | |
| "count": 14188, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 588.8598102130964, | |
| "count": 14188, | |
| "is_parallel": true, | |
| "self": 192.91342673410145, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.002846036999471835, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0009063310008059489, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.001939705998665886, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.001939705998665886 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.11663748899991333, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.005320938000295428, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005124399995111162, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005124399995111162 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.10718975000054343, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.10718975000054343 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0036143609995633597, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.002300742997249472, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013136180023138877, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013136180023138877 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 395.9463834789949, | |
| "count": 14187, | |
| "is_parallel": true, | |
| "self": 8.27391039919712, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 5.66011124700708, | |
| "count": 14187, | |
| "is_parallel": true, | |
| "self": 5.66011124700708 | |
| }, | |
| "communicator.exchange": { | |
| "total": 357.27115853094074, | |
| "count": 14187, | |
| "is_parallel": true, | |
| "self": 357.27115853094074 | |
| }, | |
| "steps_from_proto": { | |
| "total": 24.741203301849964, | |
| "count": 14187, | |
| "is_parallel": true, | |
| "self": 5.356703152297996, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 19.384500149551968, | |
| "count": 113496, | |
| "is_parallel": true, | |
| "self": 19.384500149551968 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 119.8511908671062, | |
| "count": 14188, | |
| "self": 0.85680559807588, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 27.788448726028946, | |
| "count": 14188, | |
| "self": 27.60438441102815, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.18406431500079634, | |
| "count": 1, | |
| "self": 0.18406431500079634 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 91.20593654300137, | |
| "count": 50, | |
| "self": 60.63762731401221, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 30.568309228989165, | |
| "count": 2430, | |
| "self": 30.568309228989165 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.1990014172624797e-06, | |
| "count": 1, | |
| "self": 1.1990014172624797e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.12542592899990268, | |
| "count": 1, | |
| "self": 0.003000004000568879, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.1224259249993338, | |
| "count": 1, | |
| "self": 0.1224259249993338 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |