| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.4484938085079193, | |
| "min": 0.4484938085079193, | |
| "max": 1.507041573524475, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 13361.52734375, | |
| "min": 13361.52734375, | |
| "max": 45717.61328125, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989890.0, | |
| "min": 29952.0, | |
| "max": 989890.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989890.0, | |
| "min": 29952.0, | |
| "max": 989890.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.24449053406715393, | |
| "min": -0.08303222805261612, | |
| "max": 0.34761524200439453, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 62.34508514404297, | |
| "min": -19.927734375, | |
| "max": 90.37995910644531, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": -1.879557490348816, | |
| "min": -1.9528666734695435, | |
| "max": 2.180330753326416, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": -479.28717041015625, | |
| "min": -509.6982116699219, | |
| "max": 566.885986328125, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.0711138052494524, | |
| "min": 0.06491783739918554, | |
| "max": 0.07402172435731044, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9955932734923337, | |
| "min": 0.48381534922532143, | |
| "max": 1.0571641896830817, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.523038732927196, | |
| "min": 0.00012919346758292347, | |
| "max": 0.523038732927196, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 7.322542260980745, | |
| "min": 0.0018087085461609286, | |
| "max": 7.322542260980745, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.289090427478574e-06, | |
| "min": 7.289090427478574e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00010204726598470004, | |
| "min": 0.00010204726598470004, | |
| "max": 0.0032558954147015994, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10242966428571428, | |
| "min": 0.10242966428571428, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4340152999999998, | |
| "min": 1.3691136000000002, | |
| "max": 2.4431072000000005, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0002527234621428573, | |
| "min": 0.0002527234621428573, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.003538128470000002, | |
| "min": 0.003538128470000002, | |
| "max": 0.10855131016000003, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.009125393815338612, | |
| "min": 0.009125393815338612, | |
| "max": 0.41734614968299866, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.12775550782680511, | |
| "min": 0.12775550782680511, | |
| "max": 2.9214229583740234, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 571.2307692307693, | |
| "min": 495.52542372881356, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29704.0, | |
| "min": 15984.0, | |
| "max": 32747.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.0825345877271433, | |
| "min": -1.0000000521540642, | |
| "max": 1.2685573508993524, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 56.29179856181145, | |
| "min": -32.000001668930054, | |
| "max": 77.3819984048605, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.0825345877271433, | |
| "min": -1.0000000521540642, | |
| "max": 1.2685573508993524, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 56.29179856181145, | |
| "min": -32.000001668930054, | |
| "max": 77.3819984048605, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.054566108950754054, | |
| "min": 0.05042585650493284, | |
| "max": 8.928653911687434, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 2.837437665439211, | |
| "min": 2.837437665439211, | |
| "max": 142.85846258699894, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1750681963", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.7.1+cu126", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1750684028" | |
| }, | |
| "total": 2064.788200636, | |
| "count": 1, | |
| "self": 0.5462420210001255, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.023352799999997842, | |
| "count": 1, | |
| "self": 0.023352799999997842 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2064.218605815, | |
| "count": 1, | |
| "self": 1.2372683429771314, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 3.893654857999991, | |
| "count": 1, | |
| "self": 3.893654857999991 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2059.007950086023, | |
| "count": 63415, | |
| "self": 1.3015567399934298, | |
| "children": { | |
| "env_step": { | |
| "total": 1410.5149525910017, | |
| "count": 63415, | |
| "self": 1266.0507895819883, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 143.72092754401172, | |
| "count": 63415, | |
| "self": 4.353773891001765, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 139.36715365300995, | |
| "count": 62571, | |
| "self": 139.36715365300995 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.7432354650015895, | |
| "count": 63415, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2059.430335816015, | |
| "count": 63415, | |
| "is_parallel": true, | |
| "self": 900.7864853950146, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.006355205999966529, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00448609399995803, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0018691120000084993, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0018691120000084993 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.046859011000037754, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005552520000264849, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004497239999636804, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004497239999636804 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.04431933000000754, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.04431933000000754 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0015347050000400486, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003312390000473897, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.001203465999992659, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.001203465999992659 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1158.6438504210005, | |
| "count": 63414, | |
| "is_parallel": true, | |
| "self": 31.204137168012494, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 21.797103267958278, | |
| "count": 63414, | |
| "is_parallel": true, | |
| "self": 21.797103267958278 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1014.5155729170086, | |
| "count": 63414, | |
| "is_parallel": true, | |
| "self": 1014.5155729170086 | |
| }, | |
| "steps_from_proto": { | |
| "total": 91.12703706802108, | |
| "count": 63414, | |
| "is_parallel": true, | |
| "self": 17.963086770020368, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 73.16395029800071, | |
| "count": 507312, | |
| "is_parallel": true, | |
| "self": 73.16395029800071 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 647.1914407550277, | |
| "count": 63415, | |
| "self": 2.358597632058718, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 121.70408041196868, | |
| "count": 63415, | |
| "self": 121.42279381996866, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.28128659200001493, | |
| "count": 2, | |
| "self": 0.28128659200001493 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 523.1287627110003, | |
| "count": 443, | |
| "self": 290.450171928984, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 232.67859078201627, | |
| "count": 22788, | |
| "self": 232.67859078201627 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.0579997251625173e-06, | |
| "count": 1, | |
| "self": 1.0579997251625173e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.07973147000029712, | |
| "count": 1, | |
| "self": 0.0012926150006933312, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.07843885499960379, | |
| "count": 1, | |
| "self": 0.07843885499960379 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |