| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.5708699822425842, | |
| "min": 0.5708699822425842, | |
| "max": 1.5417309999465942, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 17144.3671875, | |
| "min": 17144.3671875, | |
| "max": 46769.953125, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989943.0, | |
| "min": 29952.0, | |
| "max": 989943.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989943.0, | |
| "min": 29952.0, | |
| "max": 989943.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.05284634977579117, | |
| "min": -0.09831222891807556, | |
| "max": 0.06268835067749023, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 12.894509315490723, | |
| "min": -23.693246841430664, | |
| "max": 15.233268737792969, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.0025327419862151146, | |
| "min": 0.0025327419862151146, | |
| "max": 0.18176408112049103, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 0.6179890632629395, | |
| "min": 0.6179890632629395, | |
| "max": 43.078086853027344, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.13629314735778095, | |
| "min": 0.1306943559024466, | |
| "max": 0.1492144265051077, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 2.0443972103667143, | |
| "min": 0.9850428738347232, | |
| "max": 2.0564164466948096, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.0037154096802173883, | |
| "min": 1.2028345910264857e-05, | |
| "max": 0.0038143186133076136, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.05573114520326083, | |
| "min": 0.00015636849683344314, | |
| "max": 0.05573114520326083, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.531077489673336e-06, | |
| "min": 7.531077489673336e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00011296616234510004, | |
| "min": 0.00011296616234510004, | |
| "max": 0.0033709783763406, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10251032666666668, | |
| "min": 0.10251032666666668, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.5376549000000002, | |
| "min": 1.3691136000000002, | |
| "max": 2.4236594000000005, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0002607816340000001, | |
| "min": 0.0002607816340000001, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0039117245100000015, | |
| "min": 0.0039117245100000015, | |
| "max": 0.11238357405999996, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.002305775647982955, | |
| "min": 0.002305775647982955, | |
| "max": 0.0496012307703495, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.03458663448691368, | |
| "min": 0.032689835876226425, | |
| "max": 0.3472086191177368, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 839.2222222222222, | |
| "min": 823.6969696969697, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 30212.0, | |
| "min": 15984.0, | |
| "max": 32758.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": -0.1174278271694978, | |
| "min": -1.0000000521540642, | |
| "max": -0.06450593208565432, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": -4.227401778101921, | |
| "min": -32.000001668930054, | |
| "max": -2.1932016909122467, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": -0.1174278271694978, | |
| "min": -1.0000000521540642, | |
| "max": -0.06450593208565432, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": -4.227401778101921, | |
| "min": -32.000001668930054, | |
| "max": -2.1932016909122467, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.02464868994179091, | |
| "min": 0.02464868994179091, | |
| "max": 3.899521377723431, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 0.8873528379044728, | |
| "min": 0.8586896556953434, | |
| "max": 62.3923420435749, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1739421261", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --force", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.6.0+cu124", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1739430259" | |
| }, | |
| "total": 8997.871636274002, | |
| "count": 1, | |
| "self": 0.6377635150020069, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.028000285000416625, | |
| "count": 1, | |
| "self": 0.028000285000416625 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 8997.205872473998, | |
| "count": 1, | |
| "self": 2.309451950031871, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 3.065918163999413, | |
| "count": 1, | |
| "self": 3.065918163999413 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 8991.746659109966, | |
| "count": 63166, | |
| "self": 2.6027346748669515, | |
| "children": { | |
| "env_step": { | |
| "total": 1785.149796195018, | |
| "count": 63166, | |
| "self": 1615.4986482201475, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 168.29640332503732, | |
| "count": 63166, | |
| "self": 7.068450350054263, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 161.22795297498305, | |
| "count": 62564, | |
| "self": 161.22795297498305 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 1.3547446498332647, | |
| "count": 63166, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 8990.315897837005, | |
| "count": 63166, | |
| "is_parallel": true, | |
| "self": 7547.556474579211, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.003094344000601268, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.000881360000676068, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0022129839999252, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0022129839999252 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.09327848900011304, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006488999997600331, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005738550007663434, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005738550007663434 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.09008829399954266, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.09008829399954266 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0019674400000440073, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00047225499838532414, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0014951850016586832, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0014951850016586832 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1442.759423257794, | |
| "count": 63165, | |
| "is_parallel": true, | |
| "self": 44.107836898750975, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 30.747484571862515, | |
| "count": 63165, | |
| "is_parallel": true, | |
| "self": 30.747484571862515 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1242.6184983570183, | |
| "count": 63165, | |
| "is_parallel": true, | |
| "self": 1242.6184983570183 | |
| }, | |
| "steps_from_proto": { | |
| "total": 125.28560343016215, | |
| "count": 63165, | |
| "is_parallel": true, | |
| "self": 27.168742916220253, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 98.1168605139419, | |
| "count": 505320, | |
| "is_parallel": true, | |
| "self": 98.1168605139419 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 7203.9941282400805, | |
| "count": 63166, | |
| "self": 4.602254039779837, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 163.6972787543, | |
| "count": 63166, | |
| "self": 163.48777815430003, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.20950059999995574, | |
| "count": 2, | |
| "self": 0.20950059999995574 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 7035.694595446001, | |
| "count": 439, | |
| "self": 2027.1261700761625, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 5008.568425369838, | |
| "count": 310530, | |
| "self": 5008.568425369838 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.1040010576834902e-06, | |
| "count": 1, | |
| "self": 1.1040010576834902e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.08384214599936968, | |
| "count": 1, | |
| "self": 0.003034474999367376, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.0808076710000023, | |
| "count": 1, | |
| "self": 0.0808076710000023 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |