Jenny22255's picture
First Push
658d286 verified
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.13997095823287964,
"min": 0.13515740633010864,
"max": 1.5335098505020142,
"count": 100
},
"Pyramids.Policy.Entropy.sum": {
"value": 4185.69140625,
"min": 4050.397216796875,
"max": 46520.5546875,
"count": 100
},
"Pyramids.Step.mean": {
"value": 2999951.0,
"min": 29974.0,
"max": 2999951.0,
"count": 100
},
"Pyramids.Step.sum": {
"value": 2999951.0,
"min": 29974.0,
"max": 2999951.0,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.8112826347351074,
"min": -0.10546746850013733,
"max": 0.8812189102172852,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 245.81863403320312,
"min": -25.417659759521484,
"max": 273.1778564453125,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.013699229806661606,
"min": -0.005644344259053469,
"max": 0.1852613240480423,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 4.150866508483887,
"min": -1.66508150100708,
"max": 44.647979736328125,
"count": 100
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.07026074094063092,
"min": 0.06211566593746149,
"max": 0.07511671141892497,
"count": 100
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.983650373168833,
"min": 0.5947844996523509,
"max": 1.121613116217001,
"count": 100
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.015531344338640094,
"min": 0.0005532349624091268,
"max": 0.01795476450795485,
"count": 100
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.21743882074096132,
"min": 0.007192054511318649,
"max": 0.2513667031113679,
"count": 100
},
"Pyramids.Policy.LearningRate.mean": {
"value": 1.4412923767452392e-06,
"min": 1.4412923767452392e-06,
"max": 0.00029828397557200837,
"count": 100
},
"Pyramids.Policy.LearningRate.sum": {
"value": 2.017809327443335e-05,
"min": 2.017809327443335e-05,
"max": 0.004010949563016833,
"count": 100
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.1004803976190476,
"min": 0.1004803976190476,
"max": 0.19942799166666667,
"count": 100
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4067255666666665,
"min": 1.4067255666666665,
"max": 2.7975145666666674,
"count": 100
},
"Pyramids.Policy.Beta.mean": {
"value": 5.799172214285719e-05,
"min": 5.799172214285719e-05,
"max": 0.009942856367499999,
"count": 100
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0008118841100000007,
"min": 0.0008118841100000007,
"max": 0.13370461835,
"count": 100
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.005496342666447163,
"min": 0.005496342666447163,
"max": 0.3608822226524353,
"count": 100
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.07694879919290543,
"min": 0.07694879919290543,
"max": 2.8870577812194824,
"count": 100
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 231.5859375,
"min": 202.80141843971631,
"max": 995.53125,
"count": 100
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29643.0,
"min": 16261.0,
"max": 33373.0,
"count": 100
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7212968617677689,
"min": -0.9337813011370599,
"max": 1.7942777725143566,
"count": 100
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 220.3259983062744,
"min": -29.881001636385918,
"max": 268.265997633338,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7212968617677689,
"min": -0.9337813011370599,
"max": 1.7942777725143566,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 220.3259983062744,
"min": -29.881001636385918,
"max": 268.265997633338,
"count": 100
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.013274244590974149,
"min": 0.012789758633581116,
"max": 7.566931799054146,
"count": 100
},
"Pyramids.Policy.RndReward.sum": {
"value": 1.699103307644691,
"min": 1.699103307644691,
"max": 128.63784058392048,
"count": 100
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1743247210",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.6.0+cu124",
"numpy_version": "1.23.5",
"end_time_seconds": "1743254608"
},
"total": 7398.44707014,
"count": 1,
"self": 0.5312970799986942,
"children": {
"run_training.setup": {
"total": 0.019611703000009584,
"count": 1,
"self": 0.019611703000009584
},
"TrainerController.start_learning": {
"total": 7397.896161357001,
"count": 1,
"self": 4.140634342924386,
"children": {
"TrainerController._reset_env": {
"total": 2.100141836000148,
"count": 1,
"self": 2.100141836000148
},
"TrainerController.advance": {
"total": 7391.564862175074,
"count": 195415,
"self": 4.192528928921092,
"children": {
"env_step": {
"total": 5349.433735135832,
"count": 195415,
"self": 4883.7247261575485,
"children": {
"SubprocessEnvManager._take_step": {
"total": 463.29011357131367,
"count": 195415,
"self": 13.96375521139953,
"children": {
"TorchPolicy.evaluate": {
"total": 449.32635835991414,
"count": 187555,
"self": 449.32635835991414
}
}
},
"workers": {
"total": 2.4188954069691135,
"count": 195415,
"self": 0.0,
"children": {
"worker_root": {
"total": 7382.397145986948,
"count": 195415,
"is_parallel": true,
"self": 2843.0253636796224,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0021031010001024697,
"count": 1,
"is_parallel": true,
"self": 0.0006904639999447681,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014126370001577016,
"count": 8,
"is_parallel": true,
"self": 0.0014126370001577016
}
}
},
"UnityEnvironment.step": {
"total": 0.04908028700037903,
"count": 1,
"is_parallel": true,
"self": 0.0005147440001564973,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004972369997631176,
"count": 1,
"is_parallel": true,
"self": 0.0004972369997631176
},
"communicator.exchange": {
"total": 0.04638279300024806,
"count": 1,
"is_parallel": true,
"self": 0.04638279300024806
},
"steps_from_proto": {
"total": 0.0016855130002113583,
"count": 1,
"is_parallel": true,
"self": 0.00035757500108957174,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013279379991217866,
"count": 8,
"is_parallel": true,
"self": 0.0013279379991217866
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 4539.371782307326,
"count": 195414,
"is_parallel": true,
"self": 95.84744425767713,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 70.715368155139,
"count": 195414,
"is_parallel": true,
"self": 70.715368155139
},
"communicator.exchange": {
"total": 4080.673982500776,
"count": 195414,
"is_parallel": true,
"self": 4080.673982500776
},
"steps_from_proto": {
"total": 292.13498739373335,
"count": 195414,
"is_parallel": true,
"self": 59.96355395639603,
"children": {
"_process_rank_one_or_two_observation": {
"total": 232.17143343733733,
"count": 1563312,
"is_parallel": true,
"self": 232.17143343733733
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2037.9385981103214,
"count": 195415,
"self": 8.572907293308617,
"children": {
"process_trajectory": {
"total": 395.5845103520005,
"count": 195415,
"self": 394.9405266760009,
"children": {
"RLTrainer._checkpoint": {
"total": 0.6439836759996069,
"count": 6,
"self": 0.6439836759996069
}
}
},
"_update_policy": {
"total": 1633.7811804650123,
"count": 1401,
"self": 891.1595728188636,
"children": {
"TorchPPOOptimizer.update": {
"total": 742.6216076461487,
"count": 68421,
"self": 742.6216076461487
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.750012057134882e-07,
"count": 1,
"self": 8.750012057134882e-07
},
"TrainerController._save_models": {
"total": 0.09052212800088455,
"count": 1,
"self": 0.001743404001899762,
"children": {
"RLTrainer._checkpoint": {
"total": 0.08877872399898479,
"count": 1,
"self": 0.08877872399898479
}
}
}
}
}
}
}