| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.31334707140922546, | |
| "min": 0.30935412645339966, | |
| "max": 1.39408540725708, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 9385.37109375, | |
| "min": 9245.9765625, | |
| "max": 42290.9765625, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989998.0, | |
| "min": 29969.0, | |
| "max": 989998.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989998.0, | |
| "min": 29969.0, | |
| "max": 989998.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.5813647508621216, | |
| "min": -0.12382816523313522, | |
| "max": 0.6586253643035889, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 162.2007598876953, | |
| "min": -29.47110366821289, | |
| "max": 192.318603515625, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.0019777491688728333, | |
| "min": -0.009812026284635067, | |
| "max": 0.6466519236564636, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 0.5517920255661011, | |
| "min": -2.6590590476989746, | |
| "max": 153.9031524658203, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06847971635338015, | |
| "min": 0.06537009039350412, | |
| "max": 0.07386962259331205, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 1.0271957453007023, | |
| "min": 0.5909569807464964, | |
| "max": 1.092487700687557, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.014425657873115732, | |
| "min": 0.00026462271859441374, | |
| "max": 0.018428373553130463, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.216384868096736, | |
| "min": 0.0029108499045385513, | |
| "max": 0.2579972297438265, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.504977498373329e-06, | |
| "min": 7.504977498373329e-06, | |
| "max": 0.00029501025166325, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00011257466247559994, | |
| "min": 0.00011257466247559994, | |
| "max": 0.0035071697309435, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10250162666666666, | |
| "min": 0.10250162666666666, | |
| "max": 0.19833675, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.5375244, | |
| "min": 1.4779451, | |
| "max": 2.5727063999999995, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00025991250399999994, | |
| "min": 0.00025991250399999994, | |
| "max": 0.009833841325, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.003898687559999999, | |
| "min": 0.003898687559999999, | |
| "max": 0.11692874434999999, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.015914293006062508, | |
| "min": 0.015914293006062508, | |
| "max": 0.4476422071456909, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.23871439695358276, | |
| "min": 0.2271513044834137, | |
| "max": 3.5811376571655273, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 306.2083333333333, | |
| "min": 282.0740740740741, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29396.0, | |
| "min": 16128.0, | |
| "max": 32802.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.652108315533648, | |
| "min": -0.9999625524505973, | |
| "max": 1.6993999867527574, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 158.6023982912302, | |
| "min": -31.998801678419113, | |
| "max": 183.5351985692978, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.652108315533648, | |
| "min": -0.9999625524505973, | |
| "max": 1.6993999867527574, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 158.6023982912302, | |
| "min": -31.998801678419113, | |
| "max": 183.5351985692978, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.051195131506877566, | |
| "min": 0.04807348390830965, | |
| "max": 8.44656971447608, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 4.914732624660246, | |
| "min": 4.721565438841935, | |
| "max": 143.59168514609337, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1685092403", | |
| "python_version": "3.10.11 (main, Apr 5 2023, 14:15:10) [GCC 9.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "0.31.0.dev0", | |
| "mlagents_envs_version": "0.31.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "1.11.0+cu102", | |
| "numpy_version": "1.21.2", | |
| "end_time_seconds": "1685094654" | |
| }, | |
| "total": 2250.111906167999, | |
| "count": 1, | |
| "self": 0.4742552079987945, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0368981880001229, | |
| "count": 1, | |
| "self": 0.0368981880001229 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2249.6007527720003, | |
| "count": 1, | |
| "self": 1.4274300211282025, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 4.282503080999959, | |
| "count": 1, | |
| "self": 4.282503080999959 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2243.7998358968716, | |
| "count": 64046, | |
| "self": 1.4643321889489016, | |
| "children": { | |
| "env_step": { | |
| "total": 1587.2225887509248, | |
| "count": 64046, | |
| "self": 1471.5691050439818, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 114.78610137293526, | |
| "count": 64046, | |
| "self": 5.183988015075556, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 109.60211335785971, | |
| "count": 62571, | |
| "self": 109.60211335785971 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.8673823340077433, | |
| "count": 64046, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2243.9662676449434, | |
| "count": 64046, | |
| "is_parallel": true, | |
| "self": 894.6123245579674, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0019796659998974064, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.000650848999612208, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013288170002851984, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013288170002851984 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.09669417300028726, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.000580125999476877, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005716140003642067, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005716140003642067 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.09357961499972589, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.09357961499972589 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.00196281800072029, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00040389799869444687, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0015589200020258431, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0015589200020258431 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1349.353943086976, | |
| "count": 64045, | |
| "is_parallel": true, | |
| "self": 32.37307871989924, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 25.458546876033324, | |
| "count": 64045, | |
| "is_parallel": true, | |
| "self": 25.458546876033324 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1186.4374435568798, | |
| "count": 64045, | |
| "is_parallel": true, | |
| "self": 1186.4374435568798 | |
| }, | |
| "steps_from_proto": { | |
| "total": 105.08487393416362, | |
| "count": 64045, | |
| "is_parallel": true, | |
| "self": 21.895063486982508, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 83.18981044718112, | |
| "count": 512360, | |
| "is_parallel": true, | |
| "self": 83.18981044718112 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 655.1129149569979, | |
| "count": 64046, | |
| "self": 2.784611811081959, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 115.83891026491801, | |
| "count": 64046, | |
| "self": 115.62544336891824, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.21346689599977253, | |
| "count": 2, | |
| "self": 0.21346689599977253 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 536.4893928809979, | |
| "count": 453, | |
| "self": 350.5962974689983, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 185.89309541199964, | |
| "count": 22785, | |
| "self": 185.89309541199964 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.479999789618887e-07, | |
| "count": 1, | |
| "self": 9.479999789618887e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.09098282500053756, | |
| "count": 1, | |
| "self": 0.0012675340003625024, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.08971529100017506, | |
| "count": 1, | |
| "self": 0.08971529100017506 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |