{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.31657862663269043, "min": 0.31657862663269043, "max": 1.4554413557052612, "count": 33 }, "Pyramids.Policy.Entropy.sum": { "value": 9477.09765625, "min": 9477.09765625, "max": 44152.26953125, "count": 33 }, "Pyramids.Step.mean": { "value": 989980.0, "min": 29952.0, "max": 989980.0, "count": 33 }, "Pyramids.Step.sum": { "value": 989980.0, "min": 29952.0, "max": 989980.0, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.6274967193603516, "min": -0.11481665819883347, "max": 0.6775597333908081, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 176.3265838623047, "min": -27.670814514160156, "max": 193.6967010498047, "count": 33 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.007007249165326357, "min": 0.0015687725972384214, "max": 0.2707160711288452, "count": 33 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 1.9690370559692383, "min": 0.3968994617462158, "max": 64.97185516357422, "count": 33 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06876534378738904, "min": 0.0638591812139133, "max": 0.07539782882806667, "count": 33 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 1.0314801568108356, "min": 0.4858075592386865, "max": 1.0861022743920332, "count": 33 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.015090243930276331, "min": 0.0014578654519899834, "max": 0.01636559136651446, "count": 33 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.22635365895414497, "min": 0.014578654519899835, "max": 0.23666382780841863, "count": 33 }, "Pyramids.Policy.LearningRate.mean": { "value": 7.471197509633331e-06, "min": 7.471197509633331e-06, "max": 0.00029515063018788575, "count": 33 }, "Pyramids.Policy.LearningRate.sum": { "value": 0.00011206796264449996, "min": 0.00011206796264449996, "max": 0.003633119888960099, "count": 33 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10249036666666664, "min": 0.10249036666666664, "max": 0.19838354285714285, "count": 33 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.5373554999999997, "min": 1.3886848, "max": 2.6177872000000004, "count": 33 }, "Pyramids.Policy.Beta.mean": { "value": 0.00025878762999999994, "min": 0.00025878762999999994, "max": 0.00983851593142857, "count": 33 }, "Pyramids.Policy.Beta.sum": { "value": 0.003881814449999999, "min": 0.003881814449999999, "max": 0.12112288601000001, "count": 33 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.013059018179774284, "min": 0.013059018179774284, "max": 0.3602496087551117, "count": 33 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.19588527083396912, "min": 0.18780364096164703, "max": 2.521747350692749, "count": 33 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 294.9072164948454, "min": 273.9259259259259, "max": 999.0, "count": 33 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 28606.0, "min": 15984.0, "max": 33199.0, "count": 33 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.6638412233634092, "min": -1.0000000521540642, "max": 1.7112599892914295, "count": 33 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 161.3925986662507, "min": -30.58620174229145, "max": 184.41499803215265, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.6638412233634092, "min": -1.0000000521540642, "max": 1.7112599892914295, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 161.3925986662507, "min": -30.58620174229145, "max": 184.41499803215265, "count": 33 }, "Pyramids.Policy.RndReward.mean": { "value": 0.03977758732813977, "min": 0.038694411753331895, "max": 5.93458700645715, "count": 33 }, "Pyramids.Policy.RndReward.sum": { "value": 3.8584259708295576, "min": 3.8584259708295576, "max": 94.9533921033144, "count": 33 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1707503277", "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids_Training_2 --no-graphics", "mlagents_version": "1.1.0.dev0", "mlagents_envs_version": "1.1.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.2.0+cu121", "numpy_version": "1.23.5", "end_time_seconds": "1707505522" }, "total": 2245.319947405, "count": 1, "self": 0.5272818630000984, "children": { "run_training.setup": { "total": 0.045931434000067384, "count": 1, "self": 0.045931434000067384 }, "TrainerController.start_learning": { "total": 2244.746734108, "count": 1, "self": 1.3551528949469684, "children": { "TrainerController._reset_env": { "total": 2.591978273999757, "count": 1, "self": 2.591978273999757 }, "TrainerController.advance": { "total": 2240.715435246053, "count": 64307, "self": 1.3556013230345343, "children": { "env_step": { "total": 1622.8087104969645, "count": 64307, "self": 1495.0211759589215, "children": { "SubprocessEnvManager._take_step": { "total": 126.96520265190884, "count": 64307, "self": 4.483194459915467, "children": { "TorchPolicy.evaluate": { "total": 122.48200819199337, "count": 62551, "self": 122.48200819199337 } } }, "workers": { "total": 0.8223318861341795, "count": 64307, "self": 0.0, "children": { "worker_root": { "total": 2239.8021957169412, "count": 64307, "is_parallel": true, "self": 856.1966301607363, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.002120863000072859, "count": 1, "is_parallel": true, "self": 0.0007098269993548456, "children": { "_process_rank_one_or_two_observation": { "total": 0.0014110360007180134, "count": 8, "is_parallel": true, "self": 0.0014110360007180134 } } }, "UnityEnvironment.step": { "total": 0.07481945000017731, "count": 1, "is_parallel": true, "self": 0.0005770530005975161, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00048371000002589426, "count": 1, "is_parallel": true, "self": 0.00048371000002589426 }, "communicator.exchange": { "total": 0.07214259699958347, "count": 1, "is_parallel": true, "self": 0.07214259699958347 }, "steps_from_proto": { "total": 0.001616089999970427, "count": 1, "is_parallel": true, "self": 0.0003722429996741994, "children": { "_process_rank_one_or_two_observation": { "total": 0.0012438470002962276, "count": 8, "is_parallel": true, "self": 0.0012438470002962276 } } } } } } }, "UnityEnvironment.step": { "total": 1383.605565556205, "count": 64306, "is_parallel": true, "self": 34.697032933224364, "children": { "UnityEnvironment._generate_step_input": { "total": 23.583619527958035, "count": 64306, "is_parallel": true, "self": 23.583619527958035 }, "communicator.exchange": { "total": 1228.2680790799955, "count": 64306, "is_parallel": true, "self": 1228.2680790799955 }, "steps_from_proto": { "total": 97.0568340150271, "count": 64306, "is_parallel": true, "self": 18.96307213379896, "children": { "_process_rank_one_or_two_observation": { "total": 78.09376188122815, "count": 514448, "is_parallel": true, "self": 78.09376188122815 } } } } } } } } } } }, "trainer_advance": { "total": 616.5511234260539, "count": 64307, "self": 2.6369264381287394, "children": { "process_trajectory": { "total": 123.49490136293343, "count": 64307, "self": 123.29177375393328, "children": { "RLTrainer._checkpoint": { "total": 0.20312760900014837, "count": 2, "self": 0.20312760900014837 } } }, "_update_policy": { "total": 490.4192956249917, "count": 451, "self": 285.5619166979768, "children": { "TorchPPOOptimizer.update": { "total": 204.8573789270149, "count": 22755, "self": 204.8573789270149 } } } } } } }, "trainer_threads": { "total": 9.55000359681435e-07, "count": 1, "self": 9.55000359681435e-07 }, "TrainerController._save_models": { "total": 0.08416673800002172, "count": 1, "self": 0.0013754459996562218, "children": { "RLTrainer._checkpoint": { "total": 0.0827912920003655, "count": 1, "self": 0.0827912920003655 } } } } } } }