| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.4969807267189026, | |
| "min": 0.42631274461746216, | |
| "max": 0.542986273765564, | |
| "count": 7 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 14694.7265625, | |
| "min": 873.0885009765625, | |
| "max": 16254.837890625, | |
| "count": 7 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 7 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 7 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989971.0, | |
| "min": 839959.0, | |
| "max": 989971.0, | |
| "count": 6 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989971.0, | |
| "min": 839959.0, | |
| "max": 989971.0, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.25633999705314636, | |
| "min": 0.0464077964425087, | |
| "max": 0.25633999705314636, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 65.36669921875, | |
| "min": 11.509133338928223, | |
| "max": 65.36669921875, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.007073692977428436, | |
| "min": 0.007073692977428436, | |
| "max": 0.015582084655761719, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 1.8037917613983154, | |
| "min": 1.8037917613983154, | |
| "max": 3.879939079284668, | |
| "count": 6 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06593973143865924, | |
| "min": 0.06584821953645563, | |
| "max": 0.0691815057926921, | |
| "count": 6 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9231562401412292, | |
| "min": 0.7901786344374676, | |
| "max": 1.0377225868903814, | |
| "count": 6 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.010510177725807996, | |
| "min": 0.006338277656357689, | |
| "max": 0.010510177725807996, | |
| "count": 6 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.14714248816131195, | |
| "min": 0.08873588718900766, | |
| "max": 0.14714248816131195, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 1.2788740299414286e-05, | |
| "min": 1.2788740299414286e-05, | |
| "max": 8.7043207591375e-05, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.0001790423641918, | |
| "min": 0.0001790423641918, | |
| "max": 0.0010873237825354998, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10255772857142857, | |
| "min": 0.10255772857142857, | |
| "max": 0.117408625, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4358082, | |
| "min": 1.4089035, | |
| "max": 1.7174645000000002, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00026551708428571437, | |
| "min": 0.00026551708428571437, | |
| "max": 0.0017491216375000007, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.003717239180000001, | |
| "min": 0.003717239180000001, | |
| "max": 0.021874703550000003, | |
| "count": 6 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.011271917261183262, | |
| "min": 0.01120806485414505, | |
| "max": 0.01225132867693901, | |
| "count": 6 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.15780684351921082, | |
| "min": 0.14701594412326813, | |
| "max": 0.18066348135471344, | |
| "count": 6 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 635.1132075471698, | |
| "min": 588.7083333333334, | |
| "max": 773.952380952381, | |
| "count": 6 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 33661.0, | |
| "min": 22501.0, | |
| "max": 33661.0, | |
| "count": 6 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 0.8746716693606017, | |
| "min": 0.32096186422166373, | |
| "max": 0.9086637983613826, | |
| "count": 6 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 46.35759847611189, | |
| "min": 13.480398297309875, | |
| "max": 46.35759847611189, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 0.8746716693606017, | |
| "min": 0.32096186422166373, | |
| "max": 0.9086637983613826, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 46.35759847611189, | |
| "min": 13.480398297309875, | |
| "max": 46.35759847611189, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.07392889281892974, | |
| "min": 0.06827661918167847, | |
| "max": 0.09641892619575151, | |
| "count": 6 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 3.918231319403276, | |
| "min": 2.90527749795001, | |
| "max": 4.049594900221564, | |
| "count": 6 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1706806088", | |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", | |
| "mlagents_version": "1.1.0.dev0", | |
| "mlagents_envs_version": "1.1.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.2.0+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1706806501" | |
| }, | |
| "total": 412.98999239900013, | |
| "count": 1, | |
| "self": 0.5277990220001811, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.045968931000061275, | |
| "count": 1, | |
| "self": 0.045968931000061275 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 412.4162244459999, | |
| "count": 1, | |
| "self": 0.25361718202157135, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.2507146850002755, | |
| "count": 1, | |
| "self": 2.2507146850002755 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 409.8228079509777, | |
| "count": 12149, | |
| "self": 0.26849173005894045, | |
| "children": { | |
| "env_step": { | |
| "total": 288.91952816193316, | |
| "count": 12149, | |
| "self": 264.12411645289967, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 24.64340950700489, | |
| "count": 12149, | |
| "self": 0.8946365079896168, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 23.748772999015273, | |
| "count": 11939, | |
| "self": 23.748772999015273 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.15200220202859782, | |
| "count": 12149, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 411.31628305100185, | |
| "count": 12149, | |
| "is_parallel": true, | |
| "self": 168.8024168019865, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.001999697999963246, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006718100003126892, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013278879996505566, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013278879996505566 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.057077552000009746, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006223160003173689, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005332819996510807, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005332819996510807 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.05407051500014859, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.05407051500014859 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0018514389998927072, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003821119989879662, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.001469327000904741, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.001469327000904741 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 242.51386624901534, | |
| "count": 12148, | |
| "is_parallel": true, | |
| "self": 6.68029840002373, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 4.86561667698561, | |
| "count": 12148, | |
| "is_parallel": true, | |
| "self": 4.86561667698561 | |
| }, | |
| "communicator.exchange": { | |
| "total": 211.74738936802714, | |
| "count": 12148, | |
| "is_parallel": true, | |
| "self": 211.74738936802714 | |
| }, | |
| "steps_from_proto": { | |
| "total": 19.220561803978853, | |
| "count": 12148, | |
| "is_parallel": true, | |
| "self": 3.8417280820990527, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 15.3788337218798, | |
| "count": 97184, | |
| "is_parallel": true, | |
| "self": 15.3788337218798 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 120.63478805898558, | |
| "count": 12149, | |
| "self": 0.5097322969668312, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 24.777226010020513, | |
| "count": 12149, | |
| "self": 24.661879365020468, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.1153466450000451, | |
| "count": 1, | |
| "self": 0.1153466450000451 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 95.34782975199823, | |
| "count": 88, | |
| "self": 55.45195364298252, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 39.89587610901572, | |
| "count": 4308, | |
| "self": 39.89587610901572 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.22000253922306e-07, | |
| "count": 1, | |
| "self": 9.22000253922306e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.0890837060001104, | |
| "count": 1, | |
| "self": 0.0023088230000212207, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.08677488300008918, | |
| "count": 1, | |
| "self": 0.08677488300008918 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |