| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.12553852796554565, | |
| "min": 0.11824634671211243, | |
| "max": 1.4317291975021362, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 3772.181640625, | |
| "min": 3494.416015625, | |
| "max": 43432.9375, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 2999950.0, | |
| "min": 29936.0, | |
| "max": 2999950.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 2999950.0, | |
| "min": 29936.0, | |
| "max": 2999950.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.8255670070648193, | |
| "min": -0.1056881994009018, | |
| "max": 0.8739468455314636, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 244.36782836914062, | |
| "min": -25.36516761779785, | |
| "max": 267.7449645996094, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.006503860000520945, | |
| "min": -0.007723746355623007, | |
| "max": 0.25734537839889526, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 1.925142526626587, | |
| "min": -2.32484769821167, | |
| "max": 61.24820327758789, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06850176529994877, | |
| "min": 0.06402704119857316, | |
| "max": 0.07390006545572489, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9590247141992827, | |
| "min": 0.5912005236457991, | |
| "max": 1.086389510737111, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.0127631435877577, | |
| "min": 0.00021577098309802402, | |
| "max": 0.015772829781700342, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.1786840102286078, | |
| "min": 0.0025892517971762884, | |
| "max": 0.2365924467255051, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 1.511928067485715e-06, | |
| "min": 1.511928067485715e-06, | |
| "max": 0.0002982555005815, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 2.116699294480001e-05, | |
| "min": 2.116699294480001e-05, | |
| "max": 0.0040273597575468, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10050394285714284, | |
| "min": 0.10050394285714284, | |
| "max": 0.19941850000000003, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4070551999999998, | |
| "min": 1.4070551999999998, | |
| "max": 2.8424532000000005, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 6.034389142857146e-05, | |
| "min": 6.034389142857146e-05, | |
| "max": 0.00994190815, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0008448144800000005, | |
| "min": 0.0008448144800000005, | |
| "max": 0.13426107467999998, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.006635910831391811, | |
| "min": 0.006482395809143782, | |
| "max": 0.35374540090560913, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.09290274977684021, | |
| "min": 0.09075354039669037, | |
| "max": 2.829963207244873, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 234.3875968992248, | |
| "min": 204.9496402877698, | |
| "max": 999.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 30236.0, | |
| "min": 17374.0, | |
| "max": 32363.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.686531237559393, | |
| "min": -0.9999548913009705, | |
| "max": 1.7897655008168056, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 215.8759984076023, | |
| "min": -30.998601630330086, | |
| "max": 262.6509977579117, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.686531237559393, | |
| "min": -0.9999548913009705, | |
| "max": 1.7897655008168056, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 215.8759984076023, | |
| "min": -30.998601630330086, | |
| "max": 262.6509977579117, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.01615269563626498, | |
| "min": 0.015062907016595248, | |
| "max": 6.780477455920643, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 2.0675450414419174, | |
| "min": 1.9996734989690594, | |
| "max": 122.04859420657158, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1763807741", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.8.0+cu128", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1763814852" | |
| }, | |
| "total": 7110.628740669, | |
| "count": 1, | |
| "self": 0.4781213249989378, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.024683900000127323, | |
| "count": 1, | |
| "self": 0.024683900000127323 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 7110.125935444001, | |
| "count": 1, | |
| "self": 4.128506202121571, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.129107746000045, | |
| "count": 1, | |
| "self": 2.129107746000045 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 7103.791995125878, | |
| "count": 195338, | |
| "self": 4.225939400385869, | |
| "children": { | |
| "env_step": { | |
| "total": 5134.34242768532, | |
| "count": 195338, | |
| "self": 4701.639765515445, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 430.2864781819321, | |
| "count": 195338, | |
| "self": 13.385923708935024, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 416.9005544729971, | |
| "count": 187559, | |
| "self": 416.9005544729971 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 2.4161839879425315, | |
| "count": 195338, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 7090.553305423986, | |
| "count": 195338, | |
| "is_parallel": true, | |
| "self": 2729.4876868156, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0018687289998524648, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005384839996622759, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013302450001901889, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013302450001901889 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.05043522300002223, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005382559997997305, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004357020002316858, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004357020002316858 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.047882385999855615, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.047882385999855615 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0015788790001352027, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00032912900041992543, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012497499997152772, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012497499997152772 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 4361.065618608386, | |
| "count": 195337, | |
| "is_parallel": true, | |
| "self": 98.42024283779938, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 65.98915173519481, | |
| "count": 195337, | |
| "is_parallel": true, | |
| "self": 65.98915173519481 | |
| }, | |
| "communicator.exchange": { | |
| "total": 3890.9488635243956, | |
| "count": 195337, | |
| "is_parallel": true, | |
| "self": 3890.9488635243956 | |
| }, | |
| "steps_from_proto": { | |
| "total": 305.7073605109963, | |
| "count": 195337, | |
| "is_parallel": true, | |
| "self": 63.33539562973874, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 242.37196488125755, | |
| "count": 1562696, | |
| "is_parallel": true, | |
| "self": 242.37196488125755 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 1965.2236280401721, | |
| "count": 195338, | |
| "self": 8.071110169227723, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 369.82641224293957, | |
| "count": 195338, | |
| "self": 369.2383903789387, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.5880218640008934, | |
| "count": 6, | |
| "self": 0.5880218640008934 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 1587.3261056280048, | |
| "count": 1400, | |
| "self": 878.8522808369398, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 708.473824791065, | |
| "count": 68394, | |
| "self": 708.473824791065 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.86001396086067e-07, | |
| "count": 1, | |
| "self": 9.86001396086067e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.07632538399957411, | |
| "count": 1, | |
| "self": 0.0010348949999752222, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.07529048899959889, | |
| "count": 1, | |
| "self": 0.07529048899959889 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |