| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.4165646731853485, | |
| "min": 0.40163546800613403, | |
| "max": 1.4806667566299438, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 12223.673828125, | |
| "min": 12132.6044921875, | |
| "max": 44917.5078125, | |
| "count": 52 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 1559875.0, | |
| "min": 29952.0, | |
| "max": 1559875.0, | |
| "count": 52 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 1559875.0, | |
| "min": 29952.0, | |
| "max": 1559875.0, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.5290877223014832, | |
| "min": -0.11454473435878754, | |
| "max": 0.5587700605392456, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 144.97003173828125, | |
| "min": -27.49073600769043, | |
| "max": 152.54421997070312, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": -0.006103459279984236, | |
| "min": -0.0251805130392313, | |
| "max": 0.25557011365890503, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": -1.672347903251648, | |
| "min": -6.723196983337402, | |
| "max": 61.336830139160156, | |
| "count": 52 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06869723334999302, | |
| "min": 0.06460764174421672, | |
| "max": 0.0727808943636835, | |
| "count": 52 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9617612668999023, | |
| "min": 0.47909215814434, | |
| "max": 1.0839812987844697, | |
| "count": 52 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.012419828267047196, | |
| "min": 9.521335650952962e-05, | |
| "max": 0.012419828267047196, | |
| "count": 52 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.17387759573866074, | |
| "min": 0.001237773634623885, | |
| "max": 0.17387759573866074, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 0.00014549720864380475, | |
| "min": 0.00014549720864380475, | |
| "max": 0.00029838354339596195, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.0020369609210132665, | |
| "min": 0.002027104024298666, | |
| "max": 0.0037594509468497324, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.1484990523809524, | |
| "min": 0.1484990523809524, | |
| "max": 0.19946118095238097, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 2.0789867333333336, | |
| "min": 1.3757013333333334, | |
| "max": 2.6531502666666675, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0048550553328571425, | |
| "min": 0.0048550553328571425, | |
| "max": 0.009946171977142856, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.06797077466, | |
| "min": 0.06757256319999999, | |
| "max": 0.12532971164, | |
| "count": 52 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.004804596770554781, | |
| "min": 0.00433261226862669, | |
| "max": 0.3447306454181671, | |
| "count": 52 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.06726435571908951, | |
| "min": 0.06065656989812851, | |
| "max": 2.413114547729492, | |
| "count": 52 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 377.07894736842104, | |
| "min": 345.23809523809524, | |
| "max": 999.0, | |
| "count": 52 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 28658.0, | |
| "min": 15984.0, | |
| "max": 33896.0, | |
| "count": 52 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.5176262921212536, | |
| "min": -1.0000000521540642, | |
| "max": 1.5833095061991895, | |
| "count": 52 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 115.33959820121527, | |
| "min": -32.000001668930054, | |
| "max": 132.99799852073193, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.5176262921212536, | |
| "min": -1.0000000521540642, | |
| "max": 1.5833095061991895, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 115.33959820121527, | |
| "min": -32.000001668930054, | |
| "max": 132.99799852073193, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.018644611067812594, | |
| "min": 0.01617049040162653, | |
| "max": 6.940789316780865, | |
| "count": 52 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 1.4169904411537573, | |
| "min": 1.3122262909600977, | |
| "max": 111.05262906849384, | |
| "count": 52 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 52 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 52 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1736165049", | |
| "python_version": "3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=PyramidsTraining --no-graphics --force", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.5.1+cu121", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1736168427" | |
| }, | |
| "total": 3378.282926876, | |
| "count": 1, | |
| "self": 0.3825557620007203, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.07782670900007815, | |
| "count": 1, | |
| "self": 0.07782670900007815 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 3377.8225444049995, | |
| "count": 1, | |
| "self": 1.9590828259451882, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 5.535551100000021, | |
| "count": 1, | |
| "self": 5.535551100000021 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 3370.1835454630545, | |
| "count": 100233, | |
| "self": 2.102668974996959, | |
| "children": { | |
| "env_step": { | |
| "total": 2278.0289274559677, | |
| "count": 100233, | |
| "self": 2056.4789919720215, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 220.37158759004126, | |
| "count": 100233, | |
| "self": 6.804709509081363, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 213.5668780809599, | |
| "count": 98685, | |
| "self": 213.5668780809599 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 1.1783478939048564, | |
| "count": 100232, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 3370.7720719059885, | |
| "count": 100232, | |
| "is_parallel": true, | |
| "self": 1487.4161913319726, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.003491411000027256, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0009558240001297236, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0025355869998975322, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0025355869998975322 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.047565000999952645, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006084649999138492, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004494990000694088, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004494990000694088 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.04488320100006149, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.04488320100006149 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0016238359999078966, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003395269998236472, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012843090000842494, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012843090000842494 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1883.3558805740158, | |
| "count": 100231, | |
| "is_parallel": true, | |
| "self": 51.207851367937565, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 35.77328111900772, | |
| "count": 100231, | |
| "is_parallel": true, | |
| "self": 35.77328111900772 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1647.3357374390148, | |
| "count": 100231, | |
| "is_parallel": true, | |
| "self": 1647.3357374390148 | |
| }, | |
| "steps_from_proto": { | |
| "total": 149.03901064805586, | |
| "count": 100231, | |
| "is_parallel": true, | |
| "self": 29.171997597124346, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 119.86701305093152, | |
| "count": 801848, | |
| "is_parallel": true, | |
| "self": 119.86701305093152 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 1090.0519490320899, | |
| "count": 100232, | |
| "self": 3.579410602092821, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 204.11210338300464, | |
| "count": 100232, | |
| "self": 203.741378542005, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.3707248409996282, | |
| "count": 3, | |
| "self": 0.3707248409996282 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 882.3604350469924, | |
| "count": 698, | |
| "self": 496.85726357902286, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 385.50317146796954, | |
| "count": 36093, | |
| "self": 385.50317146796954 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.6379999578930438e-06, | |
| "count": 1, | |
| "self": 1.6379999578930438e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.14436337799998, | |
| "count": 1, | |
| "self": 0.002059250999991491, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.1423041269999885, | |
| "count": 1, | |
| "self": 0.1423041269999885 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |