| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.30174532532691956, | |
| "min": 0.30111098289489746, | |
| "max": 1.4569752216339111, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 9177.8857421875, | |
| "min": 8893.6142578125, | |
| "max": 44198.80078125, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989907.0, | |
| "min": 29952.0, | |
| "max": 989907.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989907.0, | |
| "min": 29952.0, | |
| "max": 989907.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.485789030790329, | |
| "min": -0.11082945764064789, | |
| "max": 0.5344838500022888, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 133.59197998046875, | |
| "min": -26.70989990234375, | |
| "max": 144.31063842773438, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.06109166890382767, | |
| "min": -0.016629774123430252, | |
| "max": 0.3125622868537903, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 16.800209045410156, | |
| "min": -4.523298740386963, | |
| "max": 75.3275146484375, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.07247156131192807, | |
| "min": 0.0639174328909056, | |
| "max": 0.07273752634566755, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 1.014601858366993, | |
| "min": 0.48495898766047724, | |
| "max": 1.0463508848333731, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.01701817784322418, | |
| "min": 0.0007437264070160322, | |
| "max": 0.01701817784322418, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.23825448980513853, | |
| "min": 0.008924716884192387, | |
| "max": 0.23825448980513853, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.333490412678569e-06, | |
| "min": 7.333490412678569e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00010266886577749996, | |
| "min": 0.00010266886577749996, | |
| "max": 0.0032589569136811, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10244446428571428, | |
| "min": 0.10244446428571428, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4342225, | |
| "min": 1.3886848, | |
| "max": 2.3863189, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0002542019821428571, | |
| "min": 0.0002542019821428571, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.003558827749999999, | |
| "min": 0.003558827749999999, | |
| "max": 0.10865325811000001, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.011915902607142925, | |
| "min": 0.011915902607142925, | |
| "max": 0.41923269629478455, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.1668226420879364, | |
| "min": 0.1668226420879364, | |
| "max": 2.934628963470459, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 394.9875, | |
| "min": 361.58620689655174, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 31599.0, | |
| "min": 15984.0, | |
| "max": 33810.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.4299374838359653, | |
| "min": -1.0000000521540642, | |
| "max": 1.5665973110993703, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 114.39499870687723, | |
| "min": -30.604801654815674, | |
| "max": 134.53999774158, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.4299374838359653, | |
| "min": -1.0000000521540642, | |
| "max": 1.5665973110993703, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 114.39499870687723, | |
| "min": -30.604801654815674, | |
| "max": 134.53999774158, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.04875061192142312, | |
| "min": 0.04630890977928231, | |
| "max": 8.244974036701024, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 3.900048953713849, | |
| "min": 3.662518389726756, | |
| "max": 131.91958458721638, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1739874870", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.6.0+cu124", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1739877141" | |
| }, | |
| "total": 2270.917346591, | |
| "count": 1, | |
| "self": 0.5317507879994992, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.020596433999799046, | |
| "count": 1, | |
| "self": 0.020596433999799046 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2270.3649993690005, | |
| "count": 1, | |
| "self": 1.4216132280434977, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.1535198769997805, | |
| "count": 1, | |
| "self": 2.1535198769997805 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2266.697146882958, | |
| "count": 63715, | |
| "self": 1.4656953820572198, | |
| "children": { | |
| "env_step": { | |
| "total": 1584.6988095608945, | |
| "count": 63715, | |
| "self": 1424.0284235659528, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 159.81959405201223, | |
| "count": 63715, | |
| "self": 4.82011118288392, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 154.99948286912831, | |
| "count": 62558, | |
| "self": 154.99948286912831 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.8507919429293906, | |
| "count": 63715, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2265.141849779913, | |
| "count": 63715, | |
| "is_parallel": true, | |
| "self": 957.9124650790386, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0021050399996056512, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0007095929986462579, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013954470009593933, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013954470009593933 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.04745150000007925, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005292370005918201, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004973239997525525, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004973239997525525 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.04471848499997577, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.04471848499997577 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0017064539997591055, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00037717499890277395, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013292790008563315, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013292790008563315 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1307.2293847008746, | |
| "count": 63714, | |
| "is_parallel": true, | |
| "self": 32.143628979924415, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 24.11649713707584, | |
| "count": 63714, | |
| "is_parallel": true, | |
| "self": 24.11649713707584 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1150.885577916907, | |
| "count": 63714, | |
| "is_parallel": true, | |
| "self": 1150.885577916907 | |
| }, | |
| "steps_from_proto": { | |
| "total": 100.08368066696721, | |
| "count": 63714, | |
| "is_parallel": true, | |
| "self": 20.654079620931498, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 79.42960104603571, | |
| "count": 509712, | |
| "is_parallel": true, | |
| "self": 79.42960104603571 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 680.5326419400062, | |
| "count": 63715, | |
| "self": 2.6487831570852904, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 130.1719660099343, | |
| "count": 63715, | |
| "self": 129.91227057293418, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.25969543700011855, | |
| "count": 2, | |
| "self": 0.25969543700011855 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 547.7118927729866, | |
| "count": 444, | |
| "self": 300.1547657120068, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 247.55712706097984, | |
| "count": 22833, | |
| "self": 247.55712706097984 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.28000190469902e-07, | |
| "count": 1, | |
| "self": 9.28000190469902e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.09271845299917914, | |
| "count": 1, | |
| "self": 0.0014304439991974505, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.09128800899998168, | |
| "count": 1, | |
| "self": 0.09128800899998168 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |