Pyramids / run_logs /timers.json
Icarus013's picture
First push
5ca6bb6 verified
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.9925450086593628,
"min": 0.9847832918167114,
"max": 1.466425895690918,
"count": 5
},
"Pyramids.Policy.Entropy.sum": {
"value": 30316.294921875,
"min": 29496.228515625,
"max": 44485.49609375,
"count": 5
},
"Pyramids.Step.mean": {
"value": 149970.0,
"min": 29952.0,
"max": 149970.0,
"count": 5
},
"Pyramids.Step.sum": {
"value": 149970.0,
"min": 29952.0,
"max": 149970.0,
"count": 5
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.11928949505090714,
"min": -0.11928949505090714,
"max": 0.007646649144589901,
"count": 5
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": -28.748767852783203,
"min": -28.748767852783203,
"max": 1.812255859375,
"count": 5
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.08848647773265839,
"min": 0.08848647773265839,
"max": 0.4663185477256775,
"count": 5
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 21.325241088867188,
"min": 21.325241088867188,
"max": 110.51749420166016,
"count": 5
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.07245683489965793,
"min": 0.07033540763214483,
"max": 0.07588012771551118,
"count": 5
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.7970251838962372,
"min": 0.5065388291637312,
"max": 0.7970251838962372,
"count": 5
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.0005877865855996381,
"min": 0.0005877865855996381,
"max": 0.009045908642764408,
"count": 5
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.006465652441596019,
"min": 0.00532774068794121,
"max": 0.06332136049935086,
"count": 5
},
"Pyramids.Policy.LearningRate.mean": {
"value": 0.00028655179539182723,
"min": 0.00028655179539182723,
"max": 0.00029838354339596195,
"count": 5
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.0031520697493100996,
"min": 0.0020691136102954665,
"max": 0.0031520697493100996,
"count": 5
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.19551726363636365,
"min": 0.19551726363636365,
"max": 0.19946118095238097,
"count": 5
},
"Pyramids.Policy.Epsilon.sum": {
"value": 2.1506899,
"min": 1.3897045333333333,
"max": 2.1506899,
"count": 5
},
"Pyramids.Policy.Beta.mean": {
"value": 0.009552174637272728,
"min": 0.009552174637272728,
"max": 0.009946171977142856,
"count": 5
},
"Pyramids.Policy.Beta.sum": {
"value": 0.10507392101,
"min": 0.06897148288,
"max": 0.10507392101,
"count": 5
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.0687025710940361,
"min": 0.0687025710940361,
"max": 0.45670634508132935,
"count": 5
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.7557282447814941,
"min": 0.7099942564964294,
"max": 3.19694447517395,
"count": 5
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 996.15625,
"min": 984.40625,
"max": 999.0,
"count": 5
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 31877.0,
"min": 15984.0,
"max": 31968.0,
"count": 5
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": -0.9346125507727265,
"min": -1.0000000521540642,
"max": -0.9228750506881624,
"count": 5
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": -29.90760162472725,
"min": -32.000001668930054,
"max": -16.000000834465027,
"count": 5
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": -0.9346125507727265,
"min": -1.0000000521540642,
"max": -0.9228750506881624,
"count": 5
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": -29.90760162472725,
"min": -32.000001668930054,
"max": -16.000000834465027,
"count": 5
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.7536459516268224,
"min": 0.7536459516268224,
"max": 8.610899567604065,
"count": 5
},
"Pyramids.Policy.RndReward.sum": {
"value": 24.116670452058315,
"min": 24.116670452058315,
"max": 137.77439308166504,
"count": 5
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 5
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 5
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1748528443",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.7.0+cu126",
"numpy_version": "1.23.5",
"end_time_seconds": "1748528788"
},
"total": 344.56960941700004,
"count": 1,
"self": 0.5216151859999627,
"children": {
"run_training.setup": {
"total": 0.021093043000064426,
"count": 1,
"self": 0.021093043000064426
},
"TrainerController.start_learning": {
"total": 344.026901188,
"count": 1,
"self": 0.2570713980030632,
"children": {
"TrainerController._reset_env": {
"total": 2.447821465000061,
"count": 1,
"self": 2.447821465000061
},
"TrainerController.advance": {
"total": 340.9616144319971,
"count": 9783,
"self": 0.28863897802102656,
"children": {
"env_step": {
"total": 228.421792245995,
"count": 9783,
"self": 200.272148808986,
"children": {
"SubprocessEnvManager._take_step": {
"total": 28.000657919996,
"count": 9783,
"self": 0.8493236969950431,
"children": {
"TorchPolicy.evaluate": {
"total": 27.15133422300096,
"count": 9781,
"self": 27.15133422300096
}
}
},
"workers": {
"total": 0.14898551701298857,
"count": 9782,
"self": 0.0,
"children": {
"worker_root": {
"total": 342.82997307999176,
"count": 9782,
"is_parallel": true,
"self": 162.237793356976,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0021176360000936256,
"count": 1,
"is_parallel": true,
"self": 0.0006946779999452701,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014229580001483555,
"count": 8,
"is_parallel": true,
"self": 0.0014229580001483555
}
}
},
"UnityEnvironment.step": {
"total": 0.05272724099995685,
"count": 1,
"is_parallel": true,
"self": 0.0006332640000437095,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0005856350001067767,
"count": 1,
"is_parallel": true,
"self": 0.0005856350001067767
},
"communicator.exchange": {
"total": 0.04968257099994844,
"count": 1,
"is_parallel": true,
"self": 0.04968257099994844
},
"steps_from_proto": {
"total": 0.001825770999857923,
"count": 1,
"is_parallel": true,
"self": 0.0004133489997002471,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001412422000157676,
"count": 8,
"is_parallel": true,
"self": 0.001412422000157676
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 180.59217972301576,
"count": 9781,
"is_parallel": true,
"self": 5.447545174037259,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 4.101706276997675,
"count": 9781,
"is_parallel": true,
"self": 4.101706276997675
},
"communicator.exchange": {
"total": 154.1020959519915,
"count": 9781,
"is_parallel": true,
"self": 154.1020959519915
},
"steps_from_proto": {
"total": 16.94083231998934,
"count": 9781,
"is_parallel": true,
"self": 3.5175229909548307,
"children": {
"_process_rank_one_or_two_observation": {
"total": 13.42330932903451,
"count": 78248,
"is_parallel": true,
"self": 13.42330932903451
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 112.25118320798106,
"count": 9782,
"self": 0.3296399020075569,
"children": {
"process_trajectory": {
"total": 21.554079229972558,
"count": 9782,
"self": 21.554079229972558
},
"_update_policy": {
"total": 90.36746407600094,
"count": 43,
"self": 50.6577351279966,
"children": {
"TorchPPOOptimizer.update": {
"total": 39.70972894800434,
"count": 3597,
"self": 39.70972894800434
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.2549999155453406e-06,
"count": 1,
"self": 1.2549999155453406e-06
},
"TrainerController._save_models": {
"total": 0.36039263799989385,
"count": 1,
"self": 0.0037798139999267732,
"children": {
"RLTrainer._checkpoint": {
"total": 0.3566128239999671,
"count": 1,
"self": 0.3566128239999671
}
}
}
}
}
}
}