| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.3846076428890228, | |
| "min": 0.3833308815956116, | |
| "max": 1.5098246335983276, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 11655.150390625, | |
| "min": 11422.2412109375, | |
| "max": 45802.0390625, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989886.0, | |
| "min": 29952.0, | |
| "max": 989886.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989886.0, | |
| "min": 29952.0, | |
| "max": 989886.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.5818838477134705, | |
| "min": -0.10555002838373184, | |
| "max": 0.5818838477134705, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 163.50936889648438, | |
| "min": -25.332006454467773, | |
| "max": 163.50936889648438, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.024695392698049545, | |
| "min": 0.009741031564772129, | |
| "max": 0.2150718718767166, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 6.93940544128418, | |
| "min": 2.5229272842407227, | |
| "max": 51.83232116699219, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06807303992098429, | |
| "min": 0.06524180654317, | |
| "max": 0.07394013747608384, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9530225588937801, | |
| "min": 0.49190884980827376, | |
| "max": 1.0545428169619604, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.015759560995241523, | |
| "min": 0.0008012288526890431, | |
| "max": 0.015759560995241523, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.22063385393338134, | |
| "min": 0.007498496669599157, | |
| "max": 0.22273432953321998, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.417811813142858e-06, | |
| "min": 7.417811813142858e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00010384936538400001, | |
| "min": 0.00010384936538400001, | |
| "max": 0.0032551202149599997, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10247257142857145, | |
| "min": 0.10247257142857145, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4346160000000003, | |
| "min": 1.3886848, | |
| "max": 2.4442957, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00025700988571428576, | |
| "min": 0.00025700988571428576, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0035981384000000004, | |
| "min": 0.0035981384000000004, | |
| "max": 0.10852549599999997, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.013441706076264381, | |
| "min": 0.013441706076264381, | |
| "max": 0.38476258516311646, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.18818388879299164, | |
| "min": 0.18818388879299164, | |
| "max": 2.69333815574646, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 331.56382978723406, | |
| "min": 331.56382978723406, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 31167.0, | |
| "min": 15984.0, | |
| "max": 33016.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.6292905081259577, | |
| "min": -1.0000000521540642, | |
| "max": 1.6372344543536503, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 154.78259827196598, | |
| "min": -30.049201622605324, | |
| "max": 154.78259827196598, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.6292905081259577, | |
| "min": -1.0000000521540642, | |
| "max": 1.6372344543536503, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 154.78259827196598, | |
| "min": -30.049201622605324, | |
| "max": 154.78259827196598, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.045566108817154984, | |
| "min": 0.045566108817154984, | |
| "max": 8.569565658457577, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 4.328780337629723, | |
| "min": 4.185864482540637, | |
| "max": 137.11305053532124, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1756033779", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.8.0+cu128", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1756035970" | |
| }, | |
| "total": 2190.6587630259996, | |
| "count": 1, | |
| "self": 0.4754521499994553, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.02901185800010353, | |
| "count": 1, | |
| "self": 0.02901185800010353 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2190.154299018, | |
| "count": 1, | |
| "self": 1.334541701975013, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.6416640039999493, | |
| "count": 1, | |
| "self": 2.6416640039999493 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2186.102888007025, | |
| "count": 63772, | |
| "self": 1.3463753530977556, | |
| "children": { | |
| "env_step": { | |
| "total": 1542.0807603559792, | |
| "count": 63772, | |
| "self": 1397.695528086949, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 143.57964742903664, | |
| "count": 63772, | |
| "self": 4.487461024081767, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 139.09218640495487, | |
| "count": 62565, | |
| "self": 139.09218640495487 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.8055848399935712, | |
| "count": 63772, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2185.5679823199816, | |
| "count": 63772, | |
| "is_parallel": true, | |
| "self": 898.4433286818878, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0023612289999164204, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0007332099996801844, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.001628019000236236, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.001628019000236236 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.04882033499984573, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005025779994412005, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004909250001219334, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004909250001219334 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.046210541000164085, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.046210541000164085 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0016162910001185082, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00032748000012361445, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012888109999948938, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012888109999948938 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1287.1246536380938, | |
| "count": 63771, | |
| "is_parallel": true, | |
| "self": 31.25416772613744, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 22.63729023499286, | |
| "count": 63771, | |
| "is_parallel": true, | |
| "self": 22.63729023499286 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1137.4952609380114, | |
| "count": 63771, | |
| "is_parallel": true, | |
| "self": 1137.4952609380114 | |
| }, | |
| "steps_from_proto": { | |
| "total": 95.73793473895216, | |
| "count": 63771, | |
| "is_parallel": true, | |
| "self": 19.03209970907278, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 76.70583502987938, | |
| "count": 510168, | |
| "is_parallel": true, | |
| "self": 76.70583502987938 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 642.6757522979478, | |
| "count": 63772, | |
| "self": 2.6000749130355416, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 122.3217346359138, | |
| "count": 63772, | |
| "self": 122.13009232691365, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.19164230900014445, | |
| "count": 2, | |
| "self": 0.19164230900014445 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 517.7539427489985, | |
| "count": 447, | |
| "self": 289.45424722399116, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 228.29969552500734, | |
| "count": 22857, | |
| "self": 228.29969552500734 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 7.990001904545352e-07, | |
| "count": 1, | |
| "self": 7.990001904545352e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.07520450599986361, | |
| "count": 1, | |
| "self": 0.0013040220001130365, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.07390048399975058, | |
| "count": 1, | |
| "self": 0.07390048399975058 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |