| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.4847096800804138, | |
| "min": 0.46653735637664795, | |
| "max": 1.4601467847824097, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 14502.513671875, | |
| "min": 13966.2626953125, | |
| "max": 44295.01171875, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989964.0, | |
| "min": 29952.0, | |
| "max": 989964.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989964.0, | |
| "min": 29952.0, | |
| "max": 989964.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.1252206414937973, | |
| "min": -0.10299812257289886, | |
| "max": 0.15921834111213684, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 31.43037986755371, | |
| "min": -24.822547912597656, | |
| "max": 40.12302017211914, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.005594240035861731, | |
| "min": -0.00724094407632947, | |
| "max": 0.3427627682685852, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 1.4041543006896973, | |
| "min": -1.8102359771728516, | |
| "max": 81.23477935791016, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.07184295480191293, | |
| "min": 0.06533377064103373, | |
| "max": 0.0738250105108212, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 1.077644322028694, | |
| "min": 0.47667058811177787, | |
| "max": 1.077644322028694, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.00940623532268445, | |
| "min": 0.00012526080969339925, | |
| "max": 0.014668392195239896, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.14109352984026674, | |
| "min": 0.00162839052601419, | |
| "max": 0.14109352984026674, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.43491752172667e-06, | |
| "min": 7.43491752172667e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00011152376282590004, | |
| "min": 0.00011152376282590004, | |
| "max": 0.0031367948544017994, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10247827333333336, | |
| "min": 0.10247827333333336, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.5371741000000003, | |
| "min": 1.3691136000000002, | |
| "max": 2.4435580000000003, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00025757950600000006, | |
| "min": 0.00025757950600000006, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0038636925900000013, | |
| "min": 0.0038636925900000013, | |
| "max": 0.10458526018000001, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.00657698605209589, | |
| "min": 0.00657698605209589, | |
| "max": 0.517527163028717, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.09865479171276093, | |
| "min": 0.0958457887172699, | |
| "max": 3.622690200805664, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 679.2, | |
| "min": 679.2, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 30564.0, | |
| "min": 15984.0, | |
| "max": 32377.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 0.520542184346252, | |
| "min": -1.0000000521540642, | |
| "max": 0.520542184346252, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 23.42439829558134, | |
| "min": -32.000001668930054, | |
| "max": 23.42439829558134, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 0.520542184346252, | |
| "min": -1.0000000521540642, | |
| "max": 0.520542184346252, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 23.42439829558134, | |
| "min": -32.000001668930054, | |
| "max": 23.42439829558134, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.047264640302617206, | |
| "min": 0.047264640302617206, | |
| "max": 11.028586469590664, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 2.1269088136177743, | |
| "min": 2.0501779096666723, | |
| "max": 176.45738351345062, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1742841161", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.6.0+cu124", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1742843624" | |
| }, | |
| "total": 2463.127621471, | |
| "count": 1, | |
| "self": 0.4773878609998974, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.03236518199992133, | |
| "count": 1, | |
| "self": 0.03236518199992133 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2462.6178684280003, | |
| "count": 1, | |
| "self": 1.8110850909538385, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.969214313999828, | |
| "count": 1, | |
| "self": 2.969214313999828 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2457.736359339047, | |
| "count": 63277, | |
| "self": 1.8236922660958044, | |
| "children": { | |
| "env_step": { | |
| "total": 1686.2510285079898, | |
| "count": 63277, | |
| "self": 1493.418697969987, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 191.78908464103188, | |
| "count": 63277, | |
| "self": 5.594146105048367, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 186.1949385359835, | |
| "count": 62571, | |
| "self": 186.1949385359835 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 1.0432458969708023, | |
| "count": 63277, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2456.789050299968, | |
| "count": 63277, | |
| "is_parallel": true, | |
| "self": 1100.9937586339079, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.004023516999950516, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0014513099995383527, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0025722070004121633, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0025722070004121633 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.05513158099984139, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006038229998921452, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005018900001232396, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005018900001232396 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.05207881299998007, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.05207881299998007 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0019470549998459319, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004085319994828751, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0015385230003630568, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0015385230003630568 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1355.7952916660602, | |
| "count": 63276, | |
| "is_parallel": true, | |
| "self": 37.29202799700556, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 27.97431511197101, | |
| "count": 63276, | |
| "is_parallel": true, | |
| "self": 27.97431511197101 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1174.8277466860347, | |
| "count": 63276, | |
| "is_parallel": true, | |
| "self": 1174.8277466860347 | |
| }, | |
| "steps_from_proto": { | |
| "total": 115.70120187104885, | |
| "count": 63276, | |
| "is_parallel": true, | |
| "self": 24.307458746011207, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 91.39374312503764, | |
| "count": 506208, | |
| "is_parallel": true, | |
| "self": 91.39374312503764 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 769.6616385649613, | |
| "count": 63277, | |
| "self": 3.207955299908008, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 146.1378363480544, | |
| "count": 63277, | |
| "self": 145.90893373305425, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.22890261500015185, | |
| "count": 2, | |
| "self": 0.22890261500015185 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 620.3158469169989, | |
| "count": 435, | |
| "self": 340.43439565998506, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 279.88145125701385, | |
| "count": 22782, | |
| "self": 279.88145125701385 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.1269999049545731e-06, | |
| "count": 1, | |
| "self": 1.1269999049545731e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.10120855700006359, | |
| "count": 1, | |
| "self": 0.0017361909999635827, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.09947236600010001, | |
| "count": 1, | |
| "self": 0.09947236600010001 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |