| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.31941959261894226, | |
| "min": 0.31941959261894226, | |
| "max": 1.5913751125335693, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 9597.919921875, | |
| "min": 9597.919921875, | |
| "max": 48275.95703125, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 2999873.0, | |
| "min": 29952.0, | |
| "max": 2999873.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 2999873.0, | |
| "min": 29952.0, | |
| "max": 2999873.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.746780514717102, | |
| "min": -0.1449412703514099, | |
| "max": 0.8288553953170776, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 203.87107849121094, | |
| "min": -34.93084716796875, | |
| "max": 233.7372283935547, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.9310639500617981, | |
| "min": 0.9151319265365601, | |
| "max": 26.376020431518555, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 254.1804656982422, | |
| "min": 252.17361450195312, | |
| "max": 6356.62109375, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.03764318283388598, | |
| "min": 0.030007568025030195, | |
| "max": 0.04330179998274344, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.11292954850165793, | |
| "min": 0.06378415991396955, | |
| "max": 0.12503808459588506, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.015089578854127062, | |
| "min": 0.011777677055862216, | |
| "max": 50.34082246057078, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.04526873656238119, | |
| "min": 0.025758922534684342, | |
| "max": 100.68164492114155, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 4.844772934000003e-07, | |
| "min": 4.844772934000003e-07, | |
| "max": 9.939200060800002e-05, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 1.4534318802000007e-06, | |
| "min": 1.4534318802000007e-06, | |
| "max": 0.00029531847134820003, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10048437777777779, | |
| "min": 0.10048437777777779, | |
| "max": 0.19939199999999999, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 0.30145313333333335, | |
| "min": 0.21301233333333333, | |
| "max": 0.5953184666666668, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 5.8389340000000017e-05, | |
| "min": 5.8389340000000017e-05, | |
| "max": 0.009939260800000002, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.00017516802000000004, | |
| "min": 0.00017516802000000004, | |
| "max": 0.029532314820000002, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.10602808743715286, | |
| "min": 0.10435324162244797, | |
| "max": 5.4608564376831055, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.3180842697620392, | |
| "min": 0.20994243025779724, | |
| "max": 10.921712875366211, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 364.8, | |
| "min": 340.8255813953488, | |
| "max": 999.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 27360.0, | |
| "min": 15984.0, | |
| "max": 33116.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.5551786492268245, | |
| "min": -1.0000000521540642, | |
| "max": 1.626434069465507, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 116.63839869201183, | |
| "min": -31.99600164592266, | |
| "max": 147.78939798474312, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.5551786492268245, | |
| "min": -1.0000000521540642, | |
| "max": 1.626434069465507, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 116.63839869201183, | |
| "min": -31.99600164592266, | |
| "max": 147.78939798474312, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 3.9185459551836055, | |
| "min": 3.687487304524478, | |
| "max": 917.0562484264374, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 293.8909466387704, | |
| "min": 292.1203705649823, | |
| "max": 14672.899974822998, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1756817588", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/home/hungchan/miniconda3/envs/rl_31012/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training Run 2 --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.8.0+cu128", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1756821270" | |
| }, | |
| "total": 3682.686553206, | |
| "count": 1, | |
| "self": 0.3711183870000241, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.015643329999875277, | |
| "count": 1, | |
| "self": 0.015643329999875277 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 3682.299791489, | |
| "count": 1, | |
| "self": 4.471573963244737, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 1.4596728899996378, | |
| "count": 1, | |
| "self": 1.4596728899996378 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 3676.2634758217555, | |
| "count": 191819, | |
| "self": 4.349057315184837, | |
| "children": { | |
| "env_step": { | |
| "total": 2625.6239074529876, | |
| "count": 191819, | |
| "self": 2112.8629158190943, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 509.92004004172304, | |
| "count": 191819, | |
| "self": 12.48315074475795, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 497.4368892969651, | |
| "count": 187562, | |
| "self": 497.4368892969651 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 2.8409515921703132, | |
| "count": 191819, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 3676.8532693950747, | |
| "count": 191819, | |
| "is_parallel": true, | |
| "self": 1823.0812916923696, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0010134390013263328, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00029463299870258197, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0007188060026237508, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0007188060026237508 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.022171808001075988, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0002565689992479747, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.00017987100000027567, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00017987100000027567 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.02116701700106205, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.02116701700106205 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0005683510007656878, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00014758399993297644, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.00042076700083271135, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.00042076700083271135 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1853.771977702705, | |
| "count": 191818, | |
| "is_parallel": true, | |
| "self": 49.113975984328135, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 36.795314528650124, | |
| "count": 191818, | |
| "is_parallel": true, | |
| "self": 36.795314528650124 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1633.0751300659904, | |
| "count": 191818, | |
| "is_parallel": true, | |
| "self": 1633.0751300659904 | |
| }, | |
| "steps_from_proto": { | |
| "total": 134.7875571237364, | |
| "count": 191818, | |
| "is_parallel": true, | |
| "self": 30.88800354094201, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 103.8995535827944, | |
| "count": 1534544, | |
| "is_parallel": true, | |
| "self": 103.8995535827944 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 1046.290511053583, | |
| "count": 191819, | |
| "self": 8.3830967354952, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 330.46261656308525, | |
| "count": 191819, | |
| "self": 329.9796428390855, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.48297372399974847, | |
| "count": 6, | |
| "self": 0.48297372399974847 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 707.4447977550026, | |
| "count": 289, | |
| "self": 501.9307063850556, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 205.51409136994698, | |
| "count": 17421, | |
| "self": 205.51409136994698 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 8.53000528877601e-07, | |
| "count": 1, | |
| "self": 8.53000528877601e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.1050679609998042, | |
| "count": 1, | |
| "self": 0.001174913000795641, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.10389304799900856, | |
| "count": 1, | |
| "self": 0.10389304799900856 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |