| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.5923354625701904, | |
| "min": 0.5923354625701904, | |
| "max": 1.453642725944519, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 17770.064453125, | |
| "min": 17759.767578125, | |
| "max": 44097.70703125, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989873.0, | |
| "min": 29965.0, | |
| "max": 989873.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989873.0, | |
| "min": 29965.0, | |
| "max": 989873.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.3344428837299347, | |
| "min": -0.0984574481844902, | |
| "max": 0.34629690647125244, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 88.62736511230469, | |
| "min": -23.72824478149414, | |
| "max": 90.38349151611328, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.05180658772587776, | |
| "min": -0.28089454770088196, | |
| "max": 0.35120537877082825, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 13.728745460510254, | |
| "min": -69.66184997558594, | |
| "max": 90.25978088378906, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06997550553448188, | |
| "min": 0.06425170784352797, | |
| "max": 0.07310933458437593, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9796570774827463, | |
| "min": 0.582261218396315, | |
| "max": 1.041276920989142, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.012712154459829133, | |
| "min": 0.0008688371122270388, | |
| "max": 0.02862670648358312, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.17797016243760785, | |
| "min": 0.010426045346724465, | |
| "max": 0.4007738907701637, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.4385546633714305e-06, | |
| "min": 7.4385546633714305e-06, | |
| "max": 0.0002948529392156875, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00010413976528720003, | |
| "min": 0.00010413976528720003, | |
| "max": 0.0035072252309249997, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10247948571428574, | |
| "min": 0.10247948571428574, | |
| "max": 0.1982843125, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4347128000000002, | |
| "min": 1.4347128000000002, | |
| "max": 2.5690749999999993, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00025770062285714295, | |
| "min": 0.00025770062285714295, | |
| "max": 0.00982860281875, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0036078087200000016, | |
| "min": 0.0036078087200000016, | |
| "max": 0.11693059250000001, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.010181399993598461, | |
| "min": 0.010181399993598461, | |
| "max": 0.3752458989620209, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.1425396054983139, | |
| "min": 0.1425396054983139, | |
| "max": 3.001967191696167, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 484.36507936507934, | |
| "min": 484.36507936507934, | |
| "max": 995.125, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 30515.0, | |
| "min": 16380.0, | |
| "max": 32314.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.2616031470279845, | |
| "min": -0.9335688014980406, | |
| "max": 1.2966101457506924, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 79.48099826276302, | |
| "min": -30.3302016928792, | |
| "max": 79.48099826276302, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.2616031470279845, | |
| "min": -0.9335688014980406, | |
| "max": 1.2966101457506924, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 79.48099826276302, | |
| "min": -30.3302016928792, | |
| "max": 79.48099826276302, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.05217204827400449, | |
| "min": 0.05217204827400449, | |
| "max": 7.4629862904548645, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 3.286839041262283, | |
| "min": 3.1645436639664695, | |
| "max": 126.8707669377327, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1693278128", | |
| "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "0.31.0.dev0", | |
| "mlagents_envs_version": "0.31.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "1.11.0+cu102", | |
| "numpy_version": "1.21.2", | |
| "end_time_seconds": "1693280301" | |
| }, | |
| "total": 2172.348605834, | |
| "count": 1, | |
| "self": 0.9464471530000083, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.03929160200004844, | |
| "count": 1, | |
| "self": 0.03929160200004844 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2171.362867079, | |
| "count": 1, | |
| "self": 1.3687063490865512, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 4.165315903000192, | |
| "count": 1, | |
| "self": 4.165315903000192 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2165.675295324913, | |
| "count": 63476, | |
| "self": 1.465319106950119, | |
| "children": { | |
| "env_step": { | |
| "total": 1491.1658271249685, | |
| "count": 63476, | |
| "self": 1380.6189804020503, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 109.6901809039673, | |
| "count": 63476, | |
| "self": 4.712852147020385, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 104.97732875694692, | |
| "count": 62563, | |
| "self": 104.97732875694692 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.8566658189508871, | |
| "count": 63476, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2166.253374350974, | |
| "count": 63476, | |
| "is_parallel": true, | |
| "self": 899.4275699979933, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0018353539999225177, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00057408999987274, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012612640000497777, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012612640000497777 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.04719254699989506, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005619129999558936, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.00044521199993141636, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00044521199993141636 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.04432291600005556, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.04432291600005556 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.001862505999952191, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00036607999936677516, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0014964260005854157, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0014964260005854157 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1266.8258043529806, | |
| "count": 63475, | |
| "is_parallel": true, | |
| "self": 33.885897840031475, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 22.451233962985725, | |
| "count": 63475, | |
| "is_parallel": true, | |
| "self": 22.451233962985725 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1105.4327092980307, | |
| "count": 63475, | |
| "is_parallel": true, | |
| "self": 1105.4327092980307 | |
| }, | |
| "steps_from_proto": { | |
| "total": 105.05596325193278, | |
| "count": 63475, | |
| "is_parallel": true, | |
| "self": 20.5368303991188, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 84.51913285281398, | |
| "count": 507800, | |
| "is_parallel": true, | |
| "self": 84.51913285281398 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 673.0441490929943, | |
| "count": 63476, | |
| "self": 2.6526126299525004, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 111.22933297604277, | |
| "count": 63476, | |
| "self": 110.97428075304333, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.2550522229994385, | |
| "count": 2, | |
| "self": 0.2550522229994385 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 559.162203486999, | |
| "count": 453, | |
| "self": 364.15018279099013, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 195.0120206960089, | |
| "count": 22779, | |
| "self": 195.0120206960089 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.4360002751345746e-06, | |
| "count": 1, | |
| "self": 1.4360002751345746e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.15354806599998483, | |
| "count": 1, | |
| "self": 0.001977783999791427, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.1515702820001934, | |
| "count": 1, | |
| "self": 0.1515702820001934 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |