ppo-PyramidsTraining / run_logs /timers.json

Second Push

a2d60b7 over 2 years ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.16728255152702332,
	"min": 0.15525735914707184,
	"max": 0.21002553403377533,
	"count": 34
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 5053.271484375,
	"min": 1868.0673828125,
	"max": 6280.603515625,
	"count": 34
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 234.51181102362204,
	"min": 212.17948717948718,
	"max": 283.64761904761906,
	"count": 34
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29783.0,
	"min": 8275.0,
	"max": 31880.0,
	"count": 34
	},
	"Pyramids.Step.mean": {
	"value": 2999883.0,
	"min": 2009983.0,
	"max": 2999883.0,
	"count": 34
	},
	"Pyramids.Step.sum": {
	"value": 2999883.0,
	"min": 2009983.0,
	"max": 2999883.0,
	"count": 34
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.7479361891746521,
	"min": 0.6622505784034729,
	"max": 0.8450698852539062,
	"count": 34
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 224.380859375,
	"min": 73.65901184082031,
	"max": 252.65277099609375,
	"count": 34
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.005168822593986988,
	"min": -0.012601537629961967,
	"max": 0.01932157576084137,
	"count": 34
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 1.5506467819213867,
	"min": -3.742656707763672,
	"max": 5.680543422698975,
	"count": 34
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.7497338478959452,
	"min": 1.6608981324566736,
	"max": 1.787820503497735,
	"count": 34
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 222.21619868278503,
	"min": 69.72499963641167,
	"max": 244.80299776792526,
	"count": 34
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.7497338478959452,
	"min": 1.6608981324566736,
	"max": 1.787820503497735,
	"count": 34
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 222.21619868278503,
	"min": 69.72499963641167,
	"max": 244.80299776792526,
	"count": 34
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.01949155884766532,
	"min": 0.019372238134383223,
	"max": 0.028201485868443604,
	"count": 34
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.4754279736534954,
	"min": 0.8830385050969198,
	"max": 3.0416997363208793,
	"count": 34
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07110694913851966,
	"min": 0.06405901443975467,
	"max": 0.07133843297612788,
	"count": 34
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9954972879392753,
	"min": 0.27638910769019276,
	"max": 1.0520664500654675,
	"count": 34
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01526131886429302,
	"min": 0.012369724602710143,
	"max": 0.016298255188782248,
	"count": 34
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.21365846410010228,
	"min": 0.06191515453004589,
	"max": 0.23520687879257218,
	"count": 34
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 1.5590351946404768e-06,
	"min": 1.5590351946404768e-06,
	"max": 9.947719184095832e-05,
	"count": 34
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 2.1826492724966673e-05,
	"min": 2.1826492724966673e-05,
	"max": 0.0014621597126137666,
	"count": 34
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10051964523809527,
	"min": 0.10051964523809527,
	"max": 0.13315904166666664,
	"count": 34
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4072750333333337,
	"min": 0.5326361666666666,
	"max": 1.9873862333333334,
	"count": 34
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 6.191255928571431e-05,
	"min": 6.191255928571431e-05,
	"max": 0.0033225882625,
	"count": 34
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0008667758300000004,
	"min": 0.0008667758300000004,
	"max": 0.048839884709999996,
	"count": 34
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.008113382384181023,
	"min": 0.007795785553753376,
	"max": 0.010242822580039501,
	"count": 34
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.11358735710382462,
	"min": 0.040971290320158005,
	"max": 0.14452455937862396,
	"count": 34
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 34
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 34
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1693050399",
	"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=PyramidsTraining --no-graphics --resume",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1693053095"
	},
	"total": 2695.543802821001,
	"count": 1,
	"self": 1.1324325500017949,
	"children": {
	"run_training.setup": {
	"total": 0.040259501000036835,
	"count": 1,
	"self": 0.040259501000036835
	},
	"TrainerController.start_learning": {
	"total": 2694.371110769999,
	"count": 1,
	"self": 1.6563902417110512,
	"children": {
	"TrainerController._reset_env": {
	"total": 5.44096331899982,
	"count": 1,
	"self": 5.44096331899982
	},
	"TrainerController.advance": {
	"total": 2687.100431038287,
	"count": 65705,
	"self": 1.5864545440545044,
	"children": {
	"env_step": {
	"total": 2001.4026687082624,
	"count": 65705,
	"self": 1886.4337987335402,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 114.04875525803072,
	"count": 65705,
	"self": 4.902434129653557,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 109.14632112837717,
	"count": 62569,
	"self": 109.14632112837717
	}
	}
	},
	"workers": {
	"total": 0.920114716691387,
	"count": 65705,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2687.969531494088,
	"count": 65705,
	"is_parallel": true,
	"self": 926.9245235840926,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0019770689996221336,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006251910008359118,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013518779987862217,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013518779987862217
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.08333673800007091,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005924659999436699,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00046607700005552033,
	"count": 1,
	"is_parallel": true,
	"self": 0.00046607700005552033
	},
	"communicator.exchange": {
	"total": 0.07168196800012083,
	"count": 1,
	"is_parallel": true,
	"self": 0.07168196800012083
	},
	"steps_from_proto": {
	"total": 0.010596226999950886,
	"count": 1,
	"is_parallel": true,
	"self": 0.009075192998352577,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0015210340015983093,
	"count": 8,
	"is_parallel": true,
	"self": 0.0015210340015983093
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1761.0450079099955,
	"count": 65704,
	"is_parallel": true,
	"self": 34.77587164081251,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 23.156331481118286,
	"count": 65704,
	"is_parallel": true,
	"self": 23.156331481118286
	},
	"communicator.exchange": {
	"total": 1592.8627225269947,
	"count": 65704,
	"is_parallel": true,
	"self": 1592.8627225269947
	},
	"steps_from_proto": {
	"total": 110.25008226107002,
	"count": 65704,
	"is_parallel": true,
	"self": 22.365261638236916,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 87.8848206228331,
	"count": 525632,
	"is_parallel": true,
	"self": 87.8848206228331
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 684.11130778597,
	"count": 65705,
	"self": 3.081327651087122,
	"children": {
	"process_trajectory": {
	"total": 120.54025942088992,
	"count": 65705,
	"self": 120.27275603989074,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.26750338099918736,
	"count": 2,
	"self": 0.26750338099918736
	}
	}
	},
	"_update_policy": {
	"total": 560.4897207139929,
	"count": 473,
	"self": 366.8761716950967,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 193.61354901889626,
	"count": 22752,
	"self": 193.61354901889626
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 2.3588001567986794e-05,
	"count": 1,
	"self": 2.3588001567986794e-05
	},
	"TrainerController._save_models": {
	"total": 0.1733025829998951,
	"count": 1,
	"self": 0.0039729189993522596,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.16932966400054283,
	"count": 1,
	"self": 0.16932966400054283
	}
	}
	}
	}
	}
	}
	}