secondPush

27aaa56 verified almost 2 years ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.6050494909286499,
	"min": 0.6050494909286499,
	"max": 0.8366415500640869,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 18093.400390625,
	"min": 12879.2548828125,
	"max": 25483.14453125,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 1979883.0,
	"min": 1019966.0,
	"max": 1979883.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 1979883.0,
	"min": 1019966.0,
	"max": 1979883.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.62385094165802,
	"min": 0.21211732923984528,
	"max": 0.6899233460426331,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 177.79751586914062,
	"min": 34.999359130859375,
	"max": 194.5907745361328,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.018732663244009018,
	"min": -0.016395842656493187,
	"max": 0.02733149379491806,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 5.338809013366699,
	"min": -2.7053141593933105,
	"max": 7.570823669433594,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 274.0571428571429,
	"min": 260.8256880733945,
	"max": 702.4090909090909,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 28776.0,
	"min": 15453.0,
	"max": 31444.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.6687866522442727,
	"min": 0.7518635967915709,
	"max": 1.716990372739159,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 175.22259848564863,
	"min": 16.54099912941456,
	"max": 185.8733986467123,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.6687866522442727,
	"min": 0.7518635967915709,
	"max": 1.716990372739159,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 175.22259848564863,
	"min": 16.54099912941456,
	"max": 185.8733986467123,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.02576101848667133,
	"min": 0.023524496236008618,
	"max": 0.08017137258800423,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.7049069411004893,
	"min": 1.7637701969360933,
	"max": 3.418516769306734,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06855222881477814,
	"min": 0.06581879631201712,
	"max": 0.07266657747234041,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.959731203406894,
	"min": 0.6165068184463801,
	"max": 1.0516260387569978,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.014468770938817346,
	"min": 0.007192014726918317,
	"max": 0.015923273303390793,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.20256279314344283,
	"min": 0.06472813254226485,
	"max": 0.23874681045708715,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 5.1469839986571415e-06,
	"min": 5.1469839986571415e-06,
	"max": 0.00014839503386833888,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 7.205777598119998e-05,
	"min": 7.205777598119998e-05,
	"max": 0.0020257139747622502,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10171562857142857,
	"min": 0.10171562857142857,
	"max": 0.14946499444444444,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4240188,
	"min": 1.34518495,
	"max": 2.1564492000000004,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0008676427228571425,
	"min": 0.0008676427228571425,
	"max": 0.02473755072277778,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.012146998119999995,
	"min": 0.012146998119999995,
	"max": 0.33769135122499994,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.008959934115409851,
	"min": 0.00835987739264965,
	"max": 0.01113196648657322,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.12543907761573792,
	"min": 0.0981353372335434,
	"max": 0.15584753453731537,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1715156388",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1715158946"
	},
	"total": 2558.318411821,
	"count": 1,
	"self": 0.4771156560000236,
	"children": {
	"run_training.setup": {
	"total": 0.051621190999867395,
	"count": 1,
	"self": 0.051621190999867395
	},
	"TrainerController.start_learning": {
	"total": 2557.7896749740003,
	"count": 1,
	"self": 1.5009321149082098,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.1861396180001975,
	"count": 1,
	"self": 2.1861396180001975
	},
	"TrainerController.advance": {
	"total": 2554.007595873092,
	"count": 64646,
	"self": 1.5691814611809605,
	"children": {
	"env_step": {
	"total": 1868.7834362149733,
	"count": 64646,
	"self": 1727.1443113118885,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 140.72589767201407,
	"count": 64646,
	"self": 5.442068254879814,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 135.28382941713426,
	"count": 62549,
	"self": 135.28382941713426
	}
	}
	},
	"workers": {
	"total": 0.9132272310707776,
	"count": 64646,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2551.910830787956,
	"count": 64646,
	"is_parallel": true,
	"self": 963.0787922048903,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002196669999648293,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006604640002478845,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0015362059994004085,
	"count": 8,
	"is_parallel": true,
	"self": 0.0015362059994004085
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.05332669800009171,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007138900009522331,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.000479559999803314,
	"count": 1,
	"is_parallel": true,
	"self": 0.000479559999803314
	},
	"communicator.exchange": {
	"total": 0.05028351399960229,
	"count": 1,
	"is_parallel": true,
	"self": 0.05028351399960229
	},
	"steps_from_proto": {
	"total": 0.0018497339997338713,
	"count": 1,
	"is_parallel": true,
	"self": 0.00036156599890091456,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014881680008329567,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014881680008329567
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1588.8320385830657,
	"count": 64645,
	"is_parallel": true,
	"self": 36.778021791972606,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 26.658363137064953,
	"count": 64645,
	"is_parallel": true,
	"self": 26.658363137064953
	},
	"communicator.exchange": {
	"total": 1413.5190357680112,
	"count": 64645,
	"is_parallel": true,
	"self": 1413.5190357680112
	},
	"steps_from_proto": {
	"total": 111.8766178860169,
	"count": 64645,
	"is_parallel": true,
	"self": 23.183875133140646,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 88.69274275287626,
	"count": 517160,
	"is_parallel": true,
	"self": 88.69274275287626
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 683.6549781969379,
	"count": 64646,
	"self": 2.9432743299876165,
	"children": {
	"process_trajectory": {
	"total": 145.74747356994885,
	"count": 64646,
	"self": 145.46585365194915,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.28161991799970565,
	"count": 2,
	"self": 0.28161991799970565
	}
	}
	},
	"_update_policy": {
	"total": 534.9642302970014,
	"count": 473,
	"self": 317.0337109129723,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 217.93051938402914,
	"count": 22764,
	"self": 217.93051938402914
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0049998309114017e-06,
	"count": 1,
	"self": 1.0049998309114017e-06
	},
	"TrainerController._save_models": {
	"total": 0.09500636299981124,
	"count": 1,
	"self": 0.002084752999508055,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.09292161000030319,
	"count": 1,
	"self": 0.09292161000030319
	}
	}
	}
	}
	}
	}
	}