First Push

a6f9269 about 2 years ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.639274537563324,
	"min": 0.5915811061859131,
	"max": 1.4332571029663086,
	"count": 17
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 19188.46484375,
	"min": 17737.96875,
	"max": 43479.2890625,
	"count": 17
	},
	"Pyramids.Step.mean": {
	"value": 509935.0,
	"min": 29952.0,
	"max": 509935.0,
	"count": 17
	},
	"Pyramids.Step.sum": {
	"value": 509935.0,
	"min": 29952.0,
	"max": 509935.0,
	"count": 17
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.11859557032585144,
	"min": -0.10357686877250671,
	"max": 0.12504062056541443,
	"count": 17
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 29.411701202392578,
	"min": -25.065601348876953,
	"max": 29.634628295898438,
	"count": 17
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.016931630671024323,
	"min": 0.016931630671024323,
	"max": 0.5171031951904297,
	"count": 17
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 4.199044227600098,
	"min": 4.199044227600098,
	"max": 122.55345916748047,
	"count": 17
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06818488614515635,
	"min": 0.0657610722773621,
	"max": 0.07274229939553108,
	"count": 17
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9545884060321888,
	"min": 0.4722085593240844,
	"max": 1.043816227892724,
	"count": 17
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.010209054549653932,
	"min": 0.0009644156510168019,
	"max": 0.014433882215921292,
	"count": 17
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.14292676369515506,
	"min": 0.006750909557117614,
	"max": 0.14292676369515506,
	"count": 17
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 8.952576007436974e-06,
	"min": 8.952576007436974e-06,
	"max": 0.0002904914317409524,
	"count": 17
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00012533606410411764,
	"min": 0.00012533606410411764,
	"max": 0.0028422628055203925,
	"count": 17
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10298415966386557,
	"min": 0.10298415966386557,
	"max": 0.1968304761904762,
	"count": 17
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.441778235294118,
	"min": 1.3394384313725491,
	"max": 2.347420784313725,
	"count": 17
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00030811755042016805,
	"min": 0.00030811755042016805,
	"max": 0.009683364571428571,
	"count": 17
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.004313645705882353,
	"min": 0.004313645705882353,
	"max": 0.09478733635294119,
	"count": 17
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.024871045723557472,
	"min": 0.024871045723557472,
	"max": 0.642286479473114,
	"count": 17
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.3481946289539337,
	"min": 0.3481946289539337,
	"max": 4.496005535125732,
	"count": 17
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 764.578947368421,
	"min": 734.275,
	"max": 999.0,
	"count": 17
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29054.0,
	"min": 15984.0,
	"max": 32542.0,
	"count": 17
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 0.4983473263288799,
	"min": -1.0000000521540642,
	"max": 0.4983473263288799,
	"count": 17
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 18.937198400497437,
	"min": -32.000001668930054,
	"max": 18.937198400497437,
	"count": 17
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 0.4983473263288799,
	"min": -1.0000000521540642,
	"max": 0.4983473263288799,
	"count": 17
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 18.937198400497437,
	"min": -32.000001668930054,
	"max": 18.937198400497437,
	"count": 17
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.20070622358042256,
	"min": 0.20070622358042256,
	"max": 13.79836150072515,
	"count": 17
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 7.6268364960560575,
	"min": 7.6268364960560575,
	"max": 220.7737840116024,
	"count": 17
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 17
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 17
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1704188202",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.1.2+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1704189301"
	},
	"total": 1099.137461053,
	"count": 1,
	"self": 0.49136940900007176,
	"children": {
	"run_training.setup": {
	"total": 0.06661161799979709,
	"count": 1,
	"self": 0.06661161799979709
	},
	"TrainerController.start_learning": {
	"total": 1098.579480026,
	"count": 1,
	"self": 0.7164097740055695,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.4781658629999583,
	"count": 1,
	"self": 2.4781658629999583
	},
	"TrainerController.advance": {
	"total": 1095.3017732739945,
	"count": 32245,
	"self": 0.7304094999669815,
	"children": {
	"env_step": {
	"total": 773.0819093490215,
	"count": 32245,
	"self": 702.4890763390185,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 70.13889533697579,
	"count": 32245,
	"self": 2.525001555978861,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 67.61389378099693,
	"count": 31935,
	"self": 67.61389378099693
	}
	}
	},
	"workers": {
	"total": 0.45393767302721244,
	"count": 32245,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 1095.9815441419985,
	"count": 32245,
	"is_parallel": true,
	"self": 457.2725648129915,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0026979579999988346,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007224289997793676,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001975529000219467,
	"count": 8,
	"is_parallel": true,
	"self": 0.001975529000219467
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.06406370099989545,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007856179995542334,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005379640001592634,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005379640001592634
	},
	"communicator.exchange": {
	"total": 0.06111625600010484,
	"count": 1,
	"is_parallel": true,
	"self": 0.06111625600010484
	},
	"steps_from_proto": {
	"total": 0.0016238630000771082,
	"count": 1,
	"is_parallel": true,
	"self": 0.00034962500058099977,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012742379994961084,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012742379994961084
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 638.708979329007,
	"count": 32244,
	"is_parallel": true,
	"self": 18.538913360987635,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 13.679534008974088,
	"count": 32244,
	"is_parallel": true,
	"self": 13.679534008974088
	},
	"communicator.exchange": {
	"total": 552.2876547070209,
	"count": 32244,
	"is_parallel": true,
	"self": 552.2876547070209
	},
	"steps_from_proto": {
	"total": 54.20287725202434,
	"count": 32244,
	"is_parallel": true,
	"self": 10.996816603038269,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 43.20606064898607,
	"count": 257952,
	"is_parallel": true,
	"self": 43.20606064898607
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 321.489454425006,
	"count": 32245,
	"self": 1.3052822480221948,
	"children": {
	"process_trajectory": {
	"total": 65.06064911698195,
	"count": 32245,
	"self": 64.95811968998169,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.10252942700026324,
	"count": 1,
	"self": 0.10252942700026324
	}
	}
	},
	"_update_policy": {
	"total": 255.12352306000184,
	"count": 212,
	"self": 151.62375964099147,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 103.49976341901038,
	"count": 11664,
	"self": 103.49976341901038
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 9.059999683813658e-07,
	"count": 1,
	"self": 9.059999683813658e-07
	},
	"TrainerController._save_models": {
	"total": 0.0831302090000463,
	"count": 1,
	"self": 0.001595688000179507,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.0815345209998668,
	"count": 1,
	"self": 0.0815345209998668
	}
	}
	}
	}
	}
	}
	}