| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.2992294430732727, | |
| "min": 0.2992294430732727, | |
| "max": 1.492452621459961, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 9048.6982421875, | |
| "min": 9048.6982421875, | |
| "max": 45275.04296875, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989926.0, | |
| "min": 29957.0, | |
| "max": 989926.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989926.0, | |
| "min": 29957.0, | |
| "max": 989926.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.587913990020752, | |
| "min": -0.09508303552865982, | |
| "max": 0.6669148206710815, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 162.26426696777344, | |
| "min": -22.91501235961914, | |
| "max": 194.07220458984375, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.011886782944202423, | |
| "min": -0.031833529472351074, | |
| "max": 0.20138977468013763, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 3.280752182006836, | |
| "min": -7.576379776000977, | |
| "max": 48.736324310302734, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.0704758680319459, | |
| "min": 0.06429999697040727, | |
| "max": 0.07241002595678549, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9866621524472425, | |
| "min": 0.5020450306949259, | |
| "max": 1.0506646613745638, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.014914674551175816, | |
| "min": 0.0001606622993645703, | |
| "max": 0.015761754097286067, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.20880544371646143, | |
| "min": 0.0022492721911039843, | |
| "max": 0.2339067940566547, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.690511722242855e-06, | |
| "min": 7.690511722242855e-06, | |
| "max": 0.00029523818730155715, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00010766716411139996, | |
| "min": 0.00010766716411139996, | |
| "max": 0.0036084981971673, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10256347142857143, | |
| "min": 0.10256347142857143, | |
| "max": 0.19841272857142855, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4358886, | |
| "min": 1.3888890999999999, | |
| "max": 2.5695068, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00026609079571428566, | |
| "min": 0.00026609079571428566, | |
| "max": 0.009841431584285715, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0037252711399999995, | |
| "min": 0.0037252711399999995, | |
| "max": 0.12029298673, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.01237169187515974, | |
| "min": 0.01237169187515974, | |
| "max": 0.3624524772167206, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.17320369184017181, | |
| "min": 0.17320369184017181, | |
| "max": 2.5371673107147217, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 328.22727272727275, | |
| "min": 284.6990291262136, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 28884.0, | |
| "min": 16628.0, | |
| "max": 32781.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.649034072306346, | |
| "min": -0.9998375521972775, | |
| "max": 1.7141851693115853, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 145.11499836295843, | |
| "min": -31.99480167031288, | |
| "max": 185.1319982856512, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.649034072306346, | |
| "min": -0.9998375521972775, | |
| "max": 1.7141851693115853, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 145.11499836295843, | |
| "min": -31.99480167031288, | |
| "max": 185.1319982856512, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.04222177033476659, | |
| "min": 0.03835009137839328, | |
| "max": 7.25148319453001, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 3.7155157894594595, | |
| "min": 3.7155157894594595, | |
| "max": 123.27521430701017, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1679200891", | |
| "python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "0.31.0.dev0", | |
| "mlagents_envs_version": "0.31.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "1.11.0+cu102", | |
| "numpy_version": "1.21.2", | |
| "end_time_seconds": "1679203020" | |
| }, | |
| "total": 2129.645745955, | |
| "count": 1, | |
| "self": 0.4741174550008509, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.10579601399967942, | |
| "count": 1, | |
| "self": 0.10579601399967942 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2129.0658324859996, | |
| "count": 1, | |
| "self": 1.506976754923926, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 6.197753757999635, | |
| "count": 1, | |
| "self": 6.197753757999635 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2121.268153165076, | |
| "count": 64017, | |
| "self": 1.602584594106247, | |
| "children": { | |
| "env_step": { | |
| "total": 1503.9630158600344, | |
| "count": 64017, | |
| "self": 1389.157125215048, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 113.89014844903159, | |
| "count": 64017, | |
| "self": 4.751692930037734, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 109.13845551899385, | |
| "count": 62558, | |
| "self": 109.13845551899385 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.9157421959548628, | |
| "count": 64017, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2124.198507129002, | |
| "count": 64017, | |
| "is_parallel": true, | |
| "self": 853.9254579731282, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0019010460000572493, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006330769997475727, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012679690003096766, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012679690003096766 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.08576096200022221, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005926660001023265, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.00040959699981613085, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00040959699981613085 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.08316502000025139, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.08316502000025139 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0015936790000523615, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00036088500019104686, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012327939998613147, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012327939998613147 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1270.2730491558737, | |
| "count": 64016, | |
| "is_parallel": true, | |
| "self": 31.001365252864616, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 22.399567527079853, | |
| "count": 64016, | |
| "is_parallel": true, | |
| "self": 22.399567527079853 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1125.852470723948, | |
| "count": 64016, | |
| "is_parallel": true, | |
| "self": 1125.852470723948 | |
| }, | |
| "steps_from_proto": { | |
| "total": 91.01964565198114, | |
| "count": 64016, | |
| "is_parallel": true, | |
| "self": 19.654464270681274, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 71.36518138129986, | |
| "count": 512128, | |
| "is_parallel": true, | |
| "self": 71.36518138129986 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 615.7025527109354, | |
| "count": 64017, | |
| "self": 2.8630582349819633, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 117.09458153496371, | |
| "count": 64017, | |
| "self": 116.89556704396409, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.1990144909996161, | |
| "count": 2, | |
| "self": 0.1990144909996161 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 495.7449129409897, | |
| "count": 458, | |
| "self": 312.1669926319523, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 183.57792030903738, | |
| "count": 22791, | |
| "self": 183.57792030903738 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.420000424142927e-07, | |
| "count": 1, | |
| "self": 9.420000424142927e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.09294786600003135, | |
| "count": 1, | |
| "self": 0.0014057910002520657, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.09154207499977929, | |
| "count": 1, | |
| "self": 0.09154207499977929 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |