First Push

0779ac3 verified almost 2 years ago

18.6 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.39161038398742676,
	"min": 0.3892679512500763,
	"max": 1.4873254299163818,
	"count": 40
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 9837.2529296875,
	"min": 9660.0732421875,
	"max": 39027.41796875,
	"count": 40
	},
	"Pyramids.Step.mean": {
	"value": 999947.0,
	"min": 24960.0,
	"max": 999947.0,
	"count": 40
	},
	"Pyramids.Step.sum": {
	"value": 999947.0,
	"min": 24960.0,
	"max": 999947.0,
	"count": 40
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.5577706098556519,
	"min": -0.10050802677869797,
	"max": 0.6519138216972351,
	"count": 40
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 128.28724670410156,
	"min": -20.302621841430664,
	"max": 154.50357055664062,
	"count": 40
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.012868339195847511,
	"min": 0.005618416238576174,
	"max": 0.4353194832801819,
	"count": 40
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 2.9597179889678955,
	"min": 1.18548583984375,
	"max": 86.1932601928711,
	"count": 40
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07048654987496168,
	"min": 0.06373778805896614,
	"max": 0.07526202773604179,
	"count": 40
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.8458385984995402,
	"min": 0.3981097612286458,
	"max": 0.9031443328325015,
	"count": 40
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.015799540449532086,
	"min": 0.0018626144759534152,
	"max": 0.015799540449532086,
	"count": 40
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.18959448539438503,
	"min": 0.013386984317590738,
	"max": 0.18959448539438503,
	"count": 40
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 3.6753987749000005e-06,
	"min": 3.6753987749000005e-06,
	"max": 0.0002957568014144,
	"count": 40
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 4.4104785298800004e-05,
	"min": 4.4104785298800004e-05,
	"max": 0.0029269388243538,
	"count": 40
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.1012251,
	"min": 0.1012251,
	"max": 0.1985856,
	"count": 40
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.2147012,
	"min": 1.1771136000000002,
	"max": 2.1756462,
	"count": 40
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00013238749,
	"min": 0.00013238749,
	"max": 0.00985870144,
	"count": 40
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.00158864988,
	"min": 0.00158864988,
	"max": 0.09758705538,
	"count": 40
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.008755751885473728,
	"min": 0.008497790433466434,
	"max": 0.5597033500671387,
	"count": 40
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.10506902635097504,
	"min": 0.09569065272808075,
	"max": 3.358220100402832,
	"count": 40
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 328.0133333333333,
	"min": 296.6024096385542,
	"max": 999.0,
	"count": 40
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 24601.0,
	"min": 15984.0,
	"max": 31968.0,
	"count": 40
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.5919653083880743,
	"min": -1.0000000521540642,
	"max": 1.6551903460219681,
	"count": 40
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 119.39739812910557,
	"min": -32.000001668930054,
	"max": 137.38079871982336,
	"count": 40
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.5919653083880743,
	"min": -1.0000000521540642,
	"max": 1.6551903460219681,
	"count": 40
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 119.39739812910557,
	"min": -32.000001668930054,
	"max": 137.38079871982336,
	"count": 40
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.029587139872989308,
	"min": 0.027370002108606666,
	"max": 10.958400049246848,
	"count": 40
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.219035490474198,
	"min": 2.0833714419277385,
	"max": 175.33440078794956,
	"count": 40
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 40
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 40
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1716730011",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids3 --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.3.0+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1716732293"
	},
	"total": 2281.9890105399995,
	"count": 1,
	"self": 0.48976659899926744,
	"children": {
	"run_training.setup": {
	"total": 0.05181883299974288,
	"count": 1,
	"self": 0.05181883299974288
	},
	"TrainerController.start_learning": {
	"total": 2281.4474251080005,
	"count": 1,
	"self": 1.397449222970863,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.4167706079997515,
	"count": 1,
	"self": 2.4167706079997515
	},
	"TrainerController.advance": {
	"total": 2277.54545750003,
	"count": 63983,
	"self": 1.414589613111275,
	"children": {
	"env_step": {
	"total": 1637.3200555290337,
	"count": 63983,
	"self": 1504.1230797850653,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 132.3463596849656,
	"count": 63983,
	"self": 4.706007048048832,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 127.64035263691676,
	"count": 62552,
	"self": 127.64035263691676
	}
	}
	},
	"workers": {
	"total": 0.8506160590027321,
	"count": 63983,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2276.1567987270205,
	"count": 63983,
	"is_parallel": true,
	"self": 895.521353034901,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0020543230002658674,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005948570001237385,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001459466000142129,
	"count": 8,
	"is_parallel": true,
	"self": 0.001459466000142129
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04804656100031934,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006337940008052101,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005115260000820854,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005115260000820854
	},
	"communicator.exchange": {
	"total": 0.0452873549998003,
	"count": 1,
	"is_parallel": true,
	"self": 0.0452873549998003
	},
	"steps_from_proto": {
	"total": 0.0016138859996317478,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003391109994481667,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012747750001835811,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012747750001835811
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1380.6354456921194,
	"count": 63982,
	"is_parallel": true,
	"self": 34.525767212177016,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 23.840742276008314,
	"count": 63982,
	"is_parallel": true,
	"self": 23.840742276008314
	},
	"communicator.exchange": {
	"total": 1223.704609926931,
	"count": 63982,
	"is_parallel": true,
	"self": 1223.704609926931
	},
	"steps_from_proto": {
	"total": 98.56432627700315,
	"count": 63982,
	"is_parallel": true,
	"self": 20.079214052069347,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 78.4851122249338,
	"count": 511856,
	"is_parallel": true,
	"self": 78.4851122249338
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 638.810812357885,
	"count": 63983,
	"self": 2.6279607609471896,
	"children": {
	"process_trajectory": {
	"total": 129.42429262893575,
	"count": 63983,
	"self": 129.22864745593552,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.19564517300023,
	"count": 2,
	"self": 0.19564517300023
	}
	}
	},
	"_update_policy": {
	"total": 506.75855896800203,
	"count": 454,
	"self": 297.20957183900373,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 209.5489871289983,
	"count": 22839,
	"self": 209.5489871289983
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.770002750679851e-07,
	"count": 1,
	"self": 8.770002750679851e-07
	},
	"TrainerController._save_models": {
	"total": 0.08774689999972907,
	"count": 1,
	"self": 0.0014895069998601684,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.0862573929998689,
	"count": 1,
	"self": 0.0862573929998689
	}
	}
	}
	}
	}
	}
	}