{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.8995862007141113,
"min": 0.8995862007141113,
"max": 1.454206109046936,
"count": 6
},
"Pyramids.Policy.Entropy.sum": {
"value": 26901.2265625,
"min": 26901.2265625,
"max": 44114.796875,
"count": 6
},
"Pyramids.Step.mean": {
"value": 179922.0,
"min": 29882.0,
"max": 179922.0,
"count": 6
},
"Pyramids.Step.sum": {
"value": 179922.0,
"min": 29882.0,
"max": 179922.0,
"count": 6
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.08334647864103317,
"min": -0.09363283962011337,
"max": 0.028996169567108154,
"count": 6
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": -20.086502075195312,
"min": -22.565513610839844,
"max": 6.872092247009277,
"count": 6
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.06044967100024223,
"min": 0.06044967100024223,
"max": 0.319549560546875,
"count": 6
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 14.568370819091797,
"min": 14.568370819091797,
"max": 75.73324584960938,
"count": 6
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06991601909629647,
"min": 0.0669309777444603,
"max": 0.07281179393442894,
"count": 6
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.908908248251854,
"min": 0.5096825575410026,
"max": 0.908908248251854,
"count": 6
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.0012823803997391065,
"min": 0.00018725260363460143,
"max": 0.006188299495180815,
"count": 6
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.016670945196608385,
"min": 0.0024342838472498187,
"max": 0.04331809646626571,
"count": 6
},
"Pyramids.Policy.LearningRate.mean": {
"value": 5.151458282849999e-05,
"min": 5.151458282849999e-05,
"max": 0.00027575315093942855,
"count": 6
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.0006696895767704999,
"min": 0.0006696895767704999,
"max": 0.0025619672460110003,
"count": 6
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.1171715,
"min": 0.1171715,
"max": 0.19191771428571427,
"count": 6
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.5232295,
"min": 1.343424,
"max": 1.9539890000000002,
"count": 6
},
"Pyramids.Policy.Beta.mean": {
"value": 0.0017254328500000003,
"min": 0.0017254328500000003,
"max": 0.009192579657142857,
"count": 6
},
"Pyramids.Policy.Beta.sum": {
"value": 0.022430627050000006,
"min": 0.022430627050000006,
"max": 0.08542350110000001,
"count": 6
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.052695635706186295,
"min": 0.052695635706186295,
"max": 0.39450564980506897,
"count": 6
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.6850432753562927,
"min": 0.6850432753562927,
"max": 2.7615394592285156,
"count": 6
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 958.0,
"min": 958.0,
"max": 999.0,
"count": 6
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 32572.0,
"min": 16809.0,
"max": 32572.0,
"count": 6
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": -0.8363636860793288,
"min": -0.9998875521123409,
"max": -0.7836485349319198,
"count": 6
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": -27.600001640617847,
"min": -31.99640166759491,
"max": -14.825000911951065,
"count": 6
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": -0.8363636860793288,
"min": -0.9998875521123409,
"max": -0.7836485349319198,
"count": 6
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": -27.600001640617847,
"min": -31.99640166759491,
"max": -14.825000911951065,
"count": 6
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.5387352874333208,
"min": 0.5387352874333208,
"max": 7.7710857483394005,
"count": 6
},
"Pyramids.Policy.RndReward.sum": {
"value": 17.778264485299587,
"min": 17.778264485299587,
"max": 132.1084577217698,
"count": 6
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 6
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 6
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1759494890",
"python_version": "3.10.12 | packaged by conda-forge | (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]",
"command_line_arguments": "/root/.local/share/mamba/envs/u10/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=PyramidsRND1 --no-graphics",
"mlagents_version": "1.1.0",
"mlagents_envs_version": "1.1.0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.8.0+cu128",
"numpy_version": "1.23.5",
"end_time_seconds": "1759495475"
},
"total": 585.1926151550001,
"count": 1,
"self": 0.5460800729997572,
"children": {
"run_training.setup": {
"total": 0.04039032899981976,
"count": 1,
"self": 0.04039032899981976
},
"TrainerController.start_learning": {
"total": 584.6061447530005,
"count": 1,
"self": 0.4329372680385859,
"children": {
"TrainerController._reset_env": {
"total": 3.2851930990000255,
"count": 1,
"self": 3.2851930990000255
},
"TrainerController.advance": {
"total": 580.5869333149617,
"count": 12606,
"self": 0.4788515179084243,
"children": {
"env_step": {
"total": 379.204233546036,
"count": 12606,
"self": 347.5815240700663,
"children": {
"SubprocessEnvManager._take_step": {
"total": 31.359648098981324,
"count": 12606,
"self": 1.3449598949473511,
"children": {
"TorchPolicy.evaluate": {
"total": 30.014688204033973,
"count": 12569,
"self": 30.014688204033973
}
}
},
"workers": {
"total": 0.2630613769883894,
"count": 12606,
"self": 0.0,
"children": {
"worker_root": {
"total": 583.1013726920082,
"count": 12606,
"is_parallel": true,
"self": 269.2788808590044,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.004011348999938491,
"count": 1,
"is_parallel": true,
"self": 0.001448401000288868,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.002562947999649623,
"count": 8,
"is_parallel": true,
"self": 0.002562947999649623
}
}
},
"UnityEnvironment.step": {
"total": 0.13084931000003053,
"count": 1,
"is_parallel": true,
"self": 0.0006335590001071978,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0011069160000261036,
"count": 1,
"is_parallel": true,
"self": 0.0011069160000261036
},
"communicator.exchange": {
"total": 0.1226994690000538,
"count": 1,
"is_parallel": true,
"self": 0.1226994690000538
},
"steps_from_proto": {
"total": 0.0064093659998434305,
"count": 1,
"is_parallel": true,
"self": 0.0004196439995212131,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.005989722000322217,
"count": 8,
"is_parallel": true,
"self": 0.005989722000322217
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 313.8224918330038,
"count": 12605,
"is_parallel": true,
"self": 9.168796041906262,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 5.948099299041587,
"count": 12605,
"is_parallel": true,
"self": 5.948099299041587
},
"communicator.exchange": {
"total": 269.25932263704635,
"count": 12605,
"is_parallel": true,
"self": 269.25932263704635
},
"steps_from_proto": {
"total": 29.446273855009622,
"count": 12605,
"is_parallel": true,
"self": 6.432408007217873,
"children": {
"_process_rank_one_or_two_observation": {
"total": 23.01386584779175,
"count": 100840,
"is_parallel": true,
"self": 23.01386584779175
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 200.90384825101728,
"count": 12606,
"self": 0.6625152340188833,
"children": {
"process_trajectory": {
"total": 29.751444521000394,
"count": 12606,
"self": 29.751444521000394
},
"_update_policy": {
"total": 170.489888495998,
"count": 76,
"self": 69.11183417899565,
"children": {
"TorchPPOOptimizer.update": {
"total": 101.37805431700235,
"count": 4563,
"self": 101.37805431700235
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.630002750782296e-07,
"count": 1,
"self": 9.630002750782296e-07
},
"TrainerController._save_models": {
"total": 0.301080107999951,
"count": 1,
"self": 0.005557440000302449,
"children": {
"RLTrainer._checkpoint": {
"total": 0.29552266799964855,
"count": 1,
"self": 0.29552266799964855
}
}
}
}
}
}
}