First Push

4297701 verified over 1 year ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.42765557765960693,
	"min": 0.42765557765960693,
	"max": 1.444102168083191,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 12870.72265625,
	"min": 12870.72265625,
	"max": 43808.28515625,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989926.0,
	"min": 29898.0,
	"max": 989926.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989926.0,
	"min": 29898.0,
	"max": 989926.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.4740413427352905,
	"min": -0.09874321520328522,
	"max": 0.4740413427352905,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 129.8873291015625,
	"min": -23.895858764648438,
	"max": 129.8873291015625,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.03468049690127373,
	"min": -0.01794944517314434,
	"max": 0.389791876077652,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 9.502455711364746,
	"min": -4.415563583374023,
	"max": 92.38067626953125,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06914377205109869,
	"min": 0.06457618965941948,
	"max": 0.07314545342860987,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9680128087153815,
	"min": 0.512018174000269,
	"max": 1.0247384742496983,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.014910683606839963,
	"min": 0.0007184465922459686,
	"max": 0.015259525284214884,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.20874957049575948,
	"min": 0.008621359106951623,
	"max": 0.22723277202692094,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.553368910814282e-06,
	"min": 7.553368910814282e-06,
	"max": 0.0002952352301596857,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010574716475139994,
	"min": 0.00010574716475139994,
	"max": 0.0035086301304566993,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10251775714285714,
	"min": 0.10251775714285714,
	"max": 0.19841174285714283,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4352486,
	"min": 1.3888821999999998,
	"max": 2.5695433000000003,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002615239385714284,
	"min": 0.0002615239385714284,
	"max": 0.00984133311142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0036613351399999976,
	"min": 0.0036613351399999976,
	"max": 0.11697737567,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.014955240301787853,
	"min": 0.014570656232535839,
	"max": 0.5851942300796509,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.2093733698129654,
	"min": 0.2039891928434372,
	"max": 4.096359729766846,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 382.60714285714283,
	"min": 373.3766233766234,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 32139.0,
	"min": 16697.0,
	"max": 32660.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.4744904537108683,
	"min": -0.9999500517733395,
	"max": 1.5850891702481218,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 123.85719811171293,
	"min": -31.998401656746864,
	"max": 123.85719811171293,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.4744904537108683,
	"min": -0.9999500517733395,
	"max": 1.5850891702481218,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 123.85719811171293,
	"min": -31.998401656746864,
	"max": 123.85719811171293,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.05839386045610289,
	"min": 0.05798116527395043,
	"max": 12.005578686209287,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 4.905084278312643,
	"min": 4.354132979293354,
	"max": 204.09483766555786,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1716768730",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.3.0+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1716770929"
	},
	"total": 2199.116553324,
	"count": 1,
	"self": 0.49149433599995973,
	"children": {
	"run_training.setup": {
	"total": 0.05905033400000548,
	"count": 1,
	"self": 0.05905033400000548
	},
	"TrainerController.start_learning": {
	"total": 2198.566008654,
	"count": 1,
	"self": 1.3728440019467598,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.583390558000019,
	"count": 1,
	"self": 3.583390558000019
	},
	"TrainerController.advance": {
	"total": 2193.5278139230536,
	"count": 63712,
	"self": 1.4751476040505622,
	"children": {
	"env_step": {
	"total": 1557.6710027870138,
	"count": 63712,
	"self": 1421.2972544070678,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 135.52909868896427,
	"count": 63712,
	"self": 4.8602303339473,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 130.66886835501697,
	"count": 62565,
	"self": 130.66886835501697
	}
	}
	},
	"workers": {
	"total": 0.8446496909817256,
	"count": 63712,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2193.1606817069996,
	"count": 63712,
	"is_parallel": true,
	"self": 896.3308822899546,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.005354943999975603,
	"count": 1,
	"is_parallel": true,
	"self": 0.0037183160000040516,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0016366279999715516,
	"count": 8,
	"is_parallel": true,
	"self": 0.0016366279999715516
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.05331802399996377,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006684659999223186,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005170709999902101,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005170709999902101
	},
	"communicator.exchange": {
	"total": 0.05034187100000054,
	"count": 1,
	"is_parallel": true,
	"self": 0.05034187100000054
	},
	"steps_from_proto": {
	"total": 0.0017906160000507043,
	"count": 1,
	"is_parallel": true,
	"self": 0.00037910000003194,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014115160000187643,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014115160000187643
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1296.829799417045,
	"count": 63711,
	"is_parallel": true,
	"self": 34.23944966314116,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 25.054391963900343,
	"count": 63711,
	"is_parallel": true,
	"self": 25.054391963900343
	},
	"communicator.exchange": {
	"total": 1135.802539698001,
	"count": 63711,
	"is_parallel": true,
	"self": 1135.802539698001
	},
	"steps_from_proto": {
	"total": 101.73341809200258,
	"count": 63711,
	"is_parallel": true,
	"self": 20.781884699940463,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 80.95153339206212,
	"count": 509688,
	"is_parallel": true,
	"self": 80.95153339206212
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 634.3816635319895,
	"count": 63712,
	"self": 2.5688455659959573,
	"children": {
	"process_trajectory": {
	"total": 133.11561347099212,
	"count": 63712,
	"self": 132.8561739279918,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.259439543000326,
	"count": 2,
	"self": 0.259439543000326
	}
	}
	},
	"_update_policy": {
	"total": 498.6972044950014,
	"count": 451,
	"self": 294.2666973749966,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 204.4305071200048,
	"count": 22785,
	"self": 204.4305071200048
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.2280002010811586e-06,
	"count": 1,
	"self": 1.2280002010811586e-06
	},
	"TrainerController._save_models": {
	"total": 0.08195894299979045,
	"count": 1,
	"self": 0.0014768779997211823,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08048206500006927,
	"count": 1,
	"self": 0.08048206500006927
	}
	}
	}
	}
	}
	}
	}