| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.20314745604991913, | |
| "min": 0.20036353170871735, | |
| "max": 1.4018068313598633, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 6113.92578125, | |
| "min": 6046.169921875, | |
| "max": 42525.2109375, | |
| "count": 67 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 2009974.0, | |
| "min": 29883.0, | |
| "max": 2009974.0, | |
| "count": 67 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 2009974.0, | |
| "min": 29883.0, | |
| "max": 2009974.0, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.6510933637619019, | |
| "min": -0.14500658214092255, | |
| "max": 0.6842200756072998, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 182.30613708496094, | |
| "min": -34.94658660888672, | |
| "max": 193.63427734375, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.004276985768228769, | |
| "min": -0.02534239925444126, | |
| "max": 0.2799653708934784, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 1.1975560188293457, | |
| "min": -7.045186996459961, | |
| "max": 67.75161743164062, | |
| "count": 67 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06844937501133061, | |
| "min": 0.06541937366928527, | |
| "max": 0.07249765002953133, | |
| "count": 67 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9582912501586285, | |
| "min": 0.5307614199792834, | |
| "max": 1.0678972979555565, | |
| "count": 67 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.014101383147904873, | |
| "min": 0.00018255593427123036, | |
| "max": 0.018534353781086838, | |
| "count": 67 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.1974193640706682, | |
| "min": 0.002373227145525995, | |
| "max": 0.2594809529352157, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 0.00010050771649745, | |
| "min": 0.00010050771649745, | |
| "max": 0.00029840621303126253, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.0014071080309643, | |
| "min": 0.0014071080309643, | |
| "max": 0.003801528032824033, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.13350255, | |
| "min": 0.13350255, | |
| "max": 0.19946873750000002, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.8690357, | |
| "min": 1.5957499000000002, | |
| "max": 2.7523842333333333, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0033569047450000005, | |
| "min": 0.0033569047450000005, | |
| "max": 0.009946926876250001, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.04699666643000001, | |
| "min": 0.04699666643000001, | |
| "max": 0.12673087907, | |
| "count": 67 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.0056404173374176025, | |
| "min": 0.005199231207370758, | |
| "max": 0.3667435646057129, | |
| "count": 67 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.07896584272384644, | |
| "min": 0.07278923690319061, | |
| "max": 2.933948516845703, | |
| "count": 67 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 337.632183908046, | |
| "min": 290.4901960784314, | |
| "max": 999.0, | |
| "count": 67 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29374.0, | |
| "min": 15915.0, | |
| "max": 32718.0, | |
| "count": 67 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.5484908863224767, | |
| "min": -0.9998375521972775, | |
| "max": 1.6702784138421218, | |
| "count": 67 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 136.26719799637794, | |
| "min": -31.99480167031288, | |
| "max": 170.36839821189642, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.5484908863224767, | |
| "min": -0.9998375521972775, | |
| "max": 1.6702784138421218, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 136.26719799637794, | |
| "min": -31.99480167031288, | |
| "max": 170.36839821189642, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.019873120251759246, | |
| "min": 0.016427226377841594, | |
| "max": 7.391694875434041, | |
| "count": 67 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 1.7488345821548137, | |
| "min": 1.6065027146905777, | |
| "max": 118.26711800694466, | |
| "count": 67 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 67 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 67 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1749148958", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.7.1+cu126", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1749156362" | |
| }, | |
| "total": 7404.639835548, | |
| "count": 1, | |
| "self": 0.8150598689999242, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.03187451899975713, | |
| "count": 1, | |
| "self": 0.03187451899975713 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 7403.79290116, | |
| "count": 1, | |
| "self": 5.332359532886585, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.972464338000009, | |
| "count": 1, | |
| "self": 2.972464338000009 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 7395.355251487114, | |
| "count": 129924, | |
| "self": 5.793066790091871, | |
| "children": { | |
| "env_step": { | |
| "total": 4964.024566039887, | |
| "count": 129924, | |
| "self": 4599.533635196667, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 361.4889427231037, | |
| "count": 129924, | |
| "self": 16.866114986912635, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 344.6228277361911, | |
| "count": 126738, | |
| "self": 344.6228277361911 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 3.0019881201160388, | |
| "count": 129923, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 7386.281457720919, | |
| "count": 129923, | |
| "is_parallel": true, | |
| "self": 3177.5012284157865, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0030046709998714505, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0010919669994109427, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0019127040004605078, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0019127040004605078 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.06582260300001508, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0007003099995017692, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005332650002856099, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005332650002856099 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.06259613800011721, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.06259613800011721 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.001992890000110492, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004085670007043518, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0015843229994061403, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0015843229994061403 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 4208.780229305133, | |
| "count": 129922, | |
| "is_parallel": true, | |
| "self": 98.96128254718406, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 64.61660218688439, | |
| "count": 129922, | |
| "is_parallel": true, | |
| "self": 64.61660218688439 | |
| }, | |
| "communicator.exchange": { | |
| "total": 3772.3903442479054, | |
| "count": 129922, | |
| "is_parallel": true, | |
| "self": 3772.3903442479054 | |
| }, | |
| "steps_from_proto": { | |
| "total": 272.8120003231588, | |
| "count": 129922, | |
| "is_parallel": true, | |
| "self": 59.76042003351495, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 213.05158028964388, | |
| "count": 1039376, | |
| "is_parallel": true, | |
| "self": 213.05158028964388 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 2425.537618657135, | |
| "count": 129923, | |
| "self": 10.179566866062942, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 374.1836879440898, | |
| "count": 129923, | |
| "self": 373.49525974109065, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.6884282029991482, | |
| "count": 4, | |
| "self": 0.6884282029991482 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 2041.1743638469825, | |
| "count": 936, | |
| "self": 799.9037303269884, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 1241.2706335199941, | |
| "count": 46173, | |
| "self": 1241.2706335199941 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.9119997887173668e-06, | |
| "count": 1, | |
| "self": 1.9119997887173668e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.13282388999869, | |
| "count": 1, | |
| "self": 0.002962276998005109, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.12986161300068488, | |
| "count": 1, | |
| "self": 0.12986161300068488 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |