{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 1.00198233127594,
"min": 0.9921206831932068,
"max": 1.4485609531402588,
"count": 4
},
"Pyramids.Policy.Entropy.sum": {
"value": 30011.375,
"min": 30011.375,
"max": 43943.546875,
"count": 4
},
"Pyramids.Step.mean": {
"value": 119947.0,
"min": 29914.0,
"max": 119947.0,
"count": 4
},
"Pyramids.Step.sum": {
"value": 119947.0,
"min": 29914.0,
"max": 119947.0,
"count": 4
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.08380933851003647,
"min": -0.08380933851003647,
"max": 0.03136281296610832,
"count": 4
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": -20.2818603515625,
"min": -20.2818603515625,
"max": 7.432986259460449,
"count": 4
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.08611355721950531,
"min": 0.08611355721950531,
"max": 0.2662358582019806,
"count": 4
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 20.839481353759766,
"min": 20.839481353759766,
"max": 64.4290771484375,
"count": 4
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06898505029814996,
"min": 0.06898505029814996,
"max": 0.07291630261307913,
"count": 4
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.8968056538759493,
"min": 0.583330420904633,
"max": 0.9145981951577791,
"count": 4
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.001384501303736123,
"min": 0.001384501303736123,
"max": 0.007094622672303227,
"count": 4
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.0179985169485696,
"min": 0.0179985169485696,
"max": 0.056756981378425816,
"count": 4
},
"Pyramids.Policy.LearningRate.mean": {
"value": 0.0002893945189197769,
"min": 0.0002893945189197769,
"max": 0.0002984042755319083,
"count": 4
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.0037621287459570995,
"min": 0.0023872342042552666,
"max": 0.0038025975324674994,
"count": 4
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.1964648384615385,
"min": 0.1964648384615385,
"max": 0.19946809166666668,
"count": 4
},
"Pyramids.Policy.Epsilon.sum": {
"value": 2.5540429000000007,
"min": 1.5957447333333334,
"max": 2.5675324999999996,
"count": 4
},
"Pyramids.Policy.Beta.mean": {
"value": 0.009646837362307693,
"min": 0.009646837362307693,
"max": 0.009946862357499999,
"count": 4
},
"Pyramids.Policy.Beta.sum": {
"value": 0.12540888571,
"min": 0.07957489885999999,
"max": 0.12675649675,
"count": 4
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.07624217122793198,
"min": 0.07624217122793198,
"max": 0.5006290078163147,
"count": 4
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.9911482334136963,
"min": 0.9911482334136963,
"max": 4.005032062530518,
"count": 4
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 952.6470588235294,
"min": 952.6470588235294,
"max": 996.625,
"count": 4
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 32390.0,
"min": 15946.0,
"max": 32800.0,
"count": 4
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": -0.8358471086796593,
"min": -0.8725625551305711,
"max": -0.7976242969885017,
"count": 4
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": -28.418801695108414,
"min": -28.830801710486412,
"max": -13.961000882089138,
"count": 4
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": -0.8358471086796593,
"min": -0.8725625551305711,
"max": -0.7976242969885017,
"count": 4
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": -28.418801695108414,
"min": -28.830801710486412,
"max": -13.961000882089138,
"count": 4
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.7794637884944677,
"min": 0.7794637884944677,
"max": 10.226822283118963,
"count": 4
},
"Pyramids.Policy.RndReward.sum": {
"value": 26.501768808811903,
"min": 26.501768808811903,
"max": 163.6291565299034,
"count": 4
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 4
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 4
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1674467848",
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.29.0.dev0",
"mlagents_envs_version": "0.29.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.1+cu102",
"numpy_version": "1.21.6",
"end_time_seconds": "1674468135"
},
"total": 286.8594396850001,
"count": 1,
"self": 0.30682105500000034,
"children": {
"run_training.setup": {
"total": 0.10416299700000309,
"count": 1,
"self": 0.10416299700000309
},
"TrainerController.start_learning": {
"total": 286.4484556330001,
"count": 1,
"self": 0.17793223698390648,
"children": {
"TrainerController._reset_env": {
"total": 6.174762633,
"count": 1,
"self": 6.174762633
},
"TrainerController.advance": {
"total": 279.9142511180162,
"count": 9324,
"self": 0.1896541740087514,
"children": {
"env_step": {
"total": 183.5860191530079,
"count": 9324,
"self": 167.853302513024,
"children": {
"SubprocessEnvManager._take_step": {
"total": 15.622803599992949,
"count": 9324,
"self": 0.6379715359952343,
"children": {
"TorchPolicy.evaluate": {
"total": 14.984832063997715,
"count": 9288,
"self": 5.023445084994023,
"children": {
"TorchPolicy.sample_actions": {
"total": 9.961386979003692,
"count": 9288,
"self": 9.961386979003692
}
}
}
}
},
"workers": {
"total": 0.1099130399909427,
"count": 9323,
"self": 0.0,
"children": {
"worker_root": {
"total": 285.7027269049919,
"count": 9323,
"is_parallel": true,
"self": 132.44011913698967,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0018625420000262238,
"count": 1,
"is_parallel": true,
"self": 0.0007037320000335967,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011588099999926271,
"count": 8,
"is_parallel": true,
"self": 0.0011588099999926271
}
}
},
"UnityEnvironment.step": {
"total": 0.045178636999935406,
"count": 1,
"is_parallel": true,
"self": 0.0005328179997832194,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004357630000413337,
"count": 1,
"is_parallel": true,
"self": 0.0004357630000413337
},
"communicator.exchange": {
"total": 0.04249145200003568,
"count": 1,
"is_parallel": true,
"self": 0.04249145200003568
},
"steps_from_proto": {
"total": 0.0017186040000751746,
"count": 1,
"is_parallel": true,
"self": 0.0004508870001700416,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001267716999905133,
"count": 8,
"is_parallel": true,
"self": 0.001267716999905133
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 153.26260776800223,
"count": 9322,
"is_parallel": true,
"self": 4.146317096021221,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 3.5863848909863236,
"count": 9322,
"is_parallel": true,
"self": 3.5863848909863236
},
"communicator.exchange": {
"total": 130.14465234200338,
"count": 9322,
"is_parallel": true,
"self": 130.14465234200338
},
"steps_from_proto": {
"total": 15.385253438991299,
"count": 9322,
"is_parallel": true,
"self": 3.410272352995321,
"children": {
"_process_rank_one_or_two_observation": {
"total": 11.974981085995978,
"count": 74576,
"is_parallel": true,
"self": 11.974981085995978
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 96.13857779099953,
"count": 9323,
"self": 0.2502447500029348,
"children": {
"process_trajectory": {
"total": 21.763189877997547,
"count": 9323,
"self": 21.763189877997547
},
"_update_policy": {
"total": 74.12514316299905,
"count": 56,
"self": 27.909818004999693,
"children": {
"TorchPPOOptimizer.update": {
"total": 46.21532515799936,
"count": 3393,
"self": 46.21532515799936
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.3010001111979363e-06,
"count": 1,
"self": 1.3010001111979363e-06
},
"TrainerController._save_models": {
"total": 0.18150834399989435,
"count": 1,
"self": 0.0018405879998226737,
"children": {
"RLTrainer._checkpoint": {
"total": 0.17966775600007168,
"count": 1,
"self": 0.17966775600007168
}
}
}
}
}
}
}