ppo-SnowballTarget / run_logs /timers.json

First Push

19a9a48 about 3 years ago

19 kB

	{
	"name": "root",
	"gauges": {
	"SnowballTarget.Policy.Entropy.mean": {
	"value": 0.8279334902763367,
	"min": 0.8279334902763367,
	"max": 2.8590214252471924,
	"count": 20
	},
	"SnowballTarget.Policy.Entropy.sum": {
	"value": 7896.001953125,
	"min": 7896.001953125,
	"max": 29279.23828125,
	"count": 20
	},
	"SnowballTarget.Step.mean": {
	"value": 199984.0,
	"min": 9952.0,
	"max": 199984.0,
	"count": 20
	},
	"SnowballTarget.Step.sum": {
	"value": 199984.0,
	"min": 9952.0,
	"max": 199984.0,
	"count": 20
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
	"value": 12.960752487182617,
	"min": 0.2753119170665741,
	"max": 12.960752487182617,
	"count": 20
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
	"value": 2527.3466796875,
	"min": 53.4105110168457,
	"max": 2642.76611328125,
	"count": 20
	},
	"SnowballTarget.Environment.EpisodeLength.mean": {
	"value": 199.0,
	"min": 199.0,
	"max": 199.0,
	"count": 20
	},
	"SnowballTarget.Environment.EpisodeLength.sum": {
	"value": 8756.0,
	"min": 8756.0,
	"max": 10945.0,
	"count": 20
	},
	"SnowballTarget.Losses.PolicyLoss.mean": {
	"value": 0.07264678573390519,
	"min": 0.06446490807506694,
	"max": 0.07321259986024861,
	"count": 20
	},
	"SnowballTarget.Losses.PolicyLoss.sum": {
	"value": 0.29058714293562077,
	"min": 0.26223109220311513,
	"max": 0.3660629993012431,
	"count": 20
	},
	"SnowballTarget.Losses.ValueLoss.mean": {
	"value": 0.19491095789799504,
	"min": 0.12156432431291643,
	"max": 0.27539325730473385,
	"count": 20
	},
	"SnowballTarget.Losses.ValueLoss.sum": {
	"value": 0.7796438315919801,
	"min": 0.4862572972516657,
	"max": 1.3769662865236691,
	"count": 20
	},
	"SnowballTarget.Policy.LearningRate.mean": {
	"value": 8.082097306000005e-06,
	"min": 8.082097306000005e-06,
	"max": 0.000291882002706,
	"count": 20
	},
	"SnowballTarget.Policy.LearningRate.sum": {
	"value": 3.232838922400002e-05,
	"min": 3.232838922400002e-05,
	"max": 0.00138516003828,
	"count": 20
	},
	"SnowballTarget.Policy.Epsilon.mean": {
	"value": 0.10269400000000001,
	"min": 0.10269400000000001,
	"max": 0.19729400000000002,
	"count": 20
	},
	"SnowballTarget.Policy.Epsilon.sum": {
	"value": 0.41077600000000003,
	"min": 0.41077600000000003,
	"max": 0.96172,
	"count": 20
	},
	"SnowballTarget.Policy.Beta.mean": {
	"value": 0.0001444306000000001,
	"min": 0.0001444306000000001,
	"max": 0.0048649706,
	"count": 20
	},
	"SnowballTarget.Policy.Beta.sum": {
	"value": 0.0005777224000000004,
	"min": 0.0005777224000000004,
	"max": 0.023089828,
	"count": 20
	},
	"SnowballTarget.Environment.CumulativeReward.mean": {
	"value": 25.045454545454547,
	"min": 3.340909090909091,
	"max": 25.836363636363636,
	"count": 20
	},
	"SnowballTarget.Environment.CumulativeReward.sum": {
	"value": 1102.0,
	"min": 147.0,
	"max": 1421.0,
	"count": 20
	},
	"SnowballTarget.Policy.ExtrinsicReward.mean": {
	"value": 25.045454545454547,
	"min": 3.340909090909091,
	"max": 25.836363636363636,
	"count": 20
	},
	"SnowballTarget.Policy.ExtrinsicReward.sum": {
	"value": 1102.0,
	"min": 147.0,
	"max": 1421.0,
	"count": 20
	},
	"SnowballTarget.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 20
	},
	"SnowballTarget.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 20
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1674035472",
	"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
	"mlagents_version": "0.29.0.dev0",
	"mlagents_envs_version": "0.29.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.1+cu102",
	"numpy_version": "1.21.6",
	"end_time_seconds": "1674035911"
	},
	"total": 438.928908297,
	"count": 1,
	"self": 0.38872646999993776,
	"children": {
	"run_training.setup": {
	"total": 0.1035128830000076,
	"count": 1,
	"self": 0.1035128830000076
	},
	"TrainerController.start_learning": {
	"total": 438.4366689440001,
	"count": 1,
	"self": 0.5348161190139535,
	"children": {
	"TrainerController._reset_env": {
	"total": 9.630275627999936,
	"count": 1,
	"self": 9.630275627999936
	},
	"TrainerController.advance": {
	"total": 428.14202194398615,
	"count": 18201,
	"self": 0.263697386955414,
	"children": {
	"env_step": {
	"total": 427.87832455703074,
	"count": 18201,
	"self": 280.07090272503035,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 147.54148002299723,
	"count": 18201,
	"self": 1.4011753590028775,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 146.14030466399436,
	"count": 18201,
	"self": 33.370133937987475,
	"children": {
	"TorchPolicy.sample_actions": {
	"total": 112.77017072600688,
	"count": 18201,
	"self": 112.77017072600688
	}
	}
	}
	}
	},
	"workers": {
	"total": 0.26594180900315223,
	"count": 18201,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 437.13143204398955,
	"count": 18201,
	"is_parallel": true,
	"self": 211.13834060199258,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.005951294000055896,
	"count": 1,
	"is_parallel": true,
	"self": 0.003613513999994211,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0023377800000616844,
	"count": 10,
	"is_parallel": true,
	"self": 0.0023377800000616844
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.03607890499995392,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006189309998489989,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00033488300005046767,
	"count": 1,
	"is_parallel": true,
	"self": 0.00033488300005046767
	},
	"communicator.exchange": {
	"total": 0.033054273000061585,
	"count": 1,
	"is_parallel": true,
	"self": 0.033054273000061585
	},
	"steps_from_proto": {
	"total": 0.002070817999992869,
	"count": 1,
	"is_parallel": true,
	"self": 0.00047214399990025413,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0015986740000926147,
	"count": 10,
	"is_parallel": true,
	"self": 0.0015986740000926147
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 225.99309144199697,
	"count": 18200,
	"is_parallel": true,
	"self": 8.437238615998353,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 5.1142906330048845,
	"count": 18200,
	"is_parallel": true,
	"self": 5.1142906330048845
	},
	"communicator.exchange": {
	"total": 181.24482770000202,
	"count": 18200,
	"is_parallel": true,
	"self": 181.24482770000202
	},
	"steps_from_proto": {
	"total": 31.19673449299171,
	"count": 18200,
	"is_parallel": true,
	"self": 6.683066412021503,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 24.513668080970206,
	"count": 182000,
	"is_parallel": true,
	"self": 24.513668080970206
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 4.3729000026360154e-05,
	"count": 1,
	"self": 4.3729000026360154e-05,
	"children": {
	"thread_root": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"trainer_advance": {
	"total": 425.03856793990235,
	"count": 358624,
	"is_parallel": true,
	"self": 9.582208081875024,
	"children": {
	"process_trajectory": {
	"total": 245.9524048190283,
	"count": 358624,
	"is_parallel": true,
	"self": 245.2404350400284,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.7119697789999009,
	"count": 4,
	"is_parallel": true,
	"self": 0.7119697789999009
	}
	}
	},
	"_update_policy": {
	"total": 169.50395503899904,
	"count": 90,
	"is_parallel": true,
	"self": 44.94844377999607,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 124.55551125900297,
	"count": 4587,
	"is_parallel": true,
	"self": 124.55551125900297
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"TrainerController._save_models": {
	"total": 0.12951152400000865,
	"count": 1,
	"self": 0.0008794579998721019,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.12863206600013655,
	"count": 1,
	"self": 0.12863206600013655
	}
	}
	}
	}
	}
	}
	}