ppo-SnowballTarget / run_logs /timers.json

First Push

ed14733 over 2 years ago

18.4 kB

	{
	"name": "root",
	"gauges": {
	"SnowballTarget.Policy.Entropy.mean": {
	"value": 1.0076357126235962,
	"min": 1.0076357126235962,
	"max": 2.8541014194488525,
	"count": 20
	},
	"SnowballTarget.Policy.Entropy.sum": {
	"value": 9620.90625,
	"min": 9620.90625,
	"max": 29228.853515625,
	"count": 20
	},
	"SnowballTarget.Step.mean": {
	"value": 199984.0,
	"min": 9952.0,
	"max": 199984.0,
	"count": 20
	},
	"SnowballTarget.Step.sum": {
	"value": 199984.0,
	"min": 9952.0,
	"max": 199984.0,
	"count": 20
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
	"value": 1.2503714561462402,
	"min": 0.11449915915727615,
	"max": 1.2569438219070435,
	"count": 20
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
	"value": 243.8224334716797,
	"min": 22.21283721923828,
	"max": 255.97384643554688,
	"count": 20
	},
	"SnowballTarget.Environment.EpisodeLength.mean": {
	"value": 199.0,
	"min": 199.0,
	"max": 199.0,
	"count": 20
	},
	"SnowballTarget.Environment.EpisodeLength.sum": {
	"value": 8756.0,
	"min": 8756.0,
	"max": 10945.0,
	"count": 20
	},
	"SnowballTarget.Losses.PolicyLoss.mean": {
	"value": 0.06537453140624042,
	"min": 0.06079026495689166,
	"max": 0.07255646927874562,
	"count": 20
	},
	"SnowballTarget.Losses.PolicyLoss.sum": {
	"value": 0.26149812562496166,
	"min": 0.24316105982756664,
	"max": 0.36206743187344104,
	"count": 20
	},
	"SnowballTarget.Losses.ValueLoss.mean": {
	"value": 0.10795289358379795,
	"min": 0.043170824423820406,
	"max": 0.11508442762435651,
	"count": 20
	},
	"SnowballTarget.Losses.ValueLoss.sum": {
	"value": 0.4318115743351918,
	"min": 0.17268329769528162,
	"max": 0.5754221381217826,
	"count": 20
	},
	"SnowballTarget.Policy.LearningRate.mean": {
	"value": 8.082097306000005e-06,
	"min": 8.082097306000005e-06,
	"max": 0.000291882002706,
	"count": 20
	},
	"SnowballTarget.Policy.LearningRate.sum": {
	"value": 3.232838922400002e-05,
	"min": 3.232838922400002e-05,
	"max": 0.00138516003828,
	"count": 20
	},
	"SnowballTarget.Policy.Epsilon.mean": {
	"value": 0.10269400000000001,
	"min": 0.10269400000000001,
	"max": 0.19729400000000002,
	"count": 20
	},
	"SnowballTarget.Policy.Epsilon.sum": {
	"value": 0.41077600000000003,
	"min": 0.41077600000000003,
	"max": 0.96172,
	"count": 20
	},
	"SnowballTarget.Policy.Beta.mean": {
	"value": 0.0001444306000000001,
	"min": 0.0001444306000000001,
	"max": 0.0048649706,
	"count": 20
	},
	"SnowballTarget.Policy.Beta.sum": {
	"value": 0.0005777224000000004,
	"min": 0.0005777224000000004,
	"max": 0.023089828,
	"count": 20
	},
	"SnowballTarget.Environment.CumulativeReward.mean": {
	"value": 24.75,
	"min": 3.2954545454545454,
	"max": 24.75,
	"count": 20
	},
	"SnowballTarget.Environment.CumulativeReward.sum": {
	"value": 1089.0,
	"min": 145.0,
	"max": 1353.0,
	"count": 20
	},
	"SnowballTarget.Policy.ExtrinsicReward.mean": {
	"value": 24.75,
	"min": 3.2954545454545454,
	"max": 24.75,
	"count": 20
	},
	"SnowballTarget.Policy.ExtrinsicReward.sum": {
	"value": 1089.0,
	"min": 145.0,
	"max": 1353.0,
	"count": 20
	},
	"SnowballTarget.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 20
	},
	"SnowballTarget.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 20
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1687336504",
	"python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1687336961"
	},
	"total": 457.6743351670001,
	"count": 1,
	"self": 0.38502534600013405,
	"children": {
	"run_training.setup": {
	"total": 0.04004001800001333,
	"count": 1,
	"self": 0.04004001800001333
	},
	"TrainerController.start_learning": {
	"total": 457.24926980299995,
	"count": 1,
	"self": 0.5385772319938269,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.060846866999896,
	"count": 1,
	"self": 4.060846866999896
	},
	"TrainerController.advance": {
	"total": 452.5134801930061,
	"count": 18202,
	"self": 0.24959090201070921,
	"children": {
	"env_step": {
	"total": 452.2638892909954,
	"count": 18202,
	"self": 331.93087227898627,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 120.07621832500104,
	"count": 18202,
	"self": 1.9188470700026983,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 118.15737125499834,
	"count": 18202,
	"self": 118.15737125499834
	}
	}
	},
	"workers": {
	"total": 0.25679868700808584,
	"count": 18202,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 455.5438302870066,
	"count": 18202,
	"is_parallel": true,
	"self": 213.67731299701074,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.005608143000017662,
	"count": 1,
	"is_parallel": true,
	"self": 0.003908295999963229,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001699847000054433,
	"count": 10,
	"is_parallel": true,
	"self": 0.001699847000054433
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.03421949099993071,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005817009999873335,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0003506189999598064,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003506189999598064
	},
	"communicator.exchange": {
	"total": 0.0312768710000455,
	"count": 1,
	"is_parallel": true,
	"self": 0.0312768710000455
	},
	"steps_from_proto": {
	"total": 0.00201029999993807,
	"count": 1,
	"is_parallel": true,
	"self": 0.00036989000011544704,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001640409999822623,
	"count": 10,
	"is_parallel": true,
	"self": 0.001640409999822623
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 241.86651728999584,
	"count": 18201,
	"is_parallel": true,
	"self": 10.169303139990461,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 5.166734137998446,
	"count": 18201,
	"is_parallel": true,
	"self": 5.166734137998446
	},
	"communicator.exchange": {
	"total": 192.65408182500903,
	"count": 18201,
	"is_parallel": true,
	"self": 192.65408182500903
	},
	"steps_from_proto": {
	"total": 33.8763981869979,
	"count": 18201,
	"is_parallel": true,
	"self": 6.07507280794016,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 27.801325379057744,
	"count": 182010,
	"is_parallel": true,
	"self": 27.801325379057744
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 0.00011680600005092856,
	"count": 1,
	"self": 0.00011680600005092856,
	"children": {
	"thread_root": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"trainer_advance": {
	"total": 449.0632430999626,
	"count": 430333,
	"is_parallel": true,
	"self": 9.277428346986653,
	"children": {
	"process_trajectory": {
	"total": 245.28750594697613,
	"count": 430333,
	"is_parallel": true,
	"self": 244.17181640297622,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.1156895439999062,
	"count": 4,
	"is_parallel": true,
	"self": 1.1156895439999062
	}
	}
	},
	"_update_policy": {
	"total": 194.49830880599984,
	"count": 90,
	"is_parallel": true,
	"self": 76.03361529999768,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 118.46469350600216,
	"count": 4587,
	"is_parallel": true,
	"self": 118.46469350600216
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"TrainerController._save_models": {
	"total": 0.1362487050000709,
	"count": 1,
	"self": 0.0008559890002288739,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.13539271599984204,
	"count": 1,
	"self": 0.13539271599984204
	}
	}
	}
	}
	}
	}
	}