PPO-RND-Pyramids / run_logs /timers.json

First Model

525be54 about 3 years ago

19.2 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.5572478175163269,
	"min": 0.5386313199996948,
	"max": 1.3910027742385864,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 16574.779296875,
	"min": 16167.55859375,
	"max": 42197.4609375,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989962.0,
	"min": 29952.0,
	"max": 989962.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989962.0,
	"min": 29952.0,
	"max": 989962.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.19189460575580597,
	"min": -0.09870325028896332,
	"max": 0.20162059366703033,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 48.74123001098633,
	"min": -23.688779830932617,
	"max": 51.211631774902344,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.0066856518387794495,
	"min": -0.013917215168476105,
	"max": 0.5439726114273071,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -1.6981555223464966,
	"min": -3.534972667694092,
	"max": 128.9215087890625,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06850204886589696,
	"min": 0.06507357036092752,
	"max": 0.07289688525077552,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9590286841225574,
	"min": 0.48399625766631643,
	"max": 1.0372182905557565,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.008899715815304382,
	"min": 0.0001361964184250879,
	"max": 0.011019201556337064,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.12459602141426135,
	"min": 0.0019067498579512304,
	"max": 0.1542688217887189,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.659804589621429e-06,
	"min": 7.659804589621429e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010723726425470001,
	"min": 0.00010723726425470001,
	"max": 0.0036333232888923,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10255323571428573,
	"min": 0.10255323571428573,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4357453000000002,
	"min": 1.3886848,
	"max": 2.6111077,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002650682478571429,
	"min": 0.0002650682478571429,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.00371095547,
	"min": 0.00371095547,
	"max": 0.12112965923,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.01410889346152544,
	"min": 0.01410889346152544,
	"max": 0.3948425352573395,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.19752450287342072,
	"min": 0.19752450287342072,
	"max": 2.763897657394409,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 648.3125,
	"min": 607.3877551020408,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 31119.0,
	"min": 15984.0,
	"max": 32298.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 0.8932458052101234,
	"min": -1.0000000521540642,
	"max": 0.8932458052101234,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 42.875798650085926,
	"min": -31.989601641893387,
	"max": 42.875798650085926,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 0.8932458052101234,
	"min": -1.0000000521540642,
	"max": 0.8932458052101234,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 42.875798650085926,
	"min": -31.989601641893387,
	"max": 42.875798650085926,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.09404990300269371,
	"min": 0.09404990300269371,
	"max": 7.611463585868478,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 4.514395344129298,
	"min": 4.514395344129298,
	"max": 121.78341737389565,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1674758248",
	"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.29.0.dev0",
	"mlagents_envs_version": "0.29.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.1+cu102",
	"numpy_version": "1.21.6",
	"end_time_seconds": "1674760350"
	},
	"total": 2102.716744429,
	"count": 1,
	"self": 0.5249121119995834,
	"children": {
	"run_training.setup": {
	"total": 0.11594565199993667,
	"count": 1,
	"self": 0.11594565199993667
	},
	"TrainerController.start_learning": {
	"total": 2102.0758866650003,
	"count": 1,
	"self": 1.7838245098801053,
	"children": {
	"TrainerController._reset_env": {
	"total": 6.298491405999812,
	"count": 1,
	"self": 6.298491405999812
	},
	"TrainerController.advance": {
	"total": 2093.905993407121,
	"count": 63299,
	"self": 1.7025431923084398,
	"children": {
	"env_step": {
	"total": 1407.0521682800663,
	"count": 63299,
	"self": 1277.6079131370125,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 128.3829707910054,
	"count": 63299,
	"self": 5.115100918948883,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 123.26786987205651,
	"count": 62573,
	"self": 41.0107970351246,
	"children": {
	"TorchPolicy.sample_actions": {
	"total": 82.25707283693191,
	"count": 62573,
	"self": 82.25707283693191
	}
	}
	}
	}
	},
	"workers": {
	"total": 1.0612843520484603,
	"count": 63299,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2095.8348141662673,
	"count": 63299,
	"is_parallel": true,
	"self": 941.1229038961274,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0018078029997923295,
	"count": 1,
	"is_parallel": true,
	"self": 0.000664938998852449,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0011428640009398805,
	"count": 8,
	"is_parallel": true,
	"self": 0.0011428640009398805
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04912068699923111,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005038569979660679,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005007650006518816,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005007650006518816
	},
	"communicator.exchange": {
	"total": 0.046332585000527615,
	"count": 1,
	"is_parallel": true,
	"self": 0.046332585000527615
	},
	"steps_from_proto": {
	"total": 0.0017834800000855466,
	"count": 1,
	"is_parallel": true,
	"self": 0.00046568000016122824,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013177999999243184,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013177999999243184
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1154.71191027014,
	"count": 63298,
	"is_parallel": true,
	"self": 30.957620933185353,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 25.639935032986614,
	"count": 63298,
	"is_parallel": true,
	"self": 25.639935032986614
	},
	"communicator.exchange": {
	"total": 986.0553037659283,
	"count": 63298,
	"is_parallel": true,
	"self": 986.0553037659283
	},
	"steps_from_proto": {
	"total": 112.05905053803963,
	"count": 63298,
	"is_parallel": true,
	"self": 27.4860797560259,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 84.57297078201373,
	"count": 506384,
	"is_parallel": true,
	"self": 84.57297078201373
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 685.1512819347463,
	"count": 63299,
	"self": 3.1412648536970664,
	"children": {
	"process_trajectory": {
	"total": 155.23856988605985,
	"count": 63299,
	"self": 155.04465968505974,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.19391020100010792,
	"count": 2,
	"self": 0.19391020100010792
	}
	}
	},
	"_update_policy": {
	"total": 526.7714471949894,
	"count": 451,
	"self": 201.44817089387652,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 325.32327630111286,
	"count": 22794,
	"self": 325.32327630111286
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 9.529994713375345e-07,
	"count": 1,
	"self": 9.529994713375345e-07
	},
	"TrainerController._save_models": {
	"total": 0.08757638899987796,
	"count": 1,
	"self": 0.001447713999368716,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08612867500050925,
	"count": 1,
	"self": 0.08612867500050925
	}
	}
	}
	}
	}
	}
	}