First Push

025e1f6 verified almost 2 years ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.15648406744003296,
	"min": 0.15526911616325378,
	"max": 1.4576489925384521,
	"count": 100
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 4682.00341796875,
	"min": 4618.32470703125,
	"max": 44219.23828125,
	"count": 100
	},
	"Pyramids.Step.mean": {
	"value": 2999950.0,
	"min": 29952.0,
	"max": 2999950.0,
	"count": 100
	},
	"Pyramids.Step.sum": {
	"value": 2999950.0,
	"min": 29952.0,
	"max": 2999950.0,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.8419708013534546,
	"min": -0.09999159723520279,
	"max": 0.8908884525299072,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 254.27517700195312,
	"min": -23.997983932495117,
	"max": 269.0483093261719,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.0005854564369656146,
	"min": -0.025869233533740044,
	"max": 0.3011578619480133,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -0.17680785059928894,
	"min": -6.726000785827637,
	"max": 72.88020324707031,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06635388502500904,
	"min": 0.06375473797067702,
	"max": 0.07373669026297643,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9289543903501266,
	"min": 0.4816754833897496,
	"max": 1.079091215909655,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01574389996727425,
	"min": 0.00020649086813176947,
	"max": 0.017026865324142444,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.2204145995418395,
	"min": 0.0028908721538447725,
	"max": 0.2486327111905934,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 1.560278051369048e-06,
	"min": 1.560278051369048e-06,
	"max": 0.00029838354339596195,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 2.1843892719166674e-05,
	"min": 2.1843892719166674e-05,
	"max": 0.003969440876853066,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10052005952380953,
	"min": 0.10052005952380953,
	"max": 0.19946118095238097,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4072808333333335,
	"min": 1.3962282666666668,
	"max": 2.7674191333333344,
	"count": 100
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 6.195394642857145e-05,
	"min": 6.195394642857145e-05,
	"max": 0.009946171977142856,
	"count": 100
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0008673552500000003,
	"min": 0.0008673552500000003,
	"max": 0.13232237864,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.005206058733165264,
	"min": 0.0050305589102208614,
	"max": 0.529541015625,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.07288482040166855,
	"min": 0.07042782753705978,
	"max": 3.706787109375,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 206.6978417266187,
	"min": 204.82119205298014,
	"max": 999.0,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 28731.0,
	"min": 15984.0,
	"max": 33496.0,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.7805956389377082,
	"min": -1.0000000521540642,
	"max": 1.7843846004742843,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 245.72219817340374,
	"min": -29.802001617848873,
	"max": 267.411798119545,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.7805956389377082,
	"min": -1.0000000521540642,
	"max": 1.7843846004742843,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 245.72219817340374,
	"min": -29.802001617848873,
	"max": 267.411798119545,
	"count": 100
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.011204389614051805,
	"min": 0.011204389614051805,
	"max": 10.77631295658648,
	"count": 100
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 1.5462057667391491,
	"min": 1.5462057667391491,
	"max": 172.42100730538368,
	"count": 100
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1710437298",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/home/tikhon/anaconda3/envs/mlagents/bin/mlagents-learn ../config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.0.0",
	"mlagents_envs_version": "1.0.0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.1",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1710441946"
	},
	"total": 4647.532118725001,
	"count": 1,
	"self": 0.31966334099888627,
	"children": {
	"run_training.setup": {
	"total": 0.018745831001069746,
	"count": 1,
	"self": 0.018745831001069746
	},
	"TrainerController.start_learning": {
	"total": 4647.193709553001,
	"count": 1,
	"self": 3.5560735466660844,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.5141093009988253,
	"count": 1,
	"self": 1.5141093009988253
	},
	"TrainerController.advance": {
	"total": 4642.067872695332,
	"count": 195069,
	"self": 3.4164983091650356,
	"children": {
	"env_step": {
	"total": 3056.4457490606,
	"count": 195069,
	"self": 2829.550677944624,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 224.5273600923192,
	"count": 195069,
	"self": 10.340624971253419,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 214.1867351210658,
	"count": 187547,
	"self": 214.1867351210658
	}
	}
	},
	"workers": {
	"total": 2.3677110236567387,
	"count": 195069,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 4642.366809390001,
	"count": 195069,
	"is_parallel": true,
	"self": 2068.1822051252075,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.001196270999571425,
	"count": 1,
	"is_parallel": true,
	"self": 0.00033221499870705884,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0008640560008643661,
	"count": 8,
	"is_parallel": true,
	"self": 0.0008640560008643661
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.0372296980003739,
	"count": 1,
	"is_parallel": true,
	"self": 0.0002497889981896151,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0003989140004705405,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003989140004705405
	},
	"communicator.exchange": {
	"total": 0.035797853000985924,
	"count": 1,
	"is_parallel": true,
	"self": 0.035797853000985924
	},
	"steps_from_proto": {
	"total": 0.0007831420007278211,
	"count": 1,
	"is_parallel": true,
	"self": 0.00017009699877235107,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0006130450019554701,
	"count": 8,
	"is_parallel": true,
	"self": 0.0006130450019554701
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2574.184604264794,
	"count": 195068,
	"is_parallel": true,
	"self": 71.99591521421826,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 47.65340357073546,
	"count": 195068,
	"is_parallel": true,
	"self": 47.65340357073546
	},
	"communicator.exchange": {
	"total": 2247.579691982224,
	"count": 195068,
	"is_parallel": true,
	"self": 2247.579691982224
	},
	"steps_from_proto": {
	"total": 206.95559349761606,
	"count": 195068,
	"is_parallel": true,
	"self": 41.96395975608539,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 164.99163374153068,
	"count": 1560544,
	"is_parallel": true,
	"self": 164.99163374153068
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1582.2056253255669,
	"count": 195069,
	"self": 7.049938452297283,
	"children": {
	"process_trajectory": {
	"total": 250.09003616930022,
	"count": 195069,
	"self": 249.75688899029774,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.3331471790024807,
	"count": 6,
	"self": 0.3331471790024807
	}
	}
	},
	"_update_policy": {
	"total": 1325.0656507039694,
	"count": 1397,
	"self": 719.2999167647304,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 605.765733939239,
	"count": 68331,
	"self": 605.765733939239
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 7.570015441160649e-07,
	"count": 1,
	"self": 7.570015441160649e-07
	},
	"TrainerController._save_models": {
	"total": 0.05565325300267432,
	"count": 1,
	"self": 0.0016590530030953232,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.053994199999578996,
	"count": 1,
	"self": 0.053994199999578996
	}
	}
	}
	}
	}
	}
	}