First Push

cc02649 over 2 years ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.4323011040687561,
	"min": 0.4323011040687561,
	"max": 1.521894097328186,
	"count": 46
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 13038.201171875,
	"min": 13038.201171875,
	"max": 46168.1796875,
	"count": 46
	},
	"Pyramids.Step.mean": {
	"value": 1379889.0,
	"min": 29952.0,
	"max": 1379889.0,
	"count": 46
	},
	"Pyramids.Step.sum": {
	"value": 1379889.0,
	"min": 29952.0,
	"max": 1379889.0,
	"count": 46
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.6202417612075806,
	"min": -0.12486793100833893,
	"max": 0.6453419923782349,
	"count": 46
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 174.90817260742188,
	"min": -29.593700408935547,
	"max": 179.4050750732422,
	"count": 46
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.012686235830187798,
	"min": -0.020177382975816727,
	"max": 0.10471756756305695,
	"count": 46
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -3.5775184631347656,
	"min": -4.782039642333984,
	"max": 25.341651916503906,
	"count": 46
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07091114711191202,
	"min": 0.06393599365570475,
	"max": 0.07449721325344096,
	"count": 46
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9927560595667683,
	"min": 0.4811091471929103,
	"max": 1.1174581988016143,
	"count": 46
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.013107569443198255,
	"min": 0.0003153645406325535,
	"max": 0.014699944187480213,
	"count": 46
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.18350597220477557,
	"min": 0.004322338205057764,
	"max": 0.20579921862472297,
	"count": 46
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 0.00016352934549023333,
	"min": 0.00016352934549023333,
	"max": 0.00029838354339596195,
	"count": 46
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.0022894108368632666,
	"min": 0.0020886848037717336,
	"max": 0.003969584076805333,
	"count": 46
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.15450976666666666,
	"min": 0.15450976666666666,
	"max": 0.19946118095238097,
	"count": 46
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 2.1631367333333333,
	"min": 1.3962282666666668,
	"max": 2.7231946666666667,
	"count": 46
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00545552569,
	"min": 0.00545552569,
	"max": 0.009946171977142856,
	"count": 46
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.07637735966,
	"min": 0.06962320384,
	"max": 0.13232714720000002,
	"count": 46
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.005336236208677292,
	"min": 0.005336236208677292,
	"max": 0.26477232575416565,
	"count": 46
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.07470730692148209,
	"min": 0.07470730692148209,
	"max": 1.8534061908721924,
	"count": 46
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 297.9375,
	"min": 297.1546391752577,
	"max": 999.0,
	"count": 46
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 28602.0,
	"min": 15984.0,
	"max": 33129.0,
	"count": 46
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.6535793652700395,
	"min": -1.0000000521540642,
	"max": 1.702845345606509,
	"count": 46
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 160.39719843119383,
	"min": -30.9994016289711,
	"max": 165.17599852383137,
	"count": 46
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.6535793652700395,
	"min": -1.0000000521540642,
	"max": 1.702845345606509,
	"count": 46
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 160.39719843119383,
	"min": -30.9994016289711,
	"max": 165.17599852383137,
	"count": 46
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.016989419559921743,
	"min": 0.016989419559921743,
	"max": 5.501258888281882,
	"count": 46
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 1.647973697312409,
	"min": 1.647973697312409,
	"max": 88.02014221251011,
	"count": 46
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 46
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 46
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1698107012",
	"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.1.0+cu118",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1698110176"
	},
	"total": 3164.609970321,
	"count": 1,
	"self": 0.4864675460003127,
	"children": {
	"run_training.setup": {
	"total": 0.042338582999946084,
	"count": 1,
	"self": 0.042338582999946084
	},
	"TrainerController.start_learning": {
	"total": 3164.081164192,
	"count": 1,
	"self": 2.0965730678226464,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.4329820379998637,
	"count": 1,
	"self": 3.4329820379998637
	},
	"TrainerController.advance": {
	"total": 3158.548553360177,
	"count": 88580,
	"self": 2.178246579084771,
	"children": {
	"env_step": {
	"total": 2261.430189991037,
	"count": 88580,
	"self": 2063.367065181015,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 196.76392753203095,
	"count": 88580,
	"self": 6.740243861953559,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 190.0236836700774,
	"count": 86988,
	"self": 190.0236836700774
	}
	}
	},
	"workers": {
	"total": 1.2991972779911976,
	"count": 88579,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3157.3664632769987,
	"count": 88579,
	"is_parallel": true,
	"self": 1269.1054589470596,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0018875400000979425,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006164230001104443,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012711169999874983,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012711169999874983
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.05493908999983432,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005921249999119027,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005522349999864673,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005522349999864673
	},
	"communicator.exchange": {
	"total": 0.05209911899987674,
	"count": 1,
	"is_parallel": true,
	"self": 0.05209911899987674
	},
	"steps_from_proto": {
	"total": 0.0016956110000592162,
	"count": 1,
	"is_parallel": true,
	"self": 0.00036968400013392966,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013259269999252865,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013259269999252865
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1888.2610043299392,
	"count": 88578,
	"is_parallel": true,
	"self": 49.84024531483192,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 36.26995800008808,
	"count": 88578,
	"is_parallel": true,
	"self": 36.26995800008808
	},
	"communicator.exchange": {
	"total": 1655.7077670529593,
	"count": 88578,
	"is_parallel": true,
	"self": 1655.7077670529593
	},
	"steps_from_proto": {
	"total": 146.44303396205987,
	"count": 88578,
	"is_parallel": true,
	"self": 30.148753674154705,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 116.29428028790517,
	"count": 708624,
	"is_parallel": true,
	"self": 116.29428028790517
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 894.9401167900551,
	"count": 88579,
	"self": 3.96228238894696,
	"children": {
	"process_trajectory": {
	"total": 179.12121907810092,
	"count": 88579,
	"self": 178.95132169610156,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.16989738199936255,
	"count": 2,
	"self": 0.16989738199936255
	}
	}
	},
	"_update_policy": {
	"total": 711.8566153230072,
	"count": 635,
	"self": 419.2086930179803,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 292.6479223050269,
	"count": 31677,
	"self": 292.6479223050269
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.1800002539530396e-06,
	"count": 1,
	"self": 1.1800002539530396e-06
	},
	"TrainerController._save_models": {
	"total": 0.0030545460003850167,
	"count": 1,
	"self": 2.3812000108591747e-05,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.003030734000276425,
	"count": 1,
	"self": 0.003030734000276425
	}
	}
	}
	}
	}
	}
	}