ppo-SolarTracker / run_logs /timers.json

First Push

36b2463 verified 9 months ago

14.4 kB

	{
	"name": "root",
	"gauges": {
	"SearcherBrain.Policy.Entropy.mean": {
	"value": -1.5689488649368286,
	"min": -1.5689488649368286,
	"max": -1.2842600345611572,
	"count": 37
	},
	"SearcherBrain.Policy.Entropy.sum": {
	"value": -180742.90625,
	"min": -180792.109375,
	"max": -148193.328125,
	"count": 37
	},
	"SearcherBrain.Environment.EpisodeLength.mean": {
	"value": 599.0,
	"min": 599.0,
	"max": 600.0,
	"count": 37
	},
	"SearcherBrain.Environment.EpisodeLength.sum": {
	"value": 115008.0,
	"min": 115008.0,
	"max": 115200.0,
	"count": 37
	},
	"SearcherBrain.Step.mean": {
	"value": 35699496.0,
	"min": 31469776.0,
	"max": 35699496.0,
	"count": 142
	},
	"SearcherBrain.Step.sum": {
	"value": 35699496.0,
	"min": 31469776.0,
	"max": 35699496.0,
	"count": 142
	},
	"SearcherBrain.Policy.ExtrinsicValueEstimate.mean": {
	"value": 39.6043586730957,
	"min": 31.869272232055664,
	"max": 43.079132080078125,
	"count": 142
	},
	"SearcherBrain.Policy.ExtrinsicValueEstimate.sum": {
	"value": 1980.218017578125,
	"min": 547.5039672851562,
	"max": 2153.95654296875,
	"count": 142
	},
	"SearcherBrain.Environment.CumulativeReward.mean": {
	"value": 176.0731446659565,
	"min": 143.13208571255208,
	"max": 184.8177523803711,
	"count": 142
	},
	"SearcherBrain.Environment.CumulativeReward.sum": {
	"value": 8803.657233297825,
	"min": 2578.779571533203,
	"max": 9240.887619018555,
	"count": 142
	},
	"SearcherBrain.Policy.ExtrinsicReward.mean": {
	"value": 176.0731446659565,
	"min": 143.13208571255208,
	"max": 184.8177523803711,
	"count": 142
	},
	"SearcherBrain.Policy.ExtrinsicReward.sum": {
	"value": 8803.657233297825,
	"min": 2578.779571533203,
	"max": 9240.887619018555,
	"count": 142
	},
	"SearcherBrain.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 142
	},
	"SearcherBrain.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 142
	},
	"SearcherBrain.Losses.PolicyLoss.mean": {
	"value": 0.11566888390354708,
	"min": 0.09146672067137034,
	"max": 0.12758717909406794,
	"count": 36
	},
	"SearcherBrain.Losses.PolicyLoss.sum": {
	"value": 0.11566888390354708,
	"min": 0.09146672067137034,
	"max": 0.12758717909406794,
	"count": 36
	},
	"SearcherBrain.Losses.ValueLoss.mean": {
	"value": 7.1742678271399605,
	"min": 4.739377557237943,
	"max": 9.185592528846529,
	"count": 36
	},
	"SearcherBrain.Losses.ValueLoss.sum": {
	"value": 7.1742678271399605,
	"min": 4.739377557237943,
	"max": 9.185592528846529,
	"count": 36
	},
	"SearcherBrain.Policy.LearningRate.mean": {
	"value": 0.00019317334760889595,
	"min": 0.00019317334760889595,
	"max": 0.000205273375575552,
	"count": 36
	},
	"SearcherBrain.Policy.LearningRate.sum": {
	"value": 0.00019317334760889595,
	"min": 0.00019317334760889595,
	"max": 0.000205273375575552,
	"count": 36
	},
	"SearcherBrain.Policy.Epsilon.mean": {
	"value": 0.16439110399999998,
	"min": 0.16439110399999998,
	"max": 0.16842444800000003,
	"count": 36
	},
	"SearcherBrain.Policy.Epsilon.sum": {
	"value": 0.16439110399999998,
	"min": 0.16439110399999998,
	"max": 0.16842444800000003,
	"count": 36
	},
	"SearcherBrain.Policy.Beta.mean": {
	"value": 0.0032231160896,
	"min": 0.0032231160896,
	"max": 0.0034243799552000007,
	"count": 36
	},
	"SearcherBrain.Policy.Beta.sum": {
	"value": 0.0032231160896,
	"min": 0.0032231160896,
	"max": 0.0034243799552000007,
	"count": 36
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1744103183",
	"python_version": "3.10.10 (tags/v3.10.10:aad5f6a, Feb 7 2023, 17:20:36) [MSC v.1929 64 bit (AMD64)]",
	"command_line_arguments": "C:\\Users\\roque\\python-envs\\rl-env\\Scripts\\mlagents-learn ./config/solartracker_config_ppo.yaml --env=./envs/MultiSolarTrackerEnv --run-id=SolarTrackerPPO --resume",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.6.0+cpu",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1744104712"
	},
	"total": 1529.1202356999984,
	"count": 1,
	"self": 0.28325869999753195,
	"children": {
	"run_training.setup": {
	"total": 0.08089520000066841,
	"count": 1,
	"self": 0.08089520000066841
	},
	"TrainerController.start_learning": {
	"total": 1528.7560818000002,
	"count": 1,
	"self": 0.44316530011201394,
	"children": {
	"TrainerController._reset_env": {
	"total": 6.320846700000402,
	"count": 1,
	"self": 6.320846700000402
	},
	"TrainerController.advance": {
	"total": 1521.9105026998895,
	"count": 22237,
	"self": 0.5204243999578466,
	"children": {
	"env_step": {
	"total": 803.7725172000082,
	"count": 22237,
	"self": 744.6079042997972,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 58.866627000055814,
	"count": 22237,
	"self": 5.4749692000950745,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 53.39165779996074,
	"count": 22208,
	"self": 53.39165779996074
	}
	}
	},
	"workers": {
	"total": 0.29798590015525406,
	"count": 22237,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 1503.534177499967,
	"count": 22237,
	"is_parallel": true,
	"self": 905.5262203999082,
	"children": {
	"steps_from_proto": {
	"total": 0.0027493000015965663,
	"count": 1,
	"is_parallel": true,
	"self": 0.00037040000097476877,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0023789000006217975,
	"count": 2,
	"is_parallel": true,
	"self": 0.0023789000006217975
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 598.0052078000572,
	"count": 22237,
	"is_parallel": true,
	"self": 14.79916039969612,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 36.35460820003391,
	"count": 22237,
	"is_parallel": true,
	"self": 36.35460820003391
	},
	"communicator.exchange": {
	"total": 517.9183317000679,
	"count": 22237,
	"is_parallel": true,
	"self": 517.9183317000679
	},
	"steps_from_proto": {
	"total": 28.93310750025921,
	"count": 22237,
	"is_parallel": true,
	"self": 6.41115339998214,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 22.52195410027707,
	"count": 44474,
	"is_parallel": true,
	"self": 22.52195410027707
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 717.6175610999235,
	"count": 22237,
	"self": 1.1822864997302531,
	"children": {
	"process_trajectory": {
	"total": 248.01313250019302,
	"count": 22237,
	"self": 247.27856620019702,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.7345662999960041,
	"count": 9,
	"self": 0.7345662999960041
	}
	}
	},
	"_update_policy": {
	"total": 468.4221421000002,
	"count": 37,
	"self": 38.10555700000259,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 430.3165850999976,
	"count": 6660,
	"self": 430.3165850999976
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.999995770864189e-07,
	"count": 1,
	"self": 8.999995770864189e-07
	},
	"TrainerController._save_models": {
	"total": 0.08156619999863324,
	"count": 1,
	"self": 0.0017178999987663701,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.07984829999986687,
	"count": 1,
	"self": 0.07984829999986687
	}
	}
	}
	}
	}
	}
	}