SamuelM0422's picture
First Push
36b2463 verified
{
"name": "root",
"gauges": {
"SearcherBrain.Policy.Entropy.mean": {
"value": -1.5689488649368286,
"min": -1.5689488649368286,
"max": -1.2842600345611572,
"count": 37
},
"SearcherBrain.Policy.Entropy.sum": {
"value": -180742.90625,
"min": -180792.109375,
"max": -148193.328125,
"count": 37
},
"SearcherBrain.Environment.EpisodeLength.mean": {
"value": 599.0,
"min": 599.0,
"max": 600.0,
"count": 37
},
"SearcherBrain.Environment.EpisodeLength.sum": {
"value": 115008.0,
"min": 115008.0,
"max": 115200.0,
"count": 37
},
"SearcherBrain.Step.mean": {
"value": 35699496.0,
"min": 31469776.0,
"max": 35699496.0,
"count": 142
},
"SearcherBrain.Step.sum": {
"value": 35699496.0,
"min": 31469776.0,
"max": 35699496.0,
"count": 142
},
"SearcherBrain.Policy.ExtrinsicValueEstimate.mean": {
"value": 39.6043586730957,
"min": 31.869272232055664,
"max": 43.079132080078125,
"count": 142
},
"SearcherBrain.Policy.ExtrinsicValueEstimate.sum": {
"value": 1980.218017578125,
"min": 547.5039672851562,
"max": 2153.95654296875,
"count": 142
},
"SearcherBrain.Environment.CumulativeReward.mean": {
"value": 176.0731446659565,
"min": 143.13208571255208,
"max": 184.8177523803711,
"count": 142
},
"SearcherBrain.Environment.CumulativeReward.sum": {
"value": 8803.657233297825,
"min": 2578.779571533203,
"max": 9240.887619018555,
"count": 142
},
"SearcherBrain.Policy.ExtrinsicReward.mean": {
"value": 176.0731446659565,
"min": 143.13208571255208,
"max": 184.8177523803711,
"count": 142
},
"SearcherBrain.Policy.ExtrinsicReward.sum": {
"value": 8803.657233297825,
"min": 2578.779571533203,
"max": 9240.887619018555,
"count": 142
},
"SearcherBrain.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 142
},
"SearcherBrain.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 142
},
"SearcherBrain.Losses.PolicyLoss.mean": {
"value": 0.11566888390354708,
"min": 0.09146672067137034,
"max": 0.12758717909406794,
"count": 36
},
"SearcherBrain.Losses.PolicyLoss.sum": {
"value": 0.11566888390354708,
"min": 0.09146672067137034,
"max": 0.12758717909406794,
"count": 36
},
"SearcherBrain.Losses.ValueLoss.mean": {
"value": 7.1742678271399605,
"min": 4.739377557237943,
"max": 9.185592528846529,
"count": 36
},
"SearcherBrain.Losses.ValueLoss.sum": {
"value": 7.1742678271399605,
"min": 4.739377557237943,
"max": 9.185592528846529,
"count": 36
},
"SearcherBrain.Policy.LearningRate.mean": {
"value": 0.00019317334760889595,
"min": 0.00019317334760889595,
"max": 0.000205273375575552,
"count": 36
},
"SearcherBrain.Policy.LearningRate.sum": {
"value": 0.00019317334760889595,
"min": 0.00019317334760889595,
"max": 0.000205273375575552,
"count": 36
},
"SearcherBrain.Policy.Epsilon.mean": {
"value": 0.16439110399999998,
"min": 0.16439110399999998,
"max": 0.16842444800000003,
"count": 36
},
"SearcherBrain.Policy.Epsilon.sum": {
"value": 0.16439110399999998,
"min": 0.16439110399999998,
"max": 0.16842444800000003,
"count": 36
},
"SearcherBrain.Policy.Beta.mean": {
"value": 0.0032231160896,
"min": 0.0032231160896,
"max": 0.0034243799552000007,
"count": 36
},
"SearcherBrain.Policy.Beta.sum": {
"value": 0.0032231160896,
"min": 0.0032231160896,
"max": 0.0034243799552000007,
"count": 36
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1744103183",
"python_version": "3.10.10 (tags/v3.10.10:aad5f6a, Feb 7 2023, 17:20:36) [MSC v.1929 64 bit (AMD64)]",
"command_line_arguments": "C:\\Users\\roque\\python-envs\\rl-env\\Scripts\\mlagents-learn ./config/solartracker_config_ppo.yaml --env=./envs/MultiSolarTrackerEnv --run-id=SolarTrackerPPO --resume",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.6.0+cpu",
"numpy_version": "1.23.5",
"end_time_seconds": "1744104712"
},
"total": 1529.1202356999984,
"count": 1,
"self": 0.28325869999753195,
"children": {
"run_training.setup": {
"total": 0.08089520000066841,
"count": 1,
"self": 0.08089520000066841
},
"TrainerController.start_learning": {
"total": 1528.7560818000002,
"count": 1,
"self": 0.44316530011201394,
"children": {
"TrainerController._reset_env": {
"total": 6.320846700000402,
"count": 1,
"self": 6.320846700000402
},
"TrainerController.advance": {
"total": 1521.9105026998895,
"count": 22237,
"self": 0.5204243999578466,
"children": {
"env_step": {
"total": 803.7725172000082,
"count": 22237,
"self": 744.6079042997972,
"children": {
"SubprocessEnvManager._take_step": {
"total": 58.866627000055814,
"count": 22237,
"self": 5.4749692000950745,
"children": {
"TorchPolicy.evaluate": {
"total": 53.39165779996074,
"count": 22208,
"self": 53.39165779996074
}
}
},
"workers": {
"total": 0.29798590015525406,
"count": 22237,
"self": 0.0,
"children": {
"worker_root": {
"total": 1503.534177499967,
"count": 22237,
"is_parallel": true,
"self": 905.5262203999082,
"children": {
"steps_from_proto": {
"total": 0.0027493000015965663,
"count": 1,
"is_parallel": true,
"self": 0.00037040000097476877,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0023789000006217975,
"count": 2,
"is_parallel": true,
"self": 0.0023789000006217975
}
}
},
"UnityEnvironment.step": {
"total": 598.0052078000572,
"count": 22237,
"is_parallel": true,
"self": 14.79916039969612,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 36.35460820003391,
"count": 22237,
"is_parallel": true,
"self": 36.35460820003391
},
"communicator.exchange": {
"total": 517.9183317000679,
"count": 22237,
"is_parallel": true,
"self": 517.9183317000679
},
"steps_from_proto": {
"total": 28.93310750025921,
"count": 22237,
"is_parallel": true,
"self": 6.41115339998214,
"children": {
"_process_rank_one_or_two_observation": {
"total": 22.52195410027707,
"count": 44474,
"is_parallel": true,
"self": 22.52195410027707
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 717.6175610999235,
"count": 22237,
"self": 1.1822864997302531,
"children": {
"process_trajectory": {
"total": 248.01313250019302,
"count": 22237,
"self": 247.27856620019702,
"children": {
"RLTrainer._checkpoint": {
"total": 0.7345662999960041,
"count": 9,
"self": 0.7345662999960041
}
}
},
"_update_policy": {
"total": 468.4221421000002,
"count": 37,
"self": 38.10555700000259,
"children": {
"TorchPPOOptimizer.update": {
"total": 430.3165850999976,
"count": 6660,
"self": 430.3165850999976
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.999995770864189e-07,
"count": 1,
"self": 8.999995770864189e-07
},
"TrainerController._save_models": {
"total": 0.08156619999863324,
"count": 1,
"self": 0.0017178999987663701,
"children": {
"RLTrainer._checkpoint": {
"total": 0.07984829999986687,
"count": 1,
"self": 0.07984829999986687
}
}
}
}
}
}
}