| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.5697529315948486, | |
| "min": 0.5697529315948486, | |
| "max": 1.4282350540161133, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 17083.47265625, | |
| "min": 17083.47265625, | |
| "max": 43326.9375, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 989958.0, | |
| "min": 29952.0, | |
| "max": 989958.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 989958.0, | |
| "min": 29952.0, | |
| "max": 989958.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.027781447395682335, | |
| "min": -0.1567494124174118, | |
| "max": 0.10649461299180984, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 6.806454658508301, | |
| "min": -37.14961242675781, | |
| "max": 26.410663604736328, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": -0.09998150169849396, | |
| "min": -0.10298889875411987, | |
| "max": 0.6416728496551514, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": -24.495468139648438, | |
| "min": -25.54124641418457, | |
| "max": 152.0764617919922, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06580670452386897, | |
| "min": 0.06420853877676838, | |
| "max": 0.07175141374133338, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9212938633341656, | |
| "min": 0.48710751419233944, | |
| "max": 1.0241472059318695, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.01111924657790533, | |
| "min": 0.0004095529458446011, | |
| "max": 0.014578841951562237, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.15566945209067462, | |
| "min": 0.005324188295979814, | |
| "max": 0.20122647359237497, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 7.454518943764286e-06, | |
| "min": 7.454518943764286e-06, | |
| "max": 0.00029515063018788575, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.0001043632652127, | |
| "min": 0.0001043632652127, | |
| "max": 0.0035073866308712003, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10248480714285713, | |
| "min": 0.10248480714285713, | |
| "max": 0.19838354285714285, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4347872999999998, | |
| "min": 1.3886848, | |
| "max": 2.5691288000000005, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0002582322335714286, | |
| "min": 0.0002582322335714286, | |
| "max": 0.00983851593142857, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0036152512700000005, | |
| "min": 0.0036152512700000005, | |
| "max": 0.11693596712000001, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.017260180786252022, | |
| "min": 0.01671287976205349, | |
| "max": 0.701418399810791, | |
| "count": 33 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.2416425347328186, | |
| "min": 0.23398031294345856, | |
| "max": 4.909928798675537, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 786.2162162162163, | |
| "min": 745.8947368421053, | |
| "max": 999.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29090.0, | |
| "min": 15984.0, | |
| "max": 33200.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 0.04995785339882499, | |
| "min": -1.0000000521540642, | |
| "max": 0.3417729368886432, | |
| "count": 33 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 1.8983984291553497, | |
| "min": -30.993601590394974, | |
| "max": 12.645598664879799, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 0.04995785339882499, | |
| "min": -1.0000000521540642, | |
| "max": 0.3417729368886432, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 1.8983984291553497, | |
| "min": -30.993601590394974, | |
| "max": 12.645598664879799, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.14105907934687198, | |
| "min": 0.1294292282388621, | |
| "max": 13.87622656673193, | |
| "count": 33 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 5.360245015181135, | |
| "min": 4.788881444837898, | |
| "max": 222.01962506771088, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 33 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1769141633", | |
| "python_version": "3.8.20 (default, Sep 7 2024, 18:35:08) \n[GCC 11.4.0]", | |
| "command_line_arguments": "/home/cfmy/rl/deep-rl-class-zh/.venv38/bin/mlagents-learn --force ./ml-agents/config/ppo/PyramidsRND.yaml --env=./trained-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids_Training --no-graphics", | |
| "mlagents_version": "0.29.0.dev0", | |
| "mlagents_envs_version": "0.29.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "1.8.1+cu102", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1769143283" | |
| }, | |
| "total": 1649.3432424259954, | |
| "count": 1, | |
| "self": 0.5271806520031532, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.023424899991368875, | |
| "count": 1, | |
| "self": 0.023424899991368875 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 1648.792636874001, | |
| "count": 1, | |
| "self": 1.3130523440631805, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.4656410420138855, | |
| "count": 1, | |
| "self": 2.4656410420138855 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 1644.9661176809168, | |
| "count": 63242, | |
| "self": 1.279258410053444, | |
| "children": { | |
| "env_step": { | |
| "total": 1170.0897326112463, | |
| "count": 63242, | |
| "self": 1097.9548885850818, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 71.33310817070014, | |
| "count": 63242, | |
| "self": 3.0629787500802195, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 68.27012942061992, | |
| "count": 62566, | |
| "self": 14.928763125877595, | |
| "children": { | |
| "TorchPolicy.sample_actions": { | |
| "total": 53.34136629474233, | |
| "count": 62566, | |
| "self": 53.34136629474233 | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.8017358554643579, | |
| "count": 63242, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 1645.669839021968, | |
| "count": 63242, | |
| "is_parallel": true, | |
| "self": 628.1513156488363, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0018416250095469877, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006031470111338422, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012384779984131455, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012384779984131455 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.03076878099818714, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00022137799533084035, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0003743050037883222, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003743050037883222 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.029574961998150684, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.029574961998150684 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0005981360009172931, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00016027498350013047, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.00043786101741716266, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.00043786101741716266 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1017.5185233731318, | |
| "count": 63241, | |
| "is_parallel": true, | |
| "self": 14.65468421546393, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 9.33519983770384, | |
| "count": 63241, | |
| "is_parallel": true, | |
| "self": 9.33519983770384 | |
| }, | |
| "communicator.exchange": { | |
| "total": 955.8037445731752, | |
| "count": 63241, | |
| "is_parallel": true, | |
| "self": 955.8037445731752 | |
| }, | |
| "steps_from_proto": { | |
| "total": 37.72489474678878, | |
| "count": 63241, | |
| "is_parallel": true, | |
| "self": 10.440495088492753, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 27.284399658296024, | |
| "count": 505928, | |
| "is_parallel": true, | |
| "self": 27.284399658296024 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 473.59712665961706, | |
| "count": 63242, | |
| "self": 2.243827484344365, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 91.52122798137134, | |
| "count": 63242, | |
| "self": 91.40228566036967, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.11894232100166846, | |
| "count": 2, | |
| "self": 0.11894232100166846 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 379.83207119390136, | |
| "count": 447, | |
| "self": 110.84842566719453, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 268.9836455267068, | |
| "count": 22779, | |
| "self": 268.9836455267068 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 6.990012479946017e-07, | |
| "count": 1, | |
| "self": 6.990012479946017e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.04782510800578166, | |
| "count": 1, | |
| "self": 0.0008432119939243421, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.046981896011857316, | |
| "count": 1, | |
| "self": 0.046981896011857316 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |