FredericProtat's picture
Second Push
a2d60b7
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.16728255152702332,
"min": 0.15525735914707184,
"max": 0.21002553403377533,
"count": 34
},
"Pyramids.Policy.Entropy.sum": {
"value": 5053.271484375,
"min": 1868.0673828125,
"max": 6280.603515625,
"count": 34
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 234.51181102362204,
"min": 212.17948717948718,
"max": 283.64761904761906,
"count": 34
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29783.0,
"min": 8275.0,
"max": 31880.0,
"count": 34
},
"Pyramids.Step.mean": {
"value": 2999883.0,
"min": 2009983.0,
"max": 2999883.0,
"count": 34
},
"Pyramids.Step.sum": {
"value": 2999883.0,
"min": 2009983.0,
"max": 2999883.0,
"count": 34
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.7479361891746521,
"min": 0.6622505784034729,
"max": 0.8450698852539062,
"count": 34
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 224.380859375,
"min": 73.65901184082031,
"max": 252.65277099609375,
"count": 34
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.005168822593986988,
"min": -0.012601537629961967,
"max": 0.01932157576084137,
"count": 34
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 1.5506467819213867,
"min": -3.742656707763672,
"max": 5.680543422698975,
"count": 34
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7497338478959452,
"min": 1.6608981324566736,
"max": 1.787820503497735,
"count": 34
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 222.21619868278503,
"min": 69.72499963641167,
"max": 244.80299776792526,
"count": 34
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7497338478959452,
"min": 1.6608981324566736,
"max": 1.787820503497735,
"count": 34
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 222.21619868278503,
"min": 69.72499963641167,
"max": 244.80299776792526,
"count": 34
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.01949155884766532,
"min": 0.019372238134383223,
"max": 0.028201485868443604,
"count": 34
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.4754279736534954,
"min": 0.8830385050969198,
"max": 3.0416997363208793,
"count": 34
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.07110694913851966,
"min": 0.06405901443975467,
"max": 0.07133843297612788,
"count": 34
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9954972879392753,
"min": 0.27638910769019276,
"max": 1.0520664500654675,
"count": 34
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.01526131886429302,
"min": 0.012369724602710143,
"max": 0.016298255188782248,
"count": 34
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.21365846410010228,
"min": 0.06191515453004589,
"max": 0.23520687879257218,
"count": 34
},
"Pyramids.Policy.LearningRate.mean": {
"value": 1.5590351946404768e-06,
"min": 1.5590351946404768e-06,
"max": 9.947719184095832e-05,
"count": 34
},
"Pyramids.Policy.LearningRate.sum": {
"value": 2.1826492724966673e-05,
"min": 2.1826492724966673e-05,
"max": 0.0014621597126137666,
"count": 34
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10051964523809527,
"min": 0.10051964523809527,
"max": 0.13315904166666664,
"count": 34
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4072750333333337,
"min": 0.5326361666666666,
"max": 1.9873862333333334,
"count": 34
},
"Pyramids.Policy.Beta.mean": {
"value": 6.191255928571431e-05,
"min": 6.191255928571431e-05,
"max": 0.0033225882625,
"count": 34
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0008667758300000004,
"min": 0.0008667758300000004,
"max": 0.048839884709999996,
"count": 34
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.008113382384181023,
"min": 0.007795785553753376,
"max": 0.010242822580039501,
"count": 34
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.11358735710382462,
"min": 0.040971290320158005,
"max": 0.14452455937862396,
"count": 34
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 34
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 34
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1693050399",
"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=PyramidsTraining --no-graphics --resume",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1693053095"
},
"total": 2695.543802821001,
"count": 1,
"self": 1.1324325500017949,
"children": {
"run_training.setup": {
"total": 0.040259501000036835,
"count": 1,
"self": 0.040259501000036835
},
"TrainerController.start_learning": {
"total": 2694.371110769999,
"count": 1,
"self": 1.6563902417110512,
"children": {
"TrainerController._reset_env": {
"total": 5.44096331899982,
"count": 1,
"self": 5.44096331899982
},
"TrainerController.advance": {
"total": 2687.100431038287,
"count": 65705,
"self": 1.5864545440545044,
"children": {
"env_step": {
"total": 2001.4026687082624,
"count": 65705,
"self": 1886.4337987335402,
"children": {
"SubprocessEnvManager._take_step": {
"total": 114.04875525803072,
"count": 65705,
"self": 4.902434129653557,
"children": {
"TorchPolicy.evaluate": {
"total": 109.14632112837717,
"count": 62569,
"self": 109.14632112837717
}
}
},
"workers": {
"total": 0.920114716691387,
"count": 65705,
"self": 0.0,
"children": {
"worker_root": {
"total": 2687.969531494088,
"count": 65705,
"is_parallel": true,
"self": 926.9245235840926,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0019770689996221336,
"count": 1,
"is_parallel": true,
"self": 0.0006251910008359118,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013518779987862217,
"count": 8,
"is_parallel": true,
"self": 0.0013518779987862217
}
}
},
"UnityEnvironment.step": {
"total": 0.08333673800007091,
"count": 1,
"is_parallel": true,
"self": 0.0005924659999436699,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00046607700005552033,
"count": 1,
"is_parallel": true,
"self": 0.00046607700005552033
},
"communicator.exchange": {
"total": 0.07168196800012083,
"count": 1,
"is_parallel": true,
"self": 0.07168196800012083
},
"steps_from_proto": {
"total": 0.010596226999950886,
"count": 1,
"is_parallel": true,
"self": 0.009075192998352577,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0015210340015983093,
"count": 8,
"is_parallel": true,
"self": 0.0015210340015983093
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1761.0450079099955,
"count": 65704,
"is_parallel": true,
"self": 34.77587164081251,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 23.156331481118286,
"count": 65704,
"is_parallel": true,
"self": 23.156331481118286
},
"communicator.exchange": {
"total": 1592.8627225269947,
"count": 65704,
"is_parallel": true,
"self": 1592.8627225269947
},
"steps_from_proto": {
"total": 110.25008226107002,
"count": 65704,
"is_parallel": true,
"self": 22.365261638236916,
"children": {
"_process_rank_one_or_two_observation": {
"total": 87.8848206228331,
"count": 525632,
"is_parallel": true,
"self": 87.8848206228331
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 684.11130778597,
"count": 65705,
"self": 3.081327651087122,
"children": {
"process_trajectory": {
"total": 120.54025942088992,
"count": 65705,
"self": 120.27275603989074,
"children": {
"RLTrainer._checkpoint": {
"total": 0.26750338099918736,
"count": 2,
"self": 0.26750338099918736
}
}
},
"_update_policy": {
"total": 560.4897207139929,
"count": 473,
"self": 366.8761716950967,
"children": {
"TorchPPOOptimizer.update": {
"total": 193.61354901889626,
"count": 22752,
"self": 193.61354901889626
}
}
}
}
}
}
},
"trainer_threads": {
"total": 2.3588001567986794e-05,
"count": 1,
"self": 2.3588001567986794e-05
},
"TrainerController._save_models": {
"total": 0.1733025829998951,
"count": 1,
"self": 0.0039729189993522596,
"children": {
"RLTrainer._checkpoint": {
"total": 0.16932966400054283,
"count": 1,
"self": 0.16932966400054283
}
}
}
}
}
}
}