| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.18455518782138824, | |
| "min": 0.1723124235868454, | |
| "max": 1.4637889862060547, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 5586.8544921875, | |
| "min": 5155.587890625, | |
| "max": 44405.50390625, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 2999992.0, | |
| "min": 29952.0, | |
| "max": 2999992.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 2999992.0, | |
| "min": 29952.0, | |
| "max": 2999992.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.7142572402954102, | |
| "min": -0.19251509010791779, | |
| "max": 0.7864418625831604, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 213.5629119873047, | |
| "min": -45.626075744628906, | |
| "max": 230.42745971679688, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.007587899453938007, | |
| "min": -0.022064711898565292, | |
| "max": 0.29288187623023987, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 2.268781900405884, | |
| "min": -5.935407638549805, | |
| "max": 70.87741088867188, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06870236093511332, | |
| "min": 0.06492414296302568, | |
| "max": 0.07379775105662355, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9618330530915866, | |
| "min": 0.5161230830956068, | |
| "max": 1.100909610608748, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.0156872090212616, | |
| "min": 0.0003961381215027364, | |
| "max": 0.016854510903829664, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.2196209262976624, | |
| "min": 0.005545933701038309, | |
| "max": 0.24974252536291408, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 1.5847851860571435e-06, | |
| "min": 1.5847851860571435e-06, | |
| "max": 0.00029838354339596195, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 2.2186992604800008e-05, | |
| "min": 2.2186992604800008e-05, | |
| "max": 0.0038435695188101995, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10052822857142858, | |
| "min": 0.10052822857142858, | |
| "max": 0.19946118095238097, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4073952, | |
| "min": 1.3962282666666668, | |
| "max": 2.7225395333333333, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 6.27700342857143e-05, | |
| "min": 6.27700342857143e-05, | |
| "max": 0.009946171977142856, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0008787804800000003, | |
| "min": 0.0008787804800000003, | |
| "max": 0.12813086102000001, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.006940221879631281, | |
| "min": 0.006549749057739973, | |
| "max": 0.48526662588119507, | |
| "count": 100 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.09716310352087021, | |
| "min": 0.09169648587703705, | |
| "max": 3.3968663215637207, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 234.1875, | |
| "min": 229.37007874015748, | |
| "max": 999.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 29976.0, | |
| "min": 15984.0, | |
| "max": 33084.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.7658124904846773, | |
| "min": -1.0000000521540642, | |
| "max": 1.7658124904846773, | |
| "count": 100 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 226.0239987820387, | |
| "min": -31.998401671648026, | |
| "max": 226.0239987820387, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.7658124904846773, | |
| "min": -1.0000000521540642, | |
| "max": 1.7658124904846773, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 226.0239987820387, | |
| "min": -31.998401671648026, | |
| "max": 226.0239987820387, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.017038425120290412, | |
| "min": 0.016417352189890825, | |
| "max": 9.023397007025778, | |
| "count": 100 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 2.180918415397173, | |
| "min": 1.9111183179775253, | |
| "max": 144.37435211241245, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 100 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1743658307", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/home/jichuanh/miniconda3/envs/rl-3.10.12/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.6.0+cu124", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1743664658" | |
| }, | |
| "total": 6351.261859285063, | |
| "count": 1, | |
| "self": 0.32121283293236047, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.02177169208880514, | |
| "count": 1, | |
| "self": 0.02177169208880514 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 6350.918874760042, | |
| "count": 1, | |
| "self": 3.5374433528631926, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 1.6831322179641575, | |
| "count": 1, | |
| "self": 1.6831322179641575 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 6345.613099310198, | |
| "count": 194177, | |
| "self": 3.1432087251450866, | |
| "children": { | |
| "env_step": { | |
| "total": 4450.582966240705, | |
| "count": 194177, | |
| "self": 4099.023449446424, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 349.4796111759497, | |
| "count": 194177, | |
| "self": 10.215328793041408, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 339.2642823829083, | |
| "count": 187559, | |
| "self": 339.2642823829083 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 2.079905618331395, | |
| "count": 194177, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 6342.9303860571235, | |
| "count": 194177, | |
| "is_parallel": true, | |
| "self": 2558.890832758858, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0012643409427255392, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00037214194890111685, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0008921989938244224, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0008921989938244224 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.05491540802177042, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0006107420194894075, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0005876090144738555, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005876090144738555 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.051999189890921116, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.051999189890921116 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0017178670968860388, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003785090520977974, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013393580447882414, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013393580447882414 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 3784.0395532982657, | |
| "count": 194176, | |
| "is_parallel": true, | |
| "self": 110.62808475561906, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 75.90329294558614, | |
| "count": 194176, | |
| "is_parallel": true, | |
| "self": 75.90329294558614 | |
| }, | |
| "communicator.exchange": { | |
| "total": 3279.898296020343, | |
| "count": 194176, | |
| "is_parallel": true, | |
| "self": 3279.898296020343 | |
| }, | |
| "steps_from_proto": { | |
| "total": 317.6098795767175, | |
| "count": 194176, | |
| "is_parallel": true, | |
| "self": 67.21519750030711, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 250.3946820764104, | |
| "count": 1553408, | |
| "is_parallel": true, | |
| "self": 250.3946820764104 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 1891.8869243443478, | |
| "count": 194177, | |
| "self": 7.538049260387197, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 314.02709195623174, | |
| "count": 194177, | |
| "self": 313.491454832023, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.5356371242087334, | |
| "count": 6, | |
| "self": 0.5356371242087334 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 1570.3217831277288, | |
| "count": 1394, | |
| "self": 775.8074594498612, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 794.5143236778677, | |
| "count": 68307, | |
| "self": 794.5143236778677 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 6.939517334103584e-07, | |
| "count": 1, | |
| "self": 6.939517334103584e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.0851991850649938, | |
| "count": 1, | |
| "self": 0.000828032149001956, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.08437115291599184, | |
| "count": 1, | |
| "self": 0.08437115291599184 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |