ppo-pyramids / run_logs /timers.json
MartinVanBuren's picture
First commit, default config
9a16608 verified
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.3393213450908661,
"min": 0.3314994275569916,
"max": 1.379373550415039,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 10049.3408203125,
"min": 10008.630859375,
"max": 39019.71875,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989933.0,
"min": 29952.0,
"max": 989933.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989933.0,
"min": 29952.0,
"max": 989933.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.6254141330718994,
"min": -0.08404293656349182,
"max": 0.6912244558334351,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 180.74468994140625,
"min": -20.338390350341797,
"max": 203.21998596191406,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.02734558656811714,
"min": -0.02242613397538662,
"max": 0.4648740589618683,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 7.90287446975708,
"min": -5.9877777099609375,
"max": 102.73716735839844,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06841825248838398,
"min": 0.06641222656305348,
"max": 0.07352544943484582,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9578555348373757,
"min": 0.4401610603170662,
"max": 1.0786804384260904,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.016256701561533624,
"min": 0.002270949388138241,
"max": 0.016508740748880278,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.22759382186147073,
"min": 0.022709493881382412,
"max": 0.2318545042265517,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.4898546462714276e-06,
"min": 7.4898546462714276e-06,
"max": 0.00029514240161919995,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00010485796504779999,
"min": 0.00010485796504779999,
"max": 0.0035089250303584,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10249658571428573,
"min": 0.10249658571428573,
"max": 0.19838080000000002,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4349522000000001,
"min": 1.1902848000000001,
"max": 2.5696416,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.0002594089128571429,
"min": 0.0002594089128571429,
"max": 0.009838241919999999,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.00363172478,
"min": 0.00363172478,
"max": 0.11698719584000002,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.01445481926202774,
"min": 0.01445481926202774,
"max": 0.5669408440589905,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.20236746966838837,
"min": 0.20236746966838837,
"max": 3.4016449451446533,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 285.0857142857143,
"min": 273.0093457943925,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29934.0,
"min": 15984.0,
"max": 33015.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.697030171470822,
"min": -1.0000000521540642,
"max": 1.7269906436450013,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 179.88519817590714,
"min": -30.24240168184042,
"max": 184.78799887001514,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.697030171470822,
"min": -1.0000000521540642,
"max": 1.7269906436450013,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 179.88519817590714,
"min": -30.24240168184042,
"max": 184.78799887001514,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.04323365747651858,
"min": 0.04323365747651858,
"max": 11.171785168349743,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 4.58276769251097,
"min": 4.501126918883529,
"max": 178.7485626935959,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1727570619",
"python_version": "3.10.12 (main, Sep 11 2024, 15:47:36) [GCC 11.4.0]",
"command_line_arguments": "venv/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids1 --no-graphics --resume",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.4.1+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1727572792"
},
"total": 2173.1502576000003,
"count": 1,
"self": 0.4818422999996983,
"children": {
"run_training.setup": {
"total": 0.01389500000004773,
"count": 1,
"self": 0.01389500000004773
},
"TrainerController.start_learning": {
"total": 2172.6545203000005,
"count": 1,
"self": 1.5007186000343609,
"children": {
"TrainerController._reset_env": {
"total": 1.388296800000262,
"count": 1,
"self": 1.388296800000262
},
"TrainerController.advance": {
"total": 2169.6940161999664,
"count": 64084,
"self": 1.4004572000094413,
"children": {
"env_step": {
"total": 1451.9032732999935,
"count": 64084,
"self": 1339.2555544999796,
"children": {
"SubprocessEnvManager._take_step": {
"total": 111.717396799972,
"count": 64084,
"self": 4.25997569997935,
"children": {
"TorchPolicy.evaluate": {
"total": 107.45742109999264,
"count": 62432,
"self": 107.45742109999264
}
}
},
"workers": {
"total": 0.9303220000419969,
"count": 64084,
"self": 0.0,
"children": {
"worker_root": {
"total": 2169.356929600043,
"count": 64084,
"is_parallel": true,
"self": 931.6386182001056,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0019157000001541746,
"count": 1,
"is_parallel": true,
"self": 0.0005667000004905276,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001348999999663647,
"count": 8,
"is_parallel": true,
"self": 0.001348999999663647
}
}
},
"UnityEnvironment.step": {
"total": 0.03984710000031555,
"count": 1,
"is_parallel": true,
"self": 0.0002482999998392188,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00021070000002509914,
"count": 1,
"is_parallel": true,
"self": 0.00021070000002509914
},
"communicator.exchange": {
"total": 0.03852080000024216,
"count": 1,
"is_parallel": true,
"self": 0.03852080000024216
},
"steps_from_proto": {
"total": 0.0008673000002090703,
"count": 1,
"is_parallel": true,
"self": 0.00026889999890045146,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0005984000013086188,
"count": 8,
"is_parallel": true,
"self": 0.0005984000013086188
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1237.7183113999372,
"count": 64083,
"is_parallel": true,
"self": 17.496068099939748,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 17.851628199996867,
"count": 64083,
"is_parallel": true,
"self": 17.851628199996867
},
"communicator.exchange": {
"total": 1148.1017410999953,
"count": 64083,
"is_parallel": true,
"self": 1148.1017410999953
},
"steps_from_proto": {
"total": 54.268874000005326,
"count": 64083,
"is_parallel": true,
"self": 14.00552580009753,
"children": {
"_process_rank_one_or_two_observation": {
"total": 40.263348199907796,
"count": 512664,
"is_parallel": true,
"self": 40.263348199907796
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 716.3902856999634,
"count": 64084,
"self": 3.2933098999124013,
"children": {
"process_trajectory": {
"total": 98.82236180005157,
"count": 64084,
"self": 98.51106890005167,
"children": {
"RLTrainer._checkpoint": {
"total": 0.3112928999998985,
"count": 2,
"self": 0.3112928999998985
}
}
},
"_update_policy": {
"total": 614.2746139999995,
"count": 454,
"self": 229.39425380004286,
"children": {
"TorchPPOOptimizer.update": {
"total": 384.8803601999566,
"count": 22755,
"self": 384.8803601999566
}
}
}
}
}
}
},
"trainer_threads": {
"total": 7.999997251317836e-07,
"count": 1,
"self": 7.999997251317836e-07
},
"TrainerController._save_models": {
"total": 0.07148789999973815,
"count": 1,
"self": 0.009067400000276393,
"children": {
"RLTrainer._checkpoint": {
"total": 0.062420499999461754,
"count": 1,
"self": 0.062420499999461754
}
}
}
}
}
}
}