ppo-Pyramids / run_logs /timers.json
mmichiels13's picture
First Push
469616c verified
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.33215370774269104,
"min": 0.32744649052619934,
"max": 1.3892465829849243,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 9932.724609375,
"min": 9833.873046875,
"max": 42144.18359375,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989953.0,
"min": 29939.0,
"max": 989953.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989953.0,
"min": 29939.0,
"max": 989953.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.5937961339950562,
"min": -0.11402159184217453,
"max": 0.6218114495277405,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 164.48153686523438,
"min": -27.593225479125977,
"max": 180.7646942138672,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": -0.012516348622739315,
"min": -0.012516348622739315,
"max": 0.2709921598434448,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": -3.4670286178588867,
"min": -3.4670286178588867,
"max": 64.22514343261719,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06869396578350316,
"min": 0.06459258985151314,
"max": 0.07344745011081477,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9617155209690443,
"min": 0.4829088080640623,
"max": 1.073747740963168,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.016333643093731916,
"min": 0.000436349039498401,
"max": 0.01675893164929348,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.22867100331224682,
"min": 0.005672537513479213,
"max": 0.24195401150192244,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.352561834892862e-06,
"min": 7.352561834892862e-06,
"max": 0.00029515063018788575,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00010293586568850007,
"min": 0.00010293586568850007,
"max": 0.0036338635887122,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10245082142857144,
"min": 0.10245082142857144,
"max": 0.19838354285714285,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4343115000000002,
"min": 1.3886848,
"max": 2.6112878000000004,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00025483706071428587,
"min": 0.00025483706071428587,
"max": 0.00983851593142857,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.003567718850000002,
"min": 0.003567718850000002,
"max": 0.12114765121999999,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.01031650323420763,
"min": 0.01031650323420763,
"max": 0.505388617515564,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.14443103969097137,
"min": 0.14443103969097137,
"max": 3.537720203399658,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 318.67045454545456,
"min": 311.1595744680851,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 28043.0,
"min": 16866.0,
"max": 32555.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.6589677935016567,
"min": -0.9997933854659399,
"max": 1.6675616807125984,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 144.33019803464413,
"min": -29.993801563978195,
"max": 163.84699787199497,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.6589677935016567,
"min": -0.9997933854659399,
"max": 1.6675616807125984,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 144.33019803464413,
"min": -29.993801563978195,
"max": 163.84699787199497,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.03371351445913342,
"min": 0.03371351445913342,
"max": 10.180521801990622,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.933075757944607,
"min": 2.933075757944607,
"max": 173.06887063384056,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1767328587",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.8.0+cu128",
"numpy_version": "1.23.5",
"end_time_seconds": "1767330780"
},
"total": 2192.7339807959997,
"count": 1,
"self": 0.4831833419993927,
"children": {
"run_training.setup": {
"total": 0.030265897999925073,
"count": 1,
"self": 0.030265897999925073
},
"TrainerController.start_learning": {
"total": 2192.2205315560004,
"count": 1,
"self": 1.305473461992733,
"children": {
"TrainerController._reset_env": {
"total": 2.8169025019997207,
"count": 1,
"self": 2.8169025019997207
},
"TrainerController.advance": {
"total": 2188.021086805009,
"count": 64008,
"self": 1.344332832382861,
"children": {
"env_step": {
"total": 1544.5402321089496,
"count": 64008,
"self": 1399.1370038446803,
"children": {
"SubprocessEnvManager._take_step": {
"total": 144.5966223262658,
"count": 64008,
"self": 4.532296451163347,
"children": {
"TorchPolicy.evaluate": {
"total": 140.06432587510244,
"count": 62547,
"self": 140.06432587510244
}
}
},
"workers": {
"total": 0.8066059380034858,
"count": 64008,
"self": 0.0,
"children": {
"worker_root": {
"total": 2185.762246034932,
"count": 64008,
"is_parallel": true,
"self": 899.4077341828397,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0025492999993730336,
"count": 1,
"is_parallel": true,
"self": 0.00076713799717254,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0017821620022004936,
"count": 8,
"is_parallel": true,
"self": 0.0017821620022004936
}
}
},
"UnityEnvironment.step": {
"total": 0.06180092899921874,
"count": 1,
"is_parallel": true,
"self": 0.0015726219990028767,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004742460005218163,
"count": 1,
"is_parallel": true,
"self": 0.0004742460005218163
},
"communicator.exchange": {
"total": 0.057037986000068486,
"count": 1,
"is_parallel": true,
"self": 0.057037986000068486
},
"steps_from_proto": {
"total": 0.0027160749996255618,
"count": 1,
"is_parallel": true,
"self": 0.00034630899972398765,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.002369765999901574,
"count": 8,
"is_parallel": true,
"self": 0.002369765999901574
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1286.3545118520924,
"count": 64007,
"is_parallel": true,
"self": 32.66002140382807,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 22.41888816665596,
"count": 64007,
"is_parallel": true,
"self": 22.41888816665596
},
"communicator.exchange": {
"total": 1127.1192455026085,
"count": 64007,
"is_parallel": true,
"self": 1127.1192455026085
},
"steps_from_proto": {
"total": 104.1563567789999,
"count": 64007,
"is_parallel": true,
"self": 22.140710835261416,
"children": {
"_process_rank_one_or_two_observation": {
"total": 82.01564594373849,
"count": 512056,
"is_parallel": true,
"self": 82.01564594373849
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 642.1365218636765,
"count": 64008,
"self": 2.5777785456539277,
"children": {
"process_trajectory": {
"total": 121.43874129000687,
"count": 64008,
"self": 121.24616865700591,
"children": {
"RLTrainer._checkpoint": {
"total": 0.19257263300096383,
"count": 2,
"self": 0.19257263300096383
}
}
},
"_update_policy": {
"total": 518.1200020280157,
"count": 456,
"self": 287.8494104679867,
"children": {
"TorchPPOOptimizer.update": {
"total": 230.27059156002906,
"count": 22842,
"self": 230.27059156002906
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.929990483215079e-07,
"count": 1,
"self": 9.929990483215079e-07
},
"TrainerController._save_models": {
"total": 0.07706779399995867,
"count": 1,
"self": 0.0010116329995071283,
"children": {
"RLTrainer._checkpoint": {
"total": 0.07605616100045154,
"count": 1,
"self": 0.07605616100045154
}
}
}
}
}
}
}