ppo-Pyramids / run_logs /timers.json
Jackman4399's picture
First Commit
0ce6c92 verified
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.1447216421365738,
"min": 0.13826455175876617,
"max": 1.4020991325378418,
"count": 100
},
"Pyramids.Policy.Entropy.sum": {
"value": 4311.54736328125,
"min": 4110.32861328125,
"max": 42534.078125,
"count": 100
},
"Pyramids.Step.mean": {
"value": 2999906.0,
"min": 29952.0,
"max": 2999906.0,
"count": 100
},
"Pyramids.Step.sum": {
"value": 2999906.0,
"min": 29952.0,
"max": 2999906.0,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.8354078531265259,
"min": -0.0898745059967041,
"max": 0.8648101091384888,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 253.9639892578125,
"min": -21.65975570678711,
"max": 264.8953857421875,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": -0.0005675681750290096,
"min": -0.035647984594106674,
"max": 0.46989473700523376,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": -0.17254072427749634,
"min": -10.765690803527832,
"max": 111.36505126953125,
"count": 100
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06839243630834278,
"min": 0.0642259741154822,
"max": 0.07358057845950634,
"count": 100
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.957494108316799,
"min": 0.5010699693236671,
"max": 1.0933743211207911,
"count": 100
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.016001959951522406,
"min": 0.00025777547377551656,
"max": 0.016716235349858402,
"count": 100
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.22402743932131366,
"min": 0.003608856632857232,
"max": 0.2459002963550316,
"count": 100
},
"Pyramids.Policy.LearningRate.mean": {
"value": 1.4866280759190479e-06,
"min": 1.4866280759190479e-06,
"max": 0.00029838354339596195,
"count": 100
},
"Pyramids.Policy.LearningRate.sum": {
"value": 2.081279306286667e-05,
"min": 2.081279306286667e-05,
"max": 0.0039273246908918,
"count": 100
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10049550952380955,
"min": 0.10049550952380955,
"max": 0.19946118095238097,
"count": 100
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4069371333333336,
"min": 1.3962282666666668,
"max": 2.7674318,
"count": 100
},
"Pyramids.Policy.Beta.mean": {
"value": 5.950140142857143e-05,
"min": 5.950140142857143e-05,
"max": 0.009946171977142856,
"count": 100
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0008330196200000001,
"min": 0.0008330196200000001,
"max": 0.13091990918000002,
"count": 100
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.007116465829312801,
"min": 0.006912874523550272,
"max": 0.6042035222053528,
"count": 100
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.09963051974773407,
"min": 0.09678024053573608,
"max": 4.229424476623535,
"count": 100
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 201.31724137931033,
"min": 201.31724137931033,
"max": 999.0,
"count": 100
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29191.0,
"min": 15984.0,
"max": 33183.0,
"count": 100
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7986827498879927,
"min": -1.0000000521540642,
"max": 1.7986827498879927,
"count": 100
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 260.8089987337589,
"min": -31.998801663517952,
"max": 264.99019791185856,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7986827498879927,
"min": -1.0000000521540642,
"max": 1.7986827498879927,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 260.8089987337589,
"min": -31.998801663517952,
"max": 264.99019791185856,
"count": 100
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.014916455586127744,
"min": 0.01485513350705366,
"max": 12.990806862711906,
"count": 100
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.162886059988523,
"min": 2.0054430234522442,
"max": 207.8529098033905,
"count": 100
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1705861383",
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.1.2+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1705868597"
},
"total": 7214.083407328002,
"count": 1,
"self": 0.4380659300022671,
"children": {
"run_training.setup": {
"total": 0.05346922899843776,
"count": 1,
"self": 0.05346922899843776
},
"TrainerController.start_learning": {
"total": 7213.591872169001,
"count": 1,
"self": 4.133439108494713,
"children": {
"TrainerController._reset_env": {
"total": 1.945490416001121,
"count": 1,
"self": 1.945490416001121
},
"TrainerController.advance": {
"total": 7207.428359766509,
"count": 194806,
"self": 4.374350660815253,
"children": {
"env_step": {
"total": 5307.503929227729,
"count": 194806,
"self": 4916.2963640494945,
"children": {
"SubprocessEnvManager._take_step": {
"total": 388.60030352147623,
"count": 194806,
"self": 14.44554687132404,
"children": {
"TorchPolicy.evaluate": {
"total": 374.1547566501522,
"count": 187553,
"self": 374.1547566501522
}
}
},
"workers": {
"total": 2.6072616567580553,
"count": 194806,
"self": 0.0,
"children": {
"worker_root": {
"total": 7198.002033440398,
"count": 194806,
"is_parallel": true,
"self": 2652.01298088737,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0016610250004305271,
"count": 1,
"is_parallel": true,
"self": 0.0005324970006768126,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011285279997537145,
"count": 8,
"is_parallel": true,
"self": 0.0011285279997537145
}
}
},
"UnityEnvironment.step": {
"total": 0.050383321999106556,
"count": 1,
"is_parallel": true,
"self": 0.0006207539972820086,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0005093529998703161,
"count": 1,
"is_parallel": true,
"self": 0.0005093529998703161
},
"communicator.exchange": {
"total": 0.04745358100080921,
"count": 1,
"is_parallel": true,
"self": 0.04745358100080921
},
"steps_from_proto": {
"total": 0.001799634001145023,
"count": 1,
"is_parallel": true,
"self": 0.0003732880013558315,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014263459997891914,
"count": 8,
"is_parallel": true,
"self": 0.0014263459997891914
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 4545.989052553028,
"count": 194805,
"is_parallel": true,
"self": 106.6345271078826,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 77.94749165817848,
"count": 194805,
"is_parallel": true,
"self": 77.94749165817848
},
"communicator.exchange": {
"total": 4051.6340534070277,
"count": 194805,
"is_parallel": true,
"self": 4051.6340534070277
},
"steps_from_proto": {
"total": 309.7729803799393,
"count": 194805,
"is_parallel": true,
"self": 63.342609213239484,
"children": {
"_process_rank_one_or_two_observation": {
"total": 246.43037116669984,
"count": 1558440,
"is_parallel": true,
"self": 246.43037116669984
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1895.550079877965,
"count": 194806,
"self": 8.632492726152122,
"children": {
"process_trajectory": {
"total": 395.10480879086754,
"count": 194806,
"self": 394.5252831978669,
"children": {
"RLTrainer._checkpoint": {
"total": 0.5795255930006533,
"count": 6,
"self": 0.5795255930006533
}
}
},
"_update_policy": {
"total": 1491.8127783609452,
"count": 1394,
"self": 888.6532884770731,
"children": {
"TorchPPOOptimizer.update": {
"total": 603.1594898838721,
"count": 68406,
"self": 603.1594898838721
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.819988579489291e-07,
"count": 1,
"self": 8.819988579489291e-07
},
"TrainerController._save_models": {
"total": 0.08458199599772342,
"count": 1,
"self": 0.001658498997130664,
"children": {
"RLTrainer._checkpoint": {
"total": 0.08292349700059276,
"count": 1,
"self": 0.08292349700059276
}
}
}
}
}
}
}