mgmeskill's picture
First push
10bdb42
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.1732717901468277,
"min": 0.16883191466331482,
"max": 1.4750075340270996,
"count": 100
},
"Pyramids.Policy.Entropy.sum": {
"value": 5167.65771484375,
"min": 5016.333984375,
"max": 44745.828125,
"count": 100
},
"Pyramids.Step.mean": {
"value": 2999998.0,
"min": 29944.0,
"max": 2999998.0,
"count": 100
},
"Pyramids.Step.sum": {
"value": 2999998.0,
"min": 29944.0,
"max": 2999998.0,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.8625621795654297,
"min": -0.10248949378728867,
"max": 0.8698307275772095,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 271.70709228515625,
"min": -24.59747886657715,
"max": 271.70709228515625,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.004970206879079342,
"min": -0.02576282247900963,
"max": 0.41658225655555725,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 1.565615177154541,
"min": -7.213590145111084,
"max": 98.72999572753906,
"count": 100
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06808245780948531,
"min": 0.0638794918890331,
"max": 0.07363917369657837,
"count": 100
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9531544093327943,
"min": 0.4957619199670461,
"max": 1.0592665975181814,
"count": 100
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.01619220309490853,
"min": 5.462268124734433e-05,
"max": 0.018284210662213373,
"count": 100
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.22669084332871944,
"min": 0.0007100948562154763,
"max": 0.25597894927098724,
"count": 100
},
"Pyramids.Policy.LearningRate.mean": {
"value": 1.5276709193809485e-06,
"min": 1.5276709193809485e-06,
"max": 0.0002984110862439238,
"count": 100
},
"Pyramids.Policy.LearningRate.sum": {
"value": 2.138739287133328e-05,
"min": 2.138739287133328e-05,
"max": 0.0037592103469299325,
"count": 100
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10050919047619046,
"min": 0.10050919047619046,
"max": 0.19947036190476192,
"count": 100
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4071286666666665,
"min": 1.3962925333333334,
"max": 2.6774824000000006,
"count": 100
},
"Pyramids.Policy.Beta.mean": {
"value": 6.086812857142845e-05,
"min": 6.086812857142845e-05,
"max": 0.009947089154285714,
"count": 100
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0008521537999999982,
"min": 0.0008521537999999982,
"max": 0.12532169966,
"count": 100
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.005503428168594837,
"min": 0.005443856120109558,
"max": 0.40362200140953064,
"count": 100
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.07704799622297287,
"min": 0.07621398568153381,
"max": 2.8253540992736816,
"count": 100
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 192.23225806451612,
"min": 192.23225806451612,
"max": 999.0,
"count": 100
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29796.0,
"min": 16615.0,
"max": 32833.0,
"count": 100
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.8077677302783535,
"min": -0.9999750521965325,
"max": 1.8077677302783535,
"count": 100
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 280.2039981931448,
"min": -31.99920167028904,
"max": 280.2039981931448,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.8077677302783535,
"min": -0.9999750521965325,
"max": 1.8077677302783535,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 280.2039981931448,
"min": -31.99920167028904,
"max": 280.2039981931448,
"count": 100
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.011040707466646938,
"min": 0.011040707466646938,
"max": 8.34357355009107,
"count": 100
},
"Pyramids.Policy.RndReward.sum": {
"value": 1.7113096573302755,
"min": 1.611937693465734,
"max": 141.8407503515482,
"count": 100
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1691108191",
"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1691115862"
},
"total": 7671.008981160001,
"count": 1,
"self": 0.5333794560010574,
"children": {
"run_training.setup": {
"total": 0.05706278700006351,
"count": 1,
"self": 0.05706278700006351
},
"TrainerController.start_learning": {
"total": 7670.418538917,
"count": 1,
"self": 4.3863660430461096,
"children": {
"TrainerController._reset_env": {
"total": 5.0868495209999764,
"count": 1,
"self": 5.0868495209999764
},
"TrainerController.advance": {
"total": 7660.843329399954,
"count": 194826,
"self": 4.426356907940317,
"children": {
"env_step": {
"total": 5607.0756717761915,
"count": 194826,
"self": 5272.292259553346,
"children": {
"SubprocessEnvManager._take_step": {
"total": 332.2392115490071,
"count": 194826,
"self": 14.541813471979935,
"children": {
"TorchPolicy.evaluate": {
"total": 317.6973980770272,
"count": 187558,
"self": 317.6973980770272
}
}
},
"workers": {
"total": 2.544200673837736,
"count": 194826,
"self": 0.0,
"children": {
"worker_root": {
"total": 7653.047324228084,
"count": 194826,
"is_parallel": true,
"self": 2739.9415117831577,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0028090659999406853,
"count": 1,
"is_parallel": true,
"self": 0.000783813000111877,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0020252529998288082,
"count": 8,
"is_parallel": true,
"self": 0.0020252529998288082
}
}
},
"UnityEnvironment.step": {
"total": 0.045778663999954006,
"count": 1,
"is_parallel": true,
"self": 0.0005522519999203723,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004893160000847274,
"count": 1,
"is_parallel": true,
"self": 0.0004893160000847274
},
"communicator.exchange": {
"total": 0.04286552700000357,
"count": 1,
"is_parallel": true,
"self": 0.04286552700000357
},
"steps_from_proto": {
"total": 0.0018715689999453389,
"count": 1,
"is_parallel": true,
"self": 0.0003429679998134816,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0015286010001318573,
"count": 8,
"is_parallel": true,
"self": 0.0015286010001318573
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 4913.105812444926,
"count": 194825,
"is_parallel": true,
"self": 106.07971303896011,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 69.742620872197,
"count": 194825,
"is_parallel": true,
"self": 69.742620872197
},
"communicator.exchange": {
"total": 4411.053334296899,
"count": 194825,
"is_parallel": true,
"self": 4411.053334296899
},
"steps_from_proto": {
"total": 326.23014423686993,
"count": 194825,
"is_parallel": true,
"self": 64.20461575541594,
"children": {
"_process_rank_one_or_two_observation": {
"total": 262.025528481454,
"count": 1558600,
"is_parallel": true,
"self": 262.025528481454
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2049.3413007158224,
"count": 194826,
"self": 8.248276518858347,
"children": {
"process_trajectory": {
"total": 350.4150544439759,
"count": 194826,
"self": 349.70366725497445,
"children": {
"RLTrainer._checkpoint": {
"total": 0.7113871890014707,
"count": 6,
"self": 0.7113871890014707
}
}
},
"_update_policy": {
"total": 1690.677969752988,
"count": 1393,
"self": 1105.4793974299164,
"children": {
"TorchPPOOptimizer.update": {
"total": 585.1985723230715,
"count": 68376,
"self": 585.1985723230715
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.539999155094847e-07,
"count": 1,
"self": 9.539999155094847e-07
},
"TrainerController._save_models": {
"total": 0.10199299899977632,
"count": 1,
"self": 0.0013946660001238342,
"children": {
"RLTrainer._checkpoint": {
"total": 0.10059833299965248,
"count": 1,
"self": 0.10059833299965248
}
}
}
}
}
}
}