| { |
| "name": "root", |
| "gauges": { |
| "SoccerTwos.Policy.Entropy.mean": { |
| "value": 1.3616080284118652, |
| "min": 1.2583924531936646, |
| "max": 3.295762062072754, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.Entropy.sum": { |
| "value": 28277.875, |
| "min": 22359.94140625, |
| "max": 110288.1953125, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.mean": { |
| "value": 53.07446808510638, |
| "min": 38.864, |
| "max": 999.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.EpisodeLength.sum": { |
| "value": 19956.0, |
| "min": 14884.0, |
| "max": 25296.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Self-play.ELO.mean": { |
| "value": 1598.0596790498014, |
| "min": 1195.0944019587976, |
| "max": 1728.4064925176488, |
| "count": 4996 |
| }, |
| "SoccerTwos.Self-play.ELO.sum": { |
| "value": 300435.21966136264, |
| "min": 2392.146529634802, |
| "max": 397665.68492539297, |
| "count": 4996 |
| }, |
| "SoccerTwos.Step.mean": { |
| "value": 49999920.0, |
| "min": 9664.0, |
| "max": 49999920.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Step.sum": { |
| "value": 49999920.0, |
| "min": 9664.0, |
| "max": 49999920.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
| "value": -0.025699233636260033, |
| "min": -0.13865908980369568, |
| "max": 0.1619817018508911, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
| "value": -4.805756568908691, |
| "min": -25.709543228149414, |
| "max": 27.536890029907227, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
| "value": -0.026782628148794174, |
| "min": -0.14225316047668457, |
| "max": 0.16532564163208008, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
| "value": -5.0083513259887695, |
| "min": -25.85490608215332, |
| "max": 28.10536003112793, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.mean": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.CumulativeReward.sum": { |
| "value": 0.0, |
| "min": 0.0, |
| "max": 0.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { |
| "value": -0.04190160373952937, |
| "min": -0.625, |
| "max": 0.3768250048160553, |
| "count": 5000 |
| }, |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { |
| "value": -7.835599899291992, |
| "min": -67.18280017375946, |
| "max": 62.96679985523224, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { |
| "value": -0.04190160373952937, |
| "min": -0.625, |
| "max": 0.3768250048160553, |
| "count": 5000 |
| }, |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { |
| "value": -7.835599899291992, |
| "min": -67.18280017375946, |
| "max": 62.96679985523224, |
| "count": 5000 |
| }, |
| "SoccerTwos.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 5000 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.mean": { |
| "value": 0.017462212400278076, |
| "min": 0.009035884733990921, |
| "max": 0.025665317429229617, |
| "count": 2425 |
| }, |
| "SoccerTwos.Losses.PolicyLoss.sum": { |
| "value": 0.017462212400278076, |
| "min": 0.009035884733990921, |
| "max": 0.025665317429229617, |
| "count": 2425 |
| }, |
| "SoccerTwos.Losses.ValueLoss.mean": { |
| "value": 0.1065414510667324, |
| "min": 0.0008842718370336418, |
| "max": 0.12906330823898315, |
| "count": 2425 |
| }, |
| "SoccerTwos.Losses.ValueLoss.sum": { |
| "value": 0.1065414510667324, |
| "min": 0.0008842718370336418, |
| "max": 0.12906330823898315, |
| "count": 2425 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.mean": { |
| "value": 0.10812452683846156, |
| "min": 0.0008870263952606668, |
| "max": 0.13241908450921377, |
| "count": 2425 |
| }, |
| "SoccerTwos.Losses.BaselineLoss.sum": { |
| "value": 0.10812452683846156, |
| "min": 0.0008870263952606668, |
| "max": 0.13241908450921377, |
| "count": 2425 |
| }, |
| "SoccerTwos.Policy.LearningRate.mean": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 2425 |
| }, |
| "SoccerTwos.Policy.LearningRate.sum": { |
| "value": 0.0003, |
| "min": 0.0003, |
| "max": 0.0003, |
| "count": 2425 |
| }, |
| "SoccerTwos.Policy.Epsilon.mean": { |
| "value": 0.20000000000000007, |
| "min": 0.20000000000000007, |
| "max": 0.20000000000000007, |
| "count": 2425 |
| }, |
| "SoccerTwos.Policy.Epsilon.sum": { |
| "value": 0.20000000000000007, |
| "min": 0.20000000000000007, |
| "max": 0.20000000000000007, |
| "count": 2425 |
| }, |
| "SoccerTwos.Policy.Beta.mean": { |
| "value": 0.005000000000000001, |
| "min": 0.005000000000000001, |
| "max": 0.005000000000000001, |
| "count": 2425 |
| }, |
| "SoccerTwos.Policy.Beta.sum": { |
| "value": 0.005000000000000001, |
| "min": 0.005000000000000001, |
| "max": 0.005000000000000001, |
| "count": 2425 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1683853768", |
| "python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]", |
| "command_line_arguments": "/home/ark/.miniconda3/envs/deep-rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", |
| "mlagents_version": "0.31.0.dev0", |
| "mlagents_envs_version": "0.31.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "1.11.0+cu113", |
| "numpy_version": "1.21.2", |
| "end_time_seconds": "1683906274" |
| }, |
| "total": 52506.21998502896, |
| "count": 1, |
| "self": 0.2684874410042539, |
| "children": { |
| "run_training.setup": { |
| "total": 0.01312148297438398, |
| "count": 1, |
| "self": 0.01312148297438398 |
| }, |
| "TrainerController.start_learning": { |
| "total": 52505.93837610498, |
| "count": 1, |
| "self": 61.689565332082566, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 7.803456781432033, |
| "count": 250, |
| "self": 7.803456781432033 |
| }, |
| "TrainerController.advance": { |
| "total": 52436.307568769495, |
| "count": 3457468, |
| "self": 65.59610899613472, |
| "children": { |
| "env_step": { |
| "total": 39085.2176601697, |
| "count": 3457468, |
| "self": 29407.445092021197, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 9640.886361224926, |
| "count": 3457468, |
| "self": 285.5095421230071, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 9355.376819101919, |
| "count": 6277032, |
| "self": 9355.376819101919 |
| } |
| } |
| }, |
| "workers": { |
| "total": 36.88620692357654, |
| "count": 3457468, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 52438.728711235744, |
| "count": 3457468, |
| "is_parallel": true, |
| "self": 28772.39803970972, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.009463751979637891, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.008115717966575176, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0013480340130627155, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0013480340130627155 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.022137401974759996, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003626939724199474, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.00036192400148138404, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00036192400148138404 |
| }, |
| "communicator.exchange": { |
| "total": 0.02030703501077369, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.02030703501077369 |
| }, |
| "steps_from_proto": { |
| "total": 0.001105748990084976, |
| "count": 2, |
| "is_parallel": true, |
| "self": 0.0002536699757911265, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0008520790142938495, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0008520790142938495 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 23665.917796976806, |
| "count": 3457467, |
| "is_parallel": true, |
| "self": 1429.4596847074572, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 932.3081354034366, |
| "count": 3457467, |
| "is_parallel": true, |
| "self": 932.3081354034366 |
| }, |
| "communicator.exchange": { |
| "total": 17250.80261331302, |
| "count": 3457467, |
| "is_parallel": true, |
| "self": 17250.80261331302 |
| }, |
| "steps_from_proto": { |
| "total": 4053.3473635528935, |
| "count": 6914934, |
| "is_parallel": true, |
| "self": 799.3124663241324, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 3254.034897228761, |
| "count": 27659736, |
| "is_parallel": true, |
| "self": 3254.034897228761 |
| } |
| } |
| } |
| } |
| }, |
| "steps_from_proto": { |
| "total": 0.41287454921985045, |
| "count": 498, |
| "is_parallel": true, |
| "self": 0.08557594433659688, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.3272986048832536, |
| "count": 1992, |
| "is_parallel": true, |
| "self": 0.3272986048832536 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 13285.49379960366, |
| "count": 3457468, |
| "self": 466.44135415990604, |
| "children": { |
| "process_trajectory": { |
| "total": 5813.522965371667, |
| "count": 3457468, |
| "self": 5799.7422991369385, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 13.780666234728415, |
| "count": 100, |
| "self": 13.780666234728415 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 7005.529480072088, |
| "count": 2425, |
| "self": 4734.089757825423, |
| "children": { |
| "TorchPOCAOptimizer.update": { |
| "total": 2271.439722246665, |
| "count": 72750, |
| "self": 2271.439722246665 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.9560102373361588e-06, |
| "count": 1, |
| "self": 1.9560102373361588e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.13778326596366242, |
| "count": 1, |
| "self": 0.0009318289812654257, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.136851436982397, |
| "count": 1, |
| "self": 0.136851436982397 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |