{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 3.2958028316497803, "min": 3.2958028316497803, "max": 3.2958028316497803, "count": 1 }, "SoccerTwos.Policy.Entropy.sum": { "value": 105465.6875, "min": 105465.6875, "max": 105465.6875, "count": 1 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 698.7272727272727, "min": 698.7272727272727, "max": 698.7272727272727, "count": 1 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 30744.0, "min": 30744.0, "max": 30744.0, "count": 1 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1200.786063550971, "min": 1200.786063550971, "max": 1200.786063550971, "count": 1 }, "SoccerTwos.Self-play.ELO.sum": { "value": 14409.432762611652, "min": 14409.432762611652, "max": 14409.432762611652, "count": 1 }, "SoccerTwos.Step.mean": { "value": 9394.0, "min": 9394.0, "max": 9394.0, "count": 1 }, "SoccerTwos.Step.sum": { "value": 9394.0, "min": 9394.0, "max": 9394.0, "count": 1 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.058177243918180466, "min": -0.058177243918180466, "max": -0.058177243918180466, "count": 1 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -0.9308359026908875, "min": -0.9308359026908875, "max": -0.9308359026908875, "count": 1 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.058177318423986435, "min": -0.058177318423986435, "max": -0.058177318423986435, "count": 1 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -0.930837094783783, "min": -0.930837094783783, "max": -0.930837094783783, "count": 1 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 1 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 1 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.2280499991029501, "min": 0.2280499991029501, "max": 0.2280499991029501, "count": 1 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 3.6487999856472015, "min": 3.6487999856472015, "max": 3.6487999856472015, "count": 1 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.2280499991029501, "min": 0.2280499991029501, "max": 0.2280499991029501, "count": 1 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 3.6487999856472015, "min": 3.6487999856472015, "max": 3.6487999856472015, "count": 1 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 1 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 1 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1681223005", "python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]", "command_line_arguments": "/home/chenoi1/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --resume", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1", "numpy_version": "1.21.2", "end_time_seconds": "1681223018" }, "total": 13.249850724998396, "count": 1, "self": 0.1672355659902678, "children": { "run_training.setup": { "total": 0.0042988070053979754, "count": 1, "self": 0.0042988070053979754 }, "TrainerController.start_learning": { "total": 13.07831635200273, "count": 1, "self": 0.011767759955546353, "children": { "TrainerController._reset_env": { "total": 0.4217625719975331, "count": 1, "self": 0.4217625719975331 }, "TrainerController.advance": { "total": 12.575316353053495, "count": 1005, "self": 0.010046016963315196, "children": { "env_step": { "total": 11.140344572013419, "count": 1005, "self": 9.702086679979402, "children": { "SubprocessEnvManager._take_step": { "total": 1.4315269190483377, "count": 1005, "self": 0.053430459040100686, "children": { "TorchPolicy.evaluate": { "total": 1.378096460008237, "count": 2000, "self": 1.378096460008237 } } }, "workers": { "total": 0.006730972985678818, "count": 1005, "self": 0.0, "children": { "worker_root": { "total": 12.088104250993638, "count": 1005, "is_parallel": true, "self": 3.5890393360023154, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0010192339977947995, "count": 2, "is_parallel": true, "self": 0.0002415489943814464, "children": { "_process_rank_one_or_two_observation": { "total": 0.0007776850034133531, "count": 8, "is_parallel": true, "self": 0.0007776850034133531 } } }, "UnityEnvironment.step": { "total": 0.015718985996500123, "count": 1, "is_parallel": true, "self": 0.0002712439963943325, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00020645099721150473, "count": 1, "is_parallel": true, "self": 0.00020645099721150473 }, "communicator.exchange": { "total": 0.0144167560065398, "count": 1, "is_parallel": true, "self": 0.0144167560065398 }, "steps_from_proto": { "total": 0.0008245349963544868, "count": 2, "is_parallel": true, "self": 0.00016168800357263535, "children": { "_process_rank_one_or_two_observation": { "total": 0.0006628469927818514, "count": 8, "is_parallel": true, "self": 0.0006628469927818514 } } } } } } }, "UnityEnvironment.step": { "total": 8.499064914991322, "count": 1004, "is_parallel": true, "self": 0.2413430271553807, "children": { "UnityEnvironment._generate_step_input": { "total": 0.15519495191256283, "count": 1004, "is_parallel": true, "self": 0.15519495191256283 }, "communicator.exchange": { "total": 7.336020654060121, "count": 1004, "is_parallel": true, "self": 7.336020654060121 }, "steps_from_proto": { "total": 0.7665062818632578, "count": 2008, "is_parallel": true, "self": 0.13431615439913003, "children": { "_process_rank_one_or_two_observation": { "total": 0.6321901274641277, "count": 8032, "is_parallel": true, "self": 0.6321901274641277 } } } } } } } } } } }, "trainer_advance": { "total": 1.424925764076761, "count": 1005, "self": 0.08028618992102565, "children": { "process_trajectory": { "total": 1.3446395741557353, "count": 1005, "self": 1.3446395741557353 } } } } }, "trainer_threads": { "total": 4.609973984770477e-07, "count": 1, "self": 4.609973984770477e-07 }, "TrainerController._save_models": { "total": 0.06946920599875739, "count": 1, "self": 0.0011421669987612404, "children": { "RLTrainer._checkpoint": { "total": 0.06832703899999615, "count": 1, "self": 0.06832703899999615 } } } } } } }