{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 2.4907772541046143, "min": 1.1685776710510254, "max": 3.1593832969665527, "count": 99 }, "SoccerTwos.Policy.Entropy.sum": { "value": 245570.71875, "min": 107051.890625, "max": 366161.34375, "count": 99 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 984.2692307692307, "min": 664.921052631579, "max": 999.0, "count": 99 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 102364.0, "min": 63904.0, "max": 121016.0, "count": 99 }, "SoccerTwos.Step.mean": { "value": 9999542.0, "min": 5099622.0, "max": 9999542.0, "count": 99 }, "SoccerTwos.Step.sum": { "value": 9999542.0, "min": 5099622.0, "max": 9999542.0, "count": 99 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.0001826496300054714, "min": -0.01437555905431509, "max": 0.017843715846538544, "count": 99 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -0.009315131232142448, "min": -0.8481580018997192, "max": 0.9278731942176819, "count": 99 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.00024330221640411764, "min": -0.013751156628131866, "max": 0.018771987408399582, "count": 99 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -0.012408412992954254, "min": -0.8792648315429688, "max": 0.9761433005332947, "count": 99 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 99 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 99 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": -0.0392156862745098, "min": -0.2734444447689586, "max": 0.07507936538211883, "count": 99 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": -2.0, "min": -19.68800002336502, "max": 4.730000019073486, "count": 99 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": -0.0392156862745098, "min": -0.2734444447689586, "max": 0.07507936538211883, "count": 99 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": -2.0, "min": -19.68800002336502, "max": 4.730000019073486, "count": 99 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 99 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 99 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.017561657571786782, "min": 0.01264058340683126, "max": 0.019526855821762487, "count": 98 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.035123315143573565, "min": 0.013353993123746476, "max": 0.05705379659581619, "count": 98 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.00041136964250351184, "min": 3.481565622218439e-10, "max": 0.0038090936238101376, "count": 98 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.0008227392850070237, "min": 6.220758618101661e-10, "max": 0.010206666128942743, "count": 98 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.00041130511440758594, "min": 3.4311148498006936e-10, "max": 0.0038083288168612246, "count": 98 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.0008226102288151719, "min": 6.582947282963837e-10, "max": 0.010377476842647108, "count": 98 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 98 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0006, "min": 0.0003, "max": 0.0009, "count": 98 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.19999999999999993, "max": 0.20000000000000007, "count": 98 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.40000000000000013, "min": 0.19999999999999993, "max": 0.6000000000000002, "count": 98 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005000000000000001, "min": 0.005, "max": 0.005000000000000001, "count": 98 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.010000000000000002, "min": 0.005, "max": 0.015000000000000003, "count": 98 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1223.7534638982459, "min": 1210.1671495708435, "max": 1226.8819693882956, "count": 32 }, "SoccerTwos.Self-play.ELO.sum": { "value": 2447.5069277964917, "min": 2420.334299141687, "max": 41242.957665294176, "count": 32 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1765546652", "python_version": "3.10.12 | packaged by conda-forge | (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]", "command_line_arguments": "/zhome/b6/d/203017/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume", "mlagents_version": "1.2.0.dev0", "mlagents_envs_version": "1.2.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.8.0+cu128", "numpy_version": "1.23.5", "end_time_seconds": "1765554821" }, "total": 8169.391451666976, "count": 1, "self": 0.3792129899957217, "children": { "run_training.setup": { "total": 0.05216734399436973, "count": 1, "self": 0.05216734399436973 }, "TrainerController.start_learning": { "total": 8168.9600713329855, "count": 1, "self": 6.423729272006312, "children": { "TrainerController._reset_env": { "total": 6.558995136030717, "count": 26, "self": 6.558995136030717 }, "TrainerController.advance": { "total": 8155.0617587179295, "count": 317123, "self": 6.362516603490803, "children": { "env_step": { "total": 6535.787821058155, "count": 317123, "self": 4537.74635747078, "children": { "SubprocessEnvManager._take_step": { "total": 1994.202184700087, "count": 317123, "self": 46.02341712030466, "children": { "TorchPolicy.evaluate": { "total": 1948.1787675797823, "count": 630866, "self": 1948.1787675797823 } } }, "workers": { "total": 3.8392788872879464, "count": 317123, "self": 0.0, "children": { "worker_root": { "total": 8155.599799093412, "count": 317123, "is_parallel": true, "self": 4466.816637556563, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.004833491984754801, "count": 2, "is_parallel": true, "self": 0.0027776629431173205, "children": { "_process_rank_one_or_two_observation": { "total": 0.0020558290416374803, "count": 8, "is_parallel": true, "self": 0.0020558290416374803 } } }, "UnityEnvironment.step": { "total": 0.029922885005362332, "count": 1, "is_parallel": true, "self": 0.0007064379460643977, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0005496130033861846, "count": 1, "is_parallel": true, "self": 0.0005496130033861846 }, "communicator.exchange": { "total": 0.026616044022375718, "count": 1, "is_parallel": true, "self": 0.026616044022375718 }, "steps_from_proto": { "total": 0.002050790033536032, "count": 2, "is_parallel": true, "self": 0.0004255690728314221, "children": { "_process_rank_one_or_two_observation": { "total": 0.0016252209607046098, "count": 8, "is_parallel": true, "self": 0.0016252209607046098 } } } } } } }, "steps_from_proto": { "total": 0.04827410803409293, "count": 50, "is_parallel": true, "self": 0.009163186972727999, "children": { "_process_rank_one_or_two_observation": { "total": 0.039110921061364934, "count": 200, "is_parallel": true, "self": 0.039110921061364934 } } }, "UnityEnvironment.step": { "total": 3688.7348874288145, "count": 317122, "is_parallel": true, "self": 186.91520221577957, "children": { "UnityEnvironment._generate_step_input": { "total": 129.14363695765496, "count": 317122, "is_parallel": true, "self": 129.14363695765496 }, "communicator.exchange": { "total": 2813.859523506253, "count": 317122, "is_parallel": true, "self": 2813.859523506253 }, "steps_from_proto": { "total": 558.816524749127, "count": 634244, "is_parallel": true, "self": 101.99654760936392, "children": { "_process_rank_one_or_two_observation": { "total": 456.81997713976307, "count": 2536976, "is_parallel": true, "self": 456.81997713976307 } } } } } } } } } } }, "trainer_advance": { "total": 1612.9114210562839, "count": 317123, "self": 66.02497788210167, "children": { "process_trajectory": { "total": 460.47966692826594, "count": 317123, "self": 451.7735055142839, "children": { "RLTrainer._checkpoint": { "total": 8.706161413982045, "count": 10, "self": 8.706161413982045 } } }, "_update_policy": { "total": 1086.4067762459163, "count": 208, "self": 692.196635984903, "children": { "TorchPOCAOptimizer.update": { "total": 394.2101402610133, "count": 6801, "self": 394.2101402610133 } } } } } } }, "trainer_threads": { "total": 9.190116543322802e-07, "count": 1, "self": 9.190116543322802e-07 }, "TrainerController._save_models": { "total": 0.915587288007373, "count": 1, "self": 0.03353284898912534, "children": { "RLTrainer._checkpoint": { "total": 0.8820544390182476, "count": 1, "self": 0.8820544390182476 } } } } } } }