poca-SoccerTwos / run_logs /timers.json
Balab2021's picture
First Push
a071d94 verified
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 3.295729160308838,
"min": 3.2957284450531006,
"max": 3.295729160308838,
"count": 2
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 93335.046875,
"min": 93335.046875,
"max": 105463.3125,
"count": 2
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 702.2,
"min": 702.2,
"max": 780.3333333333334,
"count": 2
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 14044.0,
"min": 14044.0,
"max": 28092.0,
"count": 2
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1200.9928540150988,
"min": 1200.5792730868427,
"max": 1200.9928540150988,
"count": 2
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 7205.9571240905925,
"min": 7203.475638521056,
"max": 7205.9571240905925,
"count": 2
},
"SoccerTwos.Step.mean": {
"value": 19326.0,
"min": 9064.0,
"max": 19326.0,
"count": 2
},
"SoccerTwos.Step.sum": {
"value": 19326.0,
"min": 9064.0,
"max": 19326.0,
"count": 2
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.025762788951396942,
"min": -0.025770632550120354,
"max": -0.025762788951396942,
"count": 2
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.33491626381874084,
"min": -0.33501821756362915,
"max": -0.33491626381874084,
"count": 2
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.02579621784389019,
"min": -0.025808317586779594,
"max": -0.02579621784389019,
"count": 2
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.3353508412837982,
"min": -0.3355081379413605,
"max": -0.3353508412837982,
"count": 2
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.01926153439741868,
"min": -0.01926153439741868,
"max": 0.041876921286949746,
"count": 2
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -0.25039994716644287,
"min": -0.25039994716644287,
"max": 0.5443999767303467,
"count": 2
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.01926153439741868,
"min": -0.01926153439741868,
"max": 0.041876921286949746,
"count": 2
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -0.25039994716644287,
"min": -0.25039994716644287,
"max": 0.5443999767303467,
"count": 2
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1739327023",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/linux/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.6.0+cu124",
"numpy_version": "1.23.5",
"end_time_seconds": "1739327115"
},
"total": 91.3590518559995,
"count": 1,
"self": 0.5813182309993863,
"children": {
"run_training.setup": {
"total": 0.037224699999569566,
"count": 1,
"self": 0.037224699999569566
},
"TrainerController.start_learning": {
"total": 90.74050892500054,
"count": 1,
"self": 0.098852832978082,
"children": {
"TrainerController._reset_env": {
"total": 4.207128800999271,
"count": 1,
"self": 4.207128800999271
},
"TrainerController.advance": {
"total": 86.43452588502441,
"count": 1889,
"self": 0.10271048397407867,
"children": {
"env_step": {
"total": 74.05656635300329,
"count": 1889,
"self": 58.877999243075465,
"children": {
"SubprocessEnvManager._take_step": {
"total": 15.13365142796647,
"count": 1889,
"self": 0.9496862819141825,
"children": {
"TorchPolicy.evaluate": {
"total": 14.183965146052287,
"count": 3770,
"self": 14.183965146052287
}
}
},
"workers": {
"total": 0.04491568196135631,
"count": 1889,
"self": 0.0,
"children": {
"worker_root": {
"total": 88.87652832899221,
"count": 1889,
"is_parallel": true,
"self": 39.063370873960594,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.004659684002035647,
"count": 2,
"is_parallel": true,
"self": 0.0012968069968337659,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.003362877005201881,
"count": 8,
"is_parallel": true,
"self": 0.003362877005201881
}
}
},
"UnityEnvironment.step": {
"total": 0.08096612200097297,
"count": 1,
"is_parallel": true,
"self": 0.0014558850016328506,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.000837006000438123,
"count": 1,
"is_parallel": true,
"self": 0.000837006000438123
},
"communicator.exchange": {
"total": 0.07441111799926148,
"count": 1,
"is_parallel": true,
"self": 0.07441111799926148
},
"steps_from_proto": {
"total": 0.004262112999640522,
"count": 2,
"is_parallel": true,
"self": 0.0008486339993396541,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0034134790003008675,
"count": 8,
"is_parallel": true,
"self": 0.0034134790003008675
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 49.813157455031615,
"count": 1888,
"is_parallel": true,
"self": 2.9011671101015963,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 2.0474009170084173,
"count": 1888,
"is_parallel": true,
"self": 2.0474009170084173
},
"communicator.exchange": {
"total": 35.63251080200462,
"count": 1888,
"is_parallel": true,
"self": 35.63251080200462
},
"steps_from_proto": {
"total": 9.232078625916984,
"count": 3776,
"is_parallel": true,
"self": 1.7188067538590985,
"children": {
"_process_rank_one_or_two_observation": {
"total": 7.513271872057885,
"count": 15104,
"is_parallel": true,
"self": 7.513271872057885
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 12.275249048047044,
"count": 1889,
"self": 0.3977916850362817,
"children": {
"process_trajectory": {
"total": 11.065535048010133,
"count": 1889,
"self": 11.065535048010133
},
"_update_policy": {
"total": 0.8119223150006292,
"count": 1,
"self": 0.8119223150006292
}
}
}
}
},
"trainer_threads": {
"total": 1.405998773407191e-06,
"count": 1,
"self": 1.405998773407191e-06
}
}
}
}
}