poca-SoccerTwos / run_logs /timers.json
debisoft's picture
6th Push
c44d494 verified
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.5435189008712769,
"min": 1.4646319150924683,
"max": 1.6610451936721802,
"count": 500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 31759.4453125,
"min": 25814.9765625,
"max": 36021.5078125,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 58.79761904761905,
"min": 42.716814159292035,
"max": 82.63333333333334,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19756.0,
"min": 18480.0,
"max": 20628.0,
"count": 500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1641.0530434980756,
"min": 1581.3414240873562,
"max": 1645.42222380018,
"count": 500
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 275696.9113076767,
"min": 194048.29977610603,
"max": 373368.55337094323,
"count": 500
},
"SoccerTwos.Step.mean": {
"value": 14999981.0,
"min": 10009960.0,
"max": 14999981.0,
"count": 500
},
"SoccerTwos.Step.sum": {
"value": 14999981.0,
"min": 10009960.0,
"max": 14999981.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.0025916770100593567,
"min": -0.11438218504190445,
"max": 0.07807338982820511,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.4379934072494507,
"min": -23.128673553466797,
"max": 14.677797317504883,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.0026981872506439686,
"min": -0.11424611508846283,
"max": 0.07508175075054169,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 0.45599365234375,
"min": -23.13912582397461,
"max": 14.11536979675293,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.02577988283168635,
"min": -0.3560073624359318,
"max": 0.2735396422578033,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -4.356800198554993,
"min": -58.029200077056885,
"max": 46.228199541568756,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.02577988283168635,
"min": -0.3560073624359318,
"max": 0.2735396422578033,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -4.356800198554993,
"min": -58.029200077056885,
"max": 46.228199541568756,
"count": 500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.012675322993891314,
"min": 0.008311386445226769,
"max": 0.016500145032963095,
"count": 121
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.012675322993891314,
"min": 0.008311386445226769,
"max": 0.016500145032963095,
"count": 121
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.12124239106973013,
"min": 0.10481940135359764,
"max": 0.1345561275879542,
"count": 121
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.12124239106973013,
"min": 0.10481940135359764,
"max": 0.1345561275879542,
"count": 121
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.12398228074113528,
"min": 0.10591413453221321,
"max": 0.1369128222266833,
"count": 121
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.12398228074113528,
"min": 0.10591413453221321,
"max": 0.1369128222266833,
"count": 121
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.00019999999999999996,
"min": 0.00019999999999999996,
"max": 0.00019999999999999996,
"count": 121
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.00019999999999999996,
"min": 0.00019999999999999996,
"max": 0.00019999999999999996,
"count": 121
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 121
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 121
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 121
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 121
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1761011053",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/home/ada/work/ai/venv3.10/bin/mlagents-learn ./config/poca/SoccerTwosGo.yaml --resume --env=./training-envs-executables/linux/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.9.0+cu128",
"numpy_version": "1.23.5",
"end_time_seconds": "1761019758"
},
"total": 8704.57901644602,
"count": 1,
"self": 0.9726788210100494,
"children": {
"run_training.setup": {
"total": 0.024575264018494636,
"count": 1,
"self": 0.024575264018494636
},
"TrainerController.start_learning": {
"total": 8703.581762360991,
"count": 1,
"self": 7.502892200194765,
"children": {
"TrainerController._reset_env": {
"total": 2.129385295906104,
"count": 26,
"self": 2.129385295906104
},
"TrainerController.advance": {
"total": 8691.612080165913,
"count": 347303,
"self": 6.230914909858257,
"children": {
"env_step": {
"total": 6704.959744712687,
"count": 347303,
"self": 5021.182745416998,
"children": {
"SubprocessEnvManager._take_step": {
"total": 1678.7599376246217,
"count": 347303,
"self": 39.04678861272987,
"children": {
"TorchPolicy.evaluate": {
"total": 1639.7131490118918,
"count": 627670,
"self": 1639.7131490118918
}
}
},
"workers": {
"total": 5.017061671067495,
"count": 347303,
"self": 0.0,
"children": {
"worker_root": {
"total": 8685.496602965024,
"count": 347303,
"is_parallel": true,
"self": 4470.667818740127,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.002683888975298032,
"count": 2,
"is_parallel": true,
"self": 0.000585997971938923,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.002097891003359109,
"count": 8,
"is_parallel": true,
"self": 0.002097891003359109
}
}
},
"UnityEnvironment.step": {
"total": 0.021987969987094402,
"count": 1,
"is_parallel": true,
"self": 0.0004761809832416475,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00046435699914582074,
"count": 1,
"is_parallel": true,
"self": 0.00046435699914582074
},
"communicator.exchange": {
"total": 0.01973794001969509,
"count": 1,
"is_parallel": true,
"self": 0.01973794001969509
},
"steps_from_proto": {
"total": 0.0013094919850118458,
"count": 2,
"is_parallel": true,
"self": 0.00024246098473668098,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0010670310002751648,
"count": 8,
"is_parallel": true,
"self": 0.0010670310002751648
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.05173607706092298,
"count": 50,
"is_parallel": true,
"self": 0.008709836401976645,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.043026240658946335,
"count": 200,
"is_parallel": true,
"self": 0.043026240658946335
}
}
},
"UnityEnvironment.step": {
"total": 4214.7770481478365,
"count": 347302,
"is_parallel": true,
"self": 237.83366664528148,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 162.09566081810044,
"count": 347302,
"is_parallel": true,
"self": 162.09566081810044
},
"communicator.exchange": {
"total": 3184.5067745028355,
"count": 347302,
"is_parallel": true,
"self": 3184.5067745028355
},
"steps_from_proto": {
"total": 630.3409461816191,
"count": 694604,
"is_parallel": true,
"self": 106.73629873536993,
"children": {
"_process_rank_one_or_two_observation": {
"total": 523.6046474462491,
"count": 2778416,
"is_parallel": true,
"self": 523.6046474462491
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1980.4214205433673,
"count": 347303,
"self": 60.59123472208739,
"children": {
"process_trajectory": {
"total": 951.9022839034442,
"count": 347303,
"self": 928.9015034834156,
"children": {
"RLTrainer._checkpoint": {
"total": 23.000780420028605,
"count": 10,
"self": 23.000780420028605
}
}
},
"_update_policy": {
"total": 967.9279019178357,
"count": 121,
"self": 540.7814483185066,
"children": {
"TorchPOCAOptimizer.update": {
"total": 427.1464535993291,
"count": 3630,
"self": 427.1464535993291
}
}
}
}
}
}
},
"trainer_threads": {
"total": 5.709880497306585e-07,
"count": 1,
"self": 5.709880497306585e-07
},
"TrainerController._save_models": {
"total": 2.33740412798943,
"count": 1,
"self": 0.15179298998555169,
"children": {
"RLTrainer._checkpoint": {
"total": 2.1856111380038783,
"count": 1,
"self": 2.1856111380038783
}
}
}
}
}
}
}