6th Push

c44d494 verified 6 months ago

20.3 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.5435189008712769,
	"min": 1.4646319150924683,
	"max": 1.6610451936721802,
	"count": 500
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 31759.4453125,
	"min": 25814.9765625,
	"max": 36021.5078125,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 58.79761904761905,
	"min": 42.716814159292035,
	"max": 82.63333333333334,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19756.0,
	"min": 18480.0,
	"max": 20628.0,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1641.0530434980756,
	"min": 1581.3414240873562,
	"max": 1645.42222380018,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 275696.9113076767,
	"min": 194048.29977610603,
	"max": 373368.55337094323,
	"count": 500
	},
	"SoccerTwos.Step.mean": {
	"value": 14999981.0,
	"min": 10009960.0,
	"max": 14999981.0,
	"count": 500
	},
	"SoccerTwos.Step.sum": {
	"value": 14999981.0,
	"min": 10009960.0,
	"max": 14999981.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.0025916770100593567,
	"min": -0.11438218504190445,
	"max": 0.07807338982820511,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -0.4379934072494507,
	"min": -23.128673553466797,
	"max": 14.677797317504883,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.0026981872506439686,
	"min": -0.11424611508846283,
	"max": 0.07508175075054169,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 0.45599365234375,
	"min": -23.13912582397461,
	"max": 14.11536979675293,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.02577988283168635,
	"min": -0.3560073624359318,
	"max": 0.2735396422578033,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -4.356800198554993,
	"min": -58.029200077056885,
	"max": 46.228199541568756,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.02577988283168635,
	"min": -0.3560073624359318,
	"max": 0.2735396422578033,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -4.356800198554993,
	"min": -58.029200077056885,
	"max": 46.228199541568756,
	"count": 500
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.012675322993891314,
	"min": 0.008311386445226769,
	"max": 0.016500145032963095,
	"count": 121
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.012675322993891314,
	"min": 0.008311386445226769,
	"max": 0.016500145032963095,
	"count": 121
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.12124239106973013,
	"min": 0.10481940135359764,
	"max": 0.1345561275879542,
	"count": 121
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.12124239106973013,
	"min": 0.10481940135359764,
	"max": 0.1345561275879542,
	"count": 121
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.12398228074113528,
	"min": 0.10591413453221321,
	"max": 0.1369128222266833,
	"count": 121
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.12398228074113528,
	"min": 0.10591413453221321,
	"max": 0.1369128222266833,
	"count": 121
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.00019999999999999996,
	"min": 0.00019999999999999996,
	"max": 0.00019999999999999996,
	"count": 121
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.00019999999999999996,
	"min": 0.00019999999999999996,
	"max": 0.00019999999999999996,
	"count": 121
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 121
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 121
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 121
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 121
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1761011053",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/home/ada/work/ai/venv3.10/bin/mlagents-learn ./config/poca/SoccerTwosGo.yaml --resume --env=./training-envs-executables/linux/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.9.0+cu128",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1761019758"
	},
	"total": 8704.57901644602,
	"count": 1,
	"self": 0.9726788210100494,
	"children": {
	"run_training.setup": {
	"total": 0.024575264018494636,
	"count": 1,
	"self": 0.024575264018494636
	},
	"TrainerController.start_learning": {
	"total": 8703.581762360991,
	"count": 1,
	"self": 7.502892200194765,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.129385295906104,
	"count": 26,
	"self": 2.129385295906104
	},
	"TrainerController.advance": {
	"total": 8691.612080165913,
	"count": 347303,
	"self": 6.230914909858257,
	"children": {
	"env_step": {
	"total": 6704.959744712687,
	"count": 347303,
	"self": 5021.182745416998,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1678.7599376246217,
	"count": 347303,
	"self": 39.04678861272987,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1639.7131490118918,
	"count": 627670,
	"self": 1639.7131490118918
	}
	}
	},
	"workers": {
	"total": 5.017061671067495,
	"count": 347303,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 8685.496602965024,
	"count": 347303,
	"is_parallel": true,
	"self": 4470.667818740127,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002683888975298032,
	"count": 2,
	"is_parallel": true,
	"self": 0.000585997971938923,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.002097891003359109,
	"count": 8,
	"is_parallel": true,
	"self": 0.002097891003359109
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.021987969987094402,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004761809832416475,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00046435699914582074,
	"count": 1,
	"is_parallel": true,
	"self": 0.00046435699914582074
	},
	"communicator.exchange": {
	"total": 0.01973794001969509,
	"count": 1,
	"is_parallel": true,
	"self": 0.01973794001969509
	},
	"steps_from_proto": {
	"total": 0.0013094919850118458,
	"count": 2,
	"is_parallel": true,
	"self": 0.00024246098473668098,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0010670310002751648,
	"count": 8,
	"is_parallel": true,
	"self": 0.0010670310002751648
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.05173607706092298,
	"count": 50,
	"is_parallel": true,
	"self": 0.008709836401976645,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.043026240658946335,
	"count": 200,
	"is_parallel": true,
	"self": 0.043026240658946335
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 4214.7770481478365,
	"count": 347302,
	"is_parallel": true,
	"self": 237.83366664528148,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 162.09566081810044,
	"count": 347302,
	"is_parallel": true,
	"self": 162.09566081810044
	},
	"communicator.exchange": {
	"total": 3184.5067745028355,
	"count": 347302,
	"is_parallel": true,
	"self": 3184.5067745028355
	},
	"steps_from_proto": {
	"total": 630.3409461816191,
	"count": 694604,
	"is_parallel": true,
	"self": 106.73629873536993,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 523.6046474462491,
	"count": 2778416,
	"is_parallel": true,
	"self": 523.6046474462491
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1980.4214205433673,
	"count": 347303,
	"self": 60.59123472208739,
	"children": {
	"process_trajectory": {
	"total": 951.9022839034442,
	"count": 347303,
	"self": 928.9015034834156,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 23.000780420028605,
	"count": 10,
	"self": 23.000780420028605
	}
	}
	},
	"_update_policy": {
	"total": 967.9279019178357,
	"count": 121,
	"self": 540.7814483185066,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 427.1464535993291,
	"count": 3630,
	"self": 427.1464535993291
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 5.709880497306585e-07,
	"count": 1,
	"self": 5.709880497306585e-07
	},
	"TrainerController._save_models": {
	"total": 2.33740412798943,
	"count": 1,
	"self": 0.15179298998555169,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 2.1856111380038783,
	"count": 1,
	"self": 2.1856111380038783
	}
	}
	}
	}
	}
	}
	}