Push about 3.9m steps of SoccerTwos

8921bc6 almost 3 years ago

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.9089889526367188,
	"min": 1.8442237377166748,
	"max": 3.213865041732788,
	"count": 472
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 35919.53515625,
	"min": 29317.10546875,
	"max": 120344.625,
	"count": 472
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 62.17948717948718,
	"min": 42.51304347826087,
	"max": 999.0,
	"count": 472
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19400.0,
	"min": 11112.0,
	"max": 28436.0,
	"count": 472
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1556.9494059513054,
	"min": 1184.4253004330594,
	"max": 1576.660508881427,
	"count": 471
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 242884.10732840362,
	"min": 2370.6947943219175,
	"max": 334525.03998778446,
	"count": 471
	},
	"SoccerTwos.Step.mean": {
	"value": 5039949.0,
	"min": 329805.0,
	"max": 5039949.0,
	"count": 472
	},
	"SoccerTwos.Step.sum": {
	"value": 5039949.0,
	"min": 329805.0,
	"max": 5039949.0,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.010436630807816982,
	"min": -0.09697045385837555,
	"max": 0.1714733988046646,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -1.6385509967803955,
	"min": -16.600444793701172,
	"max": 23.41659164428711,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.01028787437826395,
	"min": -0.09972328692674637,
	"max": 0.17430460453033447,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -1.6151962280273438,
	"min": -17.1435546875,
	"max": 23.17365837097168,
	"count": 472
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 472
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.10489171933216654,
	"min": -0.5669750012457371,
	"max": 0.44391110796987276,
	"count": 472
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 16.467999935150146,
	"min": -50.66320013999939,
	"max": 46.512000262737274,
	"count": 472
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.10489171933216654,
	"min": -0.5669750012457371,
	"max": 0.44391110796987276,
	"count": 472
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 16.467999935150146,
	"min": -50.66320013999939,
	"max": 46.512000262737274,
	"count": 472
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 472
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 472
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.016275092681947476,
	"min": 0.010151559529488926,
	"max": 0.024196836646297015,
	"count": 227
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.016275092681947476,
	"min": 0.010151559529488926,
	"max": 0.024196836646297015,
	"count": 227
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.09684030537803968,
	"min": 0.0013416305688830714,
	"max": 0.11689281612634658,
	"count": 227
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.09684030537803968,
	"min": 0.0013416305688830714,
	"max": 0.11689281612634658,
	"count": 227
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.09833643784125647,
	"min": 0.0013579658038603763,
	"max": 0.11826808328429858,
	"count": 227
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.09833643784125647,
	"min": 0.0013579658038603763,
	"max": 0.11826808328429858,
	"count": 227
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 227
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 227
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 227
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 227
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 227
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 227
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1688468546",
	"python_version": "3.10.10 (main, Mar 21 2023, 18:45:11) [GCC 11.2.0]",
	"command_line_arguments": "/opt/conda/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1688485154"
	},
	"total": 16607.525235416368,
	"count": 1,
	"self": 0.013366627972573042,
	"children": {
	"run_training.setup": {
	"total": 0.015603977721184492,
	"count": 1,
	"self": 0.015603977721184492
	},
	"TrainerController.start_learning": {
	"total": 16607.496264810674,
	"count": 1,
	"self": 8.919515123125166,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.5175714301876724,
	"count": 25,
	"self": 1.5175714301876724
	},
	"TrainerController.advance": {
	"total": 16596.756896799896,
	"count": 322264,
	"self": 7.916705624666065,
	"children": {
	"env_step": {
	"total": 5911.727526604664,
	"count": 322264,
	"self": 4514.543463871349,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1392.023328505922,
	"count": 322264,
	"self": 49.78212635125965,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1342.2412021546625,
	"count": 595496,
	"self": 1342.2412021546625
	}
	}
	},
	"workers": {
	"total": 5.1607342273928225,
	"count": 322264,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 16555.016848264262,
	"count": 322264,
	"is_parallel": true,
	"self": 12923.445410506334,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.00312175415456295,
	"count": 2,
	"is_parallel": true,
	"self": 0.0008582943119108677,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0022634598426520824,
	"count": 8,
	"is_parallel": true,
	"self": 0.0022634598426520824
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.026854357682168484,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006880271248519421,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005317311733961105,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005317311733961105
	},
	"communicator.exchange": {
	"total": 0.023468355182558298,
	"count": 1,
	"is_parallel": true,
	"self": 0.023468355182558298
	},
	"steps_from_proto": {
	"total": 0.002166244201362133,
	"count": 2,
	"is_parallel": true,
	"self": 0.000483611598610878,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001682632602751255,
	"count": 8,
	"is_parallel": true,
	"self": 0.001682632602751255
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.053547489922493696,
	"count": 48,
	"is_parallel": true,
	"self": 0.010899828281253576,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.04264766164124012,
	"count": 192,
	"is_parallel": true,
	"self": 0.04264766164124012
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 3631.5178902680054,
	"count": 322263,
	"is_parallel": true,
	"self": 189.9846967374906,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 131.83427887735888,
	"count": 322263,
	"is_parallel": true,
	"self": 131.83427887735888
	},
	"communicator.exchange": {
	"total": 2676.0341983493418,
	"count": 322263,
	"is_parallel": true,
	"self": 2676.0341983493418
	},
	"steps_from_proto": {
	"total": 633.6647163038142,
	"count": 644526,
	"is_parallel": true,
	"self": 126.69072948535904,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 506.97398681845516,
	"count": 2578104,
	"is_parallel": true,
	"self": 506.97398681845516
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 10677.112664570566,
	"count": 322264,
	"self": 69.58496827818453,
	"children": {
	"process_trajectory": {
	"total": 1633.3974608271383,
	"count": 322264,
	"self": 1630.1399948387407,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 3.2574659883975983,
	"count": 10,
	"self": 3.2574659883975983
	}
	}
	},
	"_update_policy": {
	"total": 8974.130235465243,
	"count": 228,
	"self": 946.202926828526,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 8027.9273086367175,
	"count": 6840,
	"self": 8027.9273086367175
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 2.514570951461792e-06,
	"count": 1,
	"self": 2.514570951461792e-06
	},
	"TrainerController._save_models": {
	"total": 0.30227894289419055,
	"count": 1,
	"self": 0.005925939884036779,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.29635300301015377,
	"count": 1,
	"self": 0.29635300301015377
	}
	}
	}
	}
	}
	}
	}