No defaults - 20M

bcef2b0 over 2 years ago

20.3 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 0.9073097109794617,
	"min": 0.8696509003639221,
	"max": 3.295811414718628,
	"count": 2200
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 35856.87890625,
	"min": 21059.609375,
	"max": 1019961.375,
	"count": 2200
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 24.602040816326532,
	"min": 17.152416356877325,
	"max": 392.75,
	"count": 2200
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19288.0,
	"min": 17756.0,
	"max": 21412.0,
	"count": 2200
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1533.4588753226842,
	"min": 1200.328406833094,
	"max": 1579.4606048764724,
	"count": 2200
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 601115.8791264922,
	"min": 2409.9434577136913,
	"max": 781900.3774073822,
	"count": 2200
	},
	"SoccerTwos.Step.mean": {
	"value": 21999994.0,
	"min": 9958.0,
	"max": 21999994.0,
	"count": 2200
	},
	"SoccerTwos.Step.sum": {
	"value": 21999994.0,
	"min": 9958.0,
	"max": 21999994.0,
	"count": 2200
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.0006931066163815558,
	"min": -0.11423704773187637,
	"max": 0.23437894880771637,
	"count": 2200
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 0.27100467681884766,
	"min": -49.42055130004883,
	"max": 68.4496078491211,
	"count": 2200
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.0009028149652294815,
	"min": -0.11388174444437027,
	"max": 0.21143116056919098,
	"count": 2200
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 0.3530006408691406,
	"min": -50.347877502441406,
	"max": 67.15494537353516,
	"count": 2200
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 2200
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 2200
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.052163681105884444,
	"min": -0.3903066684802373,
	"max": 0.5489372896440958,
	"count": 2200
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 20.395999312400818,
	"min": -103.09040009975433,
	"max": 141.59099984169006,
	"count": 2200
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.052163681105884444,
	"min": -0.3903066684802373,
	"max": 0.5489372896440958,
	"count": 2200
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 20.395999312400818,
	"min": -103.09040009975433,
	"max": 141.59099984169006,
	"count": 2200
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 2200
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 2200
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.016792847060908875,
	"min": 0.01056482947509115,
	"max": 0.024503496209702765,
	"count": 1065
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.016792847060908875,
	"min": 0.01056482947509115,
	"max": 0.024503496209702765,
	"count": 1065
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.11256088341275851,
	"min": 0.005557317488516371,
	"max": 0.12470681170622508,
	"count": 1065
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.11256088341275851,
	"min": 0.005557317488516371,
	"max": 0.12470681170622508,
	"count": 1065
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.11302393625179927,
	"min": 0.005690486178112527,
	"max": 0.12509485532840092,
	"count": 1065
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.11302393625179927,
	"min": 0.005690486178112527,
	"max": 0.12509485532840092,
	"count": 1065
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 1.933272083181791e-07,
	"min": 1.933272083181791e-07,
	"max": 0.0002997203455477637,
	"count": 1065
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 1.933272083181791e-07,
	"min": 1.933272083181791e-07,
	"max": 0.0002997203455477637,
	"count": 1065
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.25,
	"min": 0.25,
	"max": 0.25,
	"count": 1065
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.25,
	"min": 0.25,
	"max": 0.25,
	"count": 1065
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 1.6434468181818088e-05,
	"min": 1.6434468181818088e-05,
	"max": 0.009990687503636362,
	"count": 1065
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 1.6434468181818088e-05,
	"min": 1.6434468181818088e-05,
	"max": 0.009990687503636362,
	"count": 1065
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1693348019",
	"python_version": "3.9.17 (main, Jul 5 2023, 20:41:20) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/mgmeskill/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=Downstrike-20M --no-graphics --num-envs=32",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1693373657"
	},
	"total": 25638.07527213078,
	"count": 1,
	"self": 0.836282589007169,
	"children": {
	"run_training.setup": {
	"total": 0.17577498173341155,
	"count": 1,
	"self": 0.17577498173341155
	},
	"TrainerController.start_learning": {
	"total": 25637.06321456004,
	"count": 1,
	"self": 8.342477745376527,
	"children": {
	"TrainerController._reset_env": {
	"total": 271.783062253613,
	"count": 1088,
	"self": 271.783062253613
	},
	"TrainerController.advance": {
	"total": 25356.61511585163,
	"count": 108628,
	"self": 3.1089843809604645,
	"children": {
	"env_step": {
	"total": 15745.96533632977,
	"count": 108628,
	"self": 5440.94653446367,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 10292.108620898332,
	"count": 3116235,
	"self": 255.61927175475284,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 10036.48934914358,
	"count": 5628498,
	"self": 10036.48934914358
	}
	}
	},
	"workers": {
	"total": 12.910180967766792,
	"count": 108628,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 818588.5154348165,
	"count": 3112826,
	"is_parallel": true,
	"self": 780482.6229405664,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.07693493086844683,
	"count": 64,
	"is_parallel": true,
	"self": 0.015927689615637064,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.06100724125280976,
	"count": 256,
	"is_parallel": true,
	"self": 0.06100724125280976
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.719481447711587,
	"count": 32,
	"is_parallel": true,
	"self": 0.020501975435763597,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.013642964884638786,
	"count": 32,
	"is_parallel": true,
	"self": 0.013642964884638786
	},
	"communicator.exchange": {
	"total": 0.627972015645355,
	"count": 32,
	"is_parallel": true,
	"self": 0.627972015645355
	},
	"steps_from_proto": {
	"total": 0.05736449174582958,
	"count": 64,
	"is_parallel": true,
	"self": 0.01029907027259469,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.04706542147323489,
	"count": 256,
	"is_parallel": true,
	"self": 0.04706542147323489
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 38019.55847894726,
	"count": 3112794,
	"is_parallel": true,
	"self": 2457.6824236582033,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 1512.2425317005254,
	"count": 3112794,
	"is_parallel": true,
	"self": 1512.2425317005254
	},
	"communicator.exchange": {
	"total": 27368.108181226067,
	"count": 3112794,
	"is_parallel": true,
	"self": 27368.108181226067
	},
	"steps_from_proto": {
	"total": 6681.525342362467,
	"count": 6225588,
	"is_parallel": true,
	"self": 1143.5824937582947,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 5537.9428486041725,
	"count": 24902352,
	"is_parallel": true,
	"self": 5537.9428486041725
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 86.33401530282572,
	"count": 69568,
	"is_parallel": true,
	"self": 14.690878832247108,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 71.64313647057861,
	"count": 278272,
	"is_parallel": true,
	"self": 71.64313647057861
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 9607.5407951409,
	"count": 108628,
	"self": 132.7211998142302,
	"children": {
	"process_trajectory": {
	"total": 4697.321105179377,
	"count": 108628,
	"self": 4693.751423222944,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 3.5696819564327598,
	"count": 11,
	"self": 3.5696819564327598
	}
	}
	},
	"_update_policy": {
	"total": 4777.498490147293,
	"count": 1065,
	"self": 2678.744994345121,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 2098.7534958021715,
	"count": 31950,
	"self": 2098.7534958021715
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 6.621703505516052e-07,
	"count": 1,
	"self": 6.621703505516052e-07
	},
	"TrainerController._save_models": {
	"total": 0.3225580472499132,
	"count": 1,
	"self": 0.0020071682520210743,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.32055087899789214,
	"count": 1,
	"self": 0.32055087899789214
	}
	}
	}
	}
	}
	}
	}